larson-gemma-2b-chinese-v0.1 / trainer_log.jsonl
ccrains's picture
update files
63d2d58
raw
history blame contribute delete
No virus
99.9 kB
{"current_steps": 10, "total_steps": 4000, "loss": 0.6938, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.998749374687344e-05, "epoch": 0.01, "percentage": 0.25, "elapsed_time": "0:00:46", "remaining_time": "5:06:46"}
{"current_steps": 20, "total_steps": 4000, "loss": 0.4097, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9874937468734366e-05, "epoch": 0.03, "percentage": 0.5, "elapsed_time": "0:01:34", "remaining_time": "5:12:22"}
{"current_steps": 30, "total_steps": 4000, "loss": 0.3894, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9749874937468736e-05, "epoch": 0.04, "percentage": 0.75, "elapsed_time": "0:02:23", "remaining_time": "5:15:35"}
{"current_steps": 40, "total_steps": 4000, "loss": 0.4047, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9624812406203106e-05, "epoch": 0.05, "percentage": 1.0, "elapsed_time": "0:03:11", "remaining_time": "5:15:42"}
{"current_steps": 50, "total_steps": 4000, "loss": 0.4542, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9499749874937476e-05, "epoch": 0.06, "percentage": 1.25, "elapsed_time": "0:04:00", "remaining_time": "5:16:43"}
{"current_steps": 60, "total_steps": 4000, "loss": 0.4522, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.937468734367184e-05, "epoch": 0.07, "percentage": 1.5, "elapsed_time": "0:04:48", "remaining_time": "5:16:15"}
{"current_steps": 70, "total_steps": 4000, "loss": 0.4822, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.92496248124062e-05, "epoch": 0.09, "percentage": 1.75, "elapsed_time": "0:05:37", "remaining_time": "5:15:37"}
{"current_steps": 80, "total_steps": 4000, "loss": 0.5055, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.912456228114057e-05, "epoch": 0.1, "percentage": 2.0, "elapsed_time": "0:06:25", "remaining_time": "5:14:56"}
{"current_steps": 90, "total_steps": 4000, "loss": 0.473, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.8999499749874936e-05, "epoch": 0.11, "percentage": 2.25, "elapsed_time": "0:07:13", "remaining_time": "5:14:14"}
{"current_steps": 100, "total_steps": 4000, "loss": 0.5087, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.887443721860931e-05, "epoch": 0.12, "percentage": 2.5, "elapsed_time": "0:08:01", "remaining_time": "5:13:10"}
{"current_steps": 110, "total_steps": 4000, "loss": 0.5234, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.8749374687343676e-05, "epoch": 0.14, "percentage": 2.75, "elapsed_time": "0:08:50", "remaining_time": "5:12:34"}
{"current_steps": 120, "total_steps": 4000, "loss": 0.5141, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.862431215607804e-05, "epoch": 0.15, "percentage": 3.0, "elapsed_time": "0:09:39", "remaining_time": "5:12:05"}
{"current_steps": 130, "total_steps": 4000, "loss": 0.5434, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.849924962481241e-05, "epoch": 0.16, "percentage": 3.25, "elapsed_time": "0:10:27", "remaining_time": "5:11:33"}
{"current_steps": 140, "total_steps": 4000, "loss": 0.5293, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.837418709354677e-05, "epoch": 0.17, "percentage": 3.5, "elapsed_time": "0:11:16", "remaining_time": "5:10:50"}
{"current_steps": 150, "total_steps": 4000, "loss": 0.511, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.824912456228114e-05, "epoch": 0.19, "percentage": 3.75, "elapsed_time": "0:12:06", "remaining_time": "5:10:53"}
{"current_steps": 160, "total_steps": 4000, "loss": 0.5401, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.812406203101551e-05, "epoch": 0.2, "percentage": 4.0, "elapsed_time": "0:12:55", "remaining_time": "5:10:05"}
{"current_steps": 170, "total_steps": 4000, "loss": 0.6019, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7998999499749876e-05, "epoch": 0.21, "percentage": 4.25, "elapsed_time": "0:13:43", "remaining_time": "5:09:06"}
{"current_steps": 180, "total_steps": 4000, "loss": 0.5633, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7873936968484246e-05, "epoch": 0.23, "percentage": 4.5, "elapsed_time": "0:14:31", "remaining_time": "5:08:18"}
{"current_steps": 190, "total_steps": 4000, "loss": 0.583, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.774887443721861e-05, "epoch": 0.24, "percentage": 4.75, "elapsed_time": "0:15:20", "remaining_time": "5:07:40"}
{"current_steps": 200, "total_steps": 4000, "loss": 0.6201, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.762381190595298e-05, "epoch": 0.25, "percentage": 5.0, "elapsed_time": "0:16:09", "remaining_time": "5:07:02"}
{"current_steps": 210, "total_steps": 4000, "loss": 0.6125, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.749874937468735e-05, "epoch": 0.26, "percentage": 5.25, "elapsed_time": "0:16:57", "remaining_time": "5:06:07"}
{"current_steps": 220, "total_steps": 4000, "loss": 0.5686, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.737368684342171e-05, "epoch": 0.28, "percentage": 5.5, "elapsed_time": "0:17:46", "remaining_time": "5:05:25"}
{"current_steps": 230, "total_steps": 4000, "loss": 0.6173, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.724862431215608e-05, "epoch": 0.29, "percentage": 5.75, "elapsed_time": "0:18:35", "remaining_time": "5:04:46"}
{"current_steps": 240, "total_steps": 4000, "loss": 0.6373, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7123561780890446e-05, "epoch": 0.3, "percentage": 6.0, "elapsed_time": "0:19:24", "remaining_time": "5:03:58"}
{"current_steps": 250, "total_steps": 4000, "loss": 0.5606, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.6998499249624816e-05, "epoch": 0.31, "percentage": 6.25, "elapsed_time": "0:20:14", "remaining_time": "5:03:31"}
{"current_steps": 260, "total_steps": 4000, "loss": 0.5903, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.687343671835918e-05, "epoch": 0.33, "percentage": 6.5, "elapsed_time": "0:21:02", "remaining_time": "5:02:36"}
{"current_steps": 270, "total_steps": 4000, "loss": 0.6201, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.674837418709355e-05, "epoch": 0.34, "percentage": 6.75, "elapsed_time": "0:21:50", "remaining_time": "5:01:42"}
{"current_steps": 280, "total_steps": 4000, "loss": 0.6295, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.662331165582792e-05, "epoch": 0.35, "percentage": 7.0, "elapsed_time": "0:22:38", "remaining_time": "5:00:51"}
{"current_steps": 290, "total_steps": 4000, "loss": 0.6242, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.649824912456228e-05, "epoch": 0.36, "percentage": 7.25, "elapsed_time": "0:23:27", "remaining_time": "5:00:06"}
{"current_steps": 300, "total_steps": 4000, "loss": 0.6343, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.637318659329665e-05, "epoch": 0.38, "percentage": 7.5, "elapsed_time": "0:24:16", "remaining_time": "4:59:19"}
{"current_steps": 310, "total_steps": 4000, "loss": 0.6293, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.6248124062031015e-05, "epoch": 0.39, "percentage": 7.75, "elapsed_time": "0:25:04", "remaining_time": "4:58:31"}
{"current_steps": 320, "total_steps": 4000, "loss": 0.6699, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.6123061530765386e-05, "epoch": 0.4, "percentage": 8.0, "elapsed_time": "0:25:52", "remaining_time": "4:57:38"}
{"current_steps": 330, "total_steps": 4000, "loss": 0.6448, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.5997998999499756e-05, "epoch": 0.41, "percentage": 8.25, "elapsed_time": "0:26:42", "remaining_time": "4:56:57"}
{"current_steps": 340, "total_steps": 4000, "loss": 0.6776, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.587293646823412e-05, "epoch": 0.42, "percentage": 8.5, "elapsed_time": "0:27:30", "remaining_time": "4:56:08"}
{"current_steps": 350, "total_steps": 4000, "loss": 0.6558, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.574787393696849e-05, "epoch": 0.44, "percentage": 8.75, "elapsed_time": "0:28:18", "remaining_time": "4:55:14"}
{"current_steps": 360, "total_steps": 4000, "loss": 0.705, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.562281140570285e-05, "epoch": 0.45, "percentage": 9.0, "elapsed_time": "0:29:06", "remaining_time": "4:54:21"}
{"current_steps": 370, "total_steps": 4000, "loss": 0.6564, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.5497748874437215e-05, "epoch": 0.46, "percentage": 9.25, "elapsed_time": "0:29:55", "remaining_time": "4:53:31"}
{"current_steps": 380, "total_steps": 4000, "loss": 0.6734, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.5372686343171585e-05, "epoch": 0.47, "percentage": 9.5, "elapsed_time": "0:30:43", "remaining_time": "4:52:39"}
{"current_steps": 390, "total_steps": 4000, "loss": 0.7523, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.5247623811905955e-05, "epoch": 0.49, "percentage": 9.75, "elapsed_time": "0:31:31", "remaining_time": "4:51:50"}
{"current_steps": 400, "total_steps": 4000, "loss": 0.7124, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.5122561280640325e-05, "epoch": 0.5, "percentage": 10.0, "elapsed_time": "0:32:19", "remaining_time": "4:50:55"}
{"current_steps": 410, "total_steps": 4000, "loss": 0.702, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.499749874937469e-05, "epoch": 0.51, "percentage": 10.25, "elapsed_time": "0:33:08", "remaining_time": "4:50:07"}
{"current_steps": 420, "total_steps": 4000, "loss": 0.6917, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.487243621810905e-05, "epoch": 0.53, "percentage": 10.5, "elapsed_time": "0:33:56", "remaining_time": "4:49:20"}
{"current_steps": 430, "total_steps": 4000, "loss": 0.675, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.474737368684342e-05, "epoch": 0.54, "percentage": 10.75, "elapsed_time": "0:34:44", "remaining_time": "4:48:29"}
{"current_steps": 440, "total_steps": 4000, "loss": 0.6916, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.462231115557779e-05, "epoch": 0.55, "percentage": 11.0, "elapsed_time": "0:35:33", "remaining_time": "4:47:43"}
{"current_steps": 450, "total_steps": 4000, "loss": 0.6664, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.449724862431216e-05, "epoch": 0.56, "percentage": 11.25, "elapsed_time": "0:36:21", "remaining_time": "4:46:52"}
{"current_steps": 460, "total_steps": 4000, "loss": 0.7281, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.4372186093046525e-05, "epoch": 0.57, "percentage": 11.5, "elapsed_time": "0:37:10", "remaining_time": "4:46:03"}
{"current_steps": 470, "total_steps": 4000, "loss": 0.6826, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.424712356178089e-05, "epoch": 0.59, "percentage": 11.75, "elapsed_time": "0:37:59", "remaining_time": "4:45:17"}
{"current_steps": 480, "total_steps": 4000, "loss": 0.6919, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.412206103051526e-05, "epoch": 0.6, "percentage": 12.0, "elapsed_time": "0:38:50", "remaining_time": "4:44:49"}
{"current_steps": 490, "total_steps": 4000, "loss": 0.689, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.399699849924963e-05, "epoch": 0.61, "percentage": 12.25, "elapsed_time": "0:39:41", "remaining_time": "4:44:20"}
{"current_steps": 500, "total_steps": 4000, "loss": 0.7207, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.3871935967984e-05, "epoch": 0.62, "percentage": 12.5, "elapsed_time": "0:40:32", "remaining_time": "4:43:49"}
{"current_steps": 510, "total_steps": 4000, "loss": 0.7047, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.374687343671836e-05, "epoch": 0.64, "percentage": 12.75, "elapsed_time": "0:41:23", "remaining_time": "4:43:15"}
{"current_steps": 520, "total_steps": 4000, "loss": 0.6799, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.3621810905452725e-05, "epoch": 0.65, "percentage": 13.0, "elapsed_time": "0:42:14", "remaining_time": "4:42:43"}
{"current_steps": 530, "total_steps": 4000, "loss": 0.7035, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.3496748374187095e-05, "epoch": 0.66, "percentage": 13.25, "elapsed_time": "0:43:05", "remaining_time": "4:42:08"}
{"current_steps": 540, "total_steps": 4000, "loss": 0.7166, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.337168584292146e-05, "epoch": 0.68, "percentage": 13.5, "elapsed_time": "0:43:57", "remaining_time": "4:41:38"}
{"current_steps": 550, "total_steps": 4000, "loss": 0.7128, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.324662331165583e-05, "epoch": 0.69, "percentage": 13.75, "elapsed_time": "0:44:48", "remaining_time": "4:41:05"}
{"current_steps": 560, "total_steps": 4000, "loss": 0.7314, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.31215607803902e-05, "epoch": 0.7, "percentage": 14.0, "elapsed_time": "0:45:40", "remaining_time": "4:40:35"}
{"current_steps": 570, "total_steps": 4000, "loss": 0.7351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.299649824912456e-05, "epoch": 0.71, "percentage": 14.25, "elapsed_time": "0:46:32", "remaining_time": "4:40:05"}
{"current_steps": 580, "total_steps": 4000, "loss": 0.7117, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.287143571785893e-05, "epoch": 0.72, "percentage": 14.5, "elapsed_time": "0:47:24", "remaining_time": "4:39:31"}
{"current_steps": 590, "total_steps": 4000, "loss": 0.7075, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.2746373186593295e-05, "epoch": 0.74, "percentage": 14.75, "elapsed_time": "0:48:15", "remaining_time": "4:38:56"}
{"current_steps": 600, "total_steps": 4000, "loss": 0.7332, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.2621310655327665e-05, "epoch": 0.75, "percentage": 15.0, "elapsed_time": "0:49:08", "remaining_time": "4:38:29"}
{"current_steps": 610, "total_steps": 4000, "loss": 0.6525, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.2496248124062035e-05, "epoch": 0.76, "percentage": 15.25, "elapsed_time": "0:50:00", "remaining_time": "4:37:54"}
{"current_steps": 620, "total_steps": 4000, "loss": 0.734, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.2371185592796405e-05, "epoch": 0.78, "percentage": 15.5, "elapsed_time": "0:50:52", "remaining_time": "4:37:19"}
{"current_steps": 630, "total_steps": 4000, "loss": 0.665, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.224612306153077e-05, "epoch": 0.79, "percentage": 15.75, "elapsed_time": "0:51:43", "remaining_time": "4:36:43"}
{"current_steps": 640, "total_steps": 4000, "loss": 0.7485, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.212106053026513e-05, "epoch": 0.8, "percentage": 16.0, "elapsed_time": "0:52:36", "remaining_time": "4:36:10"}
{"current_steps": 650, "total_steps": 4000, "loss": 0.7342, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.19959979989995e-05, "epoch": 0.81, "percentage": 16.25, "elapsed_time": "0:53:28", "remaining_time": "4:35:34"}
{"current_steps": 660, "total_steps": 4000, "loss": 0.7082, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.1870935467733865e-05, "epoch": 0.82, "percentage": 16.5, "elapsed_time": "0:54:20", "remaining_time": "4:34:57"}
{"current_steps": 670, "total_steps": 4000, "loss": 0.7262, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.174587293646824e-05, "epoch": 0.84, "percentage": 16.75, "elapsed_time": "0:55:11", "remaining_time": "4:34:19"}
{"current_steps": 680, "total_steps": 4000, "loss": 0.6719, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.1620810405202605e-05, "epoch": 0.85, "percentage": 17.0, "elapsed_time": "0:56:03", "remaining_time": "4:33:39"}
{"current_steps": 690, "total_steps": 4000, "loss": 0.7369, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.149574787393697e-05, "epoch": 0.86, "percentage": 17.25, "elapsed_time": "0:56:55", "remaining_time": "4:33:02"}
{"current_steps": 700, "total_steps": 4000, "loss": 0.7526, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.137068534267134e-05, "epoch": 0.88, "percentage": 17.5, "elapsed_time": "0:57:46", "remaining_time": "4:32:22"}
{"current_steps": 710, "total_steps": 4000, "loss": 0.6593, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.12456228114057e-05, "epoch": 0.89, "percentage": 17.75, "elapsed_time": "0:58:39", "remaining_time": "4:31:48"}
{"current_steps": 720, "total_steps": 4000, "loss": 0.7003, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.112056028014007e-05, "epoch": 0.9, "percentage": 18.0, "elapsed_time": "0:59:30", "remaining_time": "4:31:05"}
{"current_steps": 730, "total_steps": 4000, "loss": 0.7414, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.099549774887444e-05, "epoch": 0.91, "percentage": 18.25, "elapsed_time": "1:00:21", "remaining_time": "4:30:22"}
{"current_steps": 740, "total_steps": 4000, "loss": 0.7034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.0870435217608805e-05, "epoch": 0.93, "percentage": 18.5, "elapsed_time": "1:01:12", "remaining_time": "4:29:39"}
{"current_steps": 750, "total_steps": 4000, "loss": 0.6962, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.0745372686343175e-05, "epoch": 0.94, "percentage": 18.75, "elapsed_time": "1:02:04", "remaining_time": "4:28:57"}
{"current_steps": 760, "total_steps": 4000, "loss": 0.7137, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.062031015507754e-05, "epoch": 0.95, "percentage": 19.0, "elapsed_time": "1:02:55", "remaining_time": "4:28:14"}
{"current_steps": 770, "total_steps": 4000, "loss": 0.7035, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.049524762381191e-05, "epoch": 0.96, "percentage": 19.25, "elapsed_time": "1:03:47", "remaining_time": "4:27:33"}
{"current_steps": 780, "total_steps": 4000, "loss": 0.7133, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.037018509254628e-05, "epoch": 0.97, "percentage": 19.5, "elapsed_time": "1:04:38", "remaining_time": "4:26:51"}
{"current_steps": 790, "total_steps": 4000, "loss": 0.7161, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.024512256128064e-05, "epoch": 0.99, "percentage": 19.75, "elapsed_time": "1:05:30", "remaining_time": "4:26:12"}
{"current_steps": 800, "total_steps": 4000, "loss": 0.722, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.012006003001501e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "1:06:22", "remaining_time": "4:25:29"}
{"current_steps": 810, "total_steps": 4000, "loss": 0.3054, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.9994997498749375e-05, "epoch": 1.01, "percentage": 20.25, "elapsed_time": "1:07:13", "remaining_time": "4:24:45"}
{"current_steps": 820, "total_steps": 4000, "loss": 0.3016, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.9869934967483745e-05, "epoch": 1.02, "percentage": 20.5, "elapsed_time": "1:08:04", "remaining_time": "4:24:00"}
{"current_steps": 830, "total_steps": 4000, "loss": 0.3077, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.974487243621811e-05, "epoch": 1.04, "percentage": 20.75, "elapsed_time": "1:08:55", "remaining_time": "4:23:15"}
{"current_steps": 840, "total_steps": 4000, "loss": 0.2966, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.961980990495248e-05, "epoch": 1.05, "percentage": 21.0, "elapsed_time": "1:09:47", "remaining_time": "4:22:31"}
{"current_steps": 850, "total_steps": 4000, "loss": 0.3203, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.949474737368685e-05, "epoch": 1.06, "percentage": 21.25, "elapsed_time": "1:10:38", "remaining_time": "4:21:48"}
{"current_steps": 860, "total_steps": 4000, "loss": 0.3019, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.936968484242121e-05, "epoch": 1.07, "percentage": 21.5, "elapsed_time": "1:11:30", "remaining_time": "4:21:04"}
{"current_steps": 870, "total_steps": 4000, "loss": 0.325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.924462231115558e-05, "epoch": 1.09, "percentage": 21.75, "elapsed_time": "1:12:21", "remaining_time": "4:20:20"}
{"current_steps": 880, "total_steps": 4000, "loss": 0.3371, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.9119559779889945e-05, "epoch": 1.1, "percentage": 22.0, "elapsed_time": "1:13:13", "remaining_time": "4:19:36"}
{"current_steps": 890, "total_steps": 4000, "loss": 0.3306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.8994497248624315e-05, "epoch": 1.11, "percentage": 22.25, "elapsed_time": "1:14:06", "remaining_time": "4:18:56"}
{"current_steps": 900, "total_steps": 4000, "loss": 0.2961, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.8869434717358685e-05, "epoch": 1.12, "percentage": 22.5, "elapsed_time": "1:14:58", "remaining_time": "4:18:16"}
{"current_steps": 910, "total_steps": 4000, "loss": 0.3159, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.874437218609305e-05, "epoch": 1.14, "percentage": 22.75, "elapsed_time": "1:15:50", "remaining_time": "4:17:30"}
{"current_steps": 920, "total_steps": 4000, "loss": 0.3321, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.861930965482742e-05, "epoch": 1.15, "percentage": 23.0, "elapsed_time": "1:16:42", "remaining_time": "4:16:49"}
{"current_steps": 930, "total_steps": 4000, "loss": 0.316, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.849424712356178e-05, "epoch": 1.16, "percentage": 23.25, "elapsed_time": "1:17:34", "remaining_time": "4:16:03"}
{"current_steps": 940, "total_steps": 4000, "loss": 0.3539, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.8369184592296145e-05, "epoch": 1.18, "percentage": 23.5, "elapsed_time": "1:18:25", "remaining_time": "4:15:18"}
{"current_steps": 950, "total_steps": 4000, "loss": 0.3293, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.824412206103052e-05, "epoch": 1.19, "percentage": 23.75, "elapsed_time": "1:19:17", "remaining_time": "4:14:34"}
{"current_steps": 960, "total_steps": 4000, "loss": 0.3169, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.8119059529764885e-05, "epoch": 1.2, "percentage": 24.0, "elapsed_time": "1:20:10", "remaining_time": "4:13:52"}
{"current_steps": 970, "total_steps": 4000, "loss": 0.3321, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.7993996998499255e-05, "epoch": 1.21, "percentage": 24.25, "elapsed_time": "1:21:02", "remaining_time": "4:13:09"}
{"current_steps": 980, "total_steps": 4000, "loss": 0.3418, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.786893446723362e-05, "epoch": 1.23, "percentage": 24.5, "elapsed_time": "1:21:55", "remaining_time": "4:12:26"}
{"current_steps": 990, "total_steps": 4000, "loss": 0.3277, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.774387193596798e-05, "epoch": 1.24, "percentage": 24.75, "elapsed_time": "1:22:47", "remaining_time": "4:11:42"}
{"current_steps": 1000, "total_steps": 4000, "loss": 0.3371, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.761880940470235e-05, "epoch": 1.25, "percentage": 25.0, "elapsed_time": "1:23:39", "remaining_time": "4:10:58"}
{"current_steps": 1010, "total_steps": 4000, "loss": 0.347, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.749374687343672e-05, "epoch": 1.26, "percentage": 25.25, "elapsed_time": "1:24:31", "remaining_time": "4:10:14"}
{"current_steps": 1020, "total_steps": 4000, "loss": 0.3358, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.736868434217109e-05, "epoch": 1.27, "percentage": 25.5, "elapsed_time": "1:25:23", "remaining_time": "4:09:28"}
{"current_steps": 1030, "total_steps": 4000, "loss": 0.3461, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.7243621810905455e-05, "epoch": 1.29, "percentage": 25.75, "elapsed_time": "1:26:16", "remaining_time": "4:08:46"}
{"current_steps": 1040, "total_steps": 4000, "loss": 0.3362, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.711855927963982e-05, "epoch": 1.3, "percentage": 26.0, "elapsed_time": "1:27:08", "remaining_time": "4:08:00"}
{"current_steps": 1050, "total_steps": 4000, "loss": 0.3418, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.699349674837419e-05, "epoch": 1.31, "percentage": 26.25, "elapsed_time": "1:28:00", "remaining_time": "4:07:15"}
{"current_steps": 1060, "total_steps": 4000, "loss": 0.3372, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.686843421710856e-05, "epoch": 1.32, "percentage": 26.5, "elapsed_time": "1:28:53", "remaining_time": "4:06:33"}
{"current_steps": 1070, "total_steps": 4000, "loss": 0.3254, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.674337168584293e-05, "epoch": 1.34, "percentage": 26.75, "elapsed_time": "1:29:45", "remaining_time": "4:05:46"}
{"current_steps": 1080, "total_steps": 4000, "loss": 0.3471, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.661830915457729e-05, "epoch": 1.35, "percentage": 27.0, "elapsed_time": "1:30:38", "remaining_time": "4:05:03"}
{"current_steps": 1090, "total_steps": 4000, "loss": 0.3432, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6493246623311655e-05, "epoch": 1.36, "percentage": 27.25, "elapsed_time": "1:31:30", "remaining_time": "4:04:17"}
{"current_steps": 1100, "total_steps": 4000, "loss": 0.3533, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6368184092046025e-05, "epoch": 1.38, "percentage": 27.5, "elapsed_time": "1:32:22", "remaining_time": "4:03:31"}
{"current_steps": 1110, "total_steps": 4000, "loss": 0.3551, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.624312156078039e-05, "epoch": 1.39, "percentage": 27.75, "elapsed_time": "1:33:13", "remaining_time": "4:02:44"}
{"current_steps": 1120, "total_steps": 4000, "loss": 0.3321, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.611805902951476e-05, "epoch": 1.4, "percentage": 28.0, "elapsed_time": "1:34:04", "remaining_time": "4:01:54"}
{"current_steps": 1130, "total_steps": 4000, "loss": 0.3339, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.599299649824913e-05, "epoch": 1.41, "percentage": 28.25, "elapsed_time": "1:34:56", "remaining_time": "4:01:06"}
{"current_steps": 1140, "total_steps": 4000, "loss": 0.3272, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.586793396698349e-05, "epoch": 1.43, "percentage": 28.5, "elapsed_time": "1:35:46", "remaining_time": "4:00:17"}
{"current_steps": 1150, "total_steps": 4000, "loss": 0.3527, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.574287143571786e-05, "epoch": 1.44, "percentage": 28.75, "elapsed_time": "1:36:38", "remaining_time": "3:59:30"}
{"current_steps": 1160, "total_steps": 4000, "loss": 0.3513, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.5617808904452225e-05, "epoch": 1.45, "percentage": 29.0, "elapsed_time": "1:37:29", "remaining_time": "3:58:41"}
{"current_steps": 1170, "total_steps": 4000, "loss": 0.339, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.5492746373186595e-05, "epoch": 1.46, "percentage": 29.25, "elapsed_time": "1:38:21", "remaining_time": "3:57:53"}
{"current_steps": 1180, "total_steps": 4000, "loss": 0.3511, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.5367683841920965e-05, "epoch": 1.48, "percentage": 29.5, "elapsed_time": "1:39:12", "remaining_time": "3:57:04"}
{"current_steps": 1190, "total_steps": 4000, "loss": 0.3349, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.524262131065533e-05, "epoch": 1.49, "percentage": 29.75, "elapsed_time": "1:40:04", "remaining_time": "3:56:17"}
{"current_steps": 1200, "total_steps": 4000, "loss": 0.3619, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.51175587793897e-05, "epoch": 1.5, "percentage": 30.0, "elapsed_time": "1:40:54", "remaining_time": "3:55:27"}
{"current_steps": 1210, "total_steps": 4000, "loss": 0.3487, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.499249624812406e-05, "epoch": 1.51, "percentage": 30.25, "elapsed_time": "1:41:45", "remaining_time": "3:54:39"}
{"current_steps": 1220, "total_steps": 4000, "loss": 0.3293, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.486743371685843e-05, "epoch": 1.52, "percentage": 30.5, "elapsed_time": "1:42:37", "remaining_time": "3:53:50"}
{"current_steps": 1230, "total_steps": 4000, "loss": 0.3424, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4742371185592795e-05, "epoch": 1.54, "percentage": 30.75, "elapsed_time": "1:43:28", "remaining_time": "3:53:01"}
{"current_steps": 1240, "total_steps": 4000, "loss": 0.3453, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4617308654327165e-05, "epoch": 1.55, "percentage": 31.0, "elapsed_time": "1:44:20", "remaining_time": "3:52:13"}
{"current_steps": 1250, "total_steps": 4000, "loss": 0.3576, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4492246123061535e-05, "epoch": 1.56, "percentage": 31.25, "elapsed_time": "1:45:11", "remaining_time": "3:51:25"}
{"current_steps": 1260, "total_steps": 4000, "loss": 0.3597, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.43671835917959e-05, "epoch": 1.57, "percentage": 31.5, "elapsed_time": "1:46:02", "remaining_time": "3:50:36"}
{"current_steps": 1270, "total_steps": 4000, "loss": 0.3274, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.424212106053027e-05, "epoch": 1.59, "percentage": 31.75, "elapsed_time": "1:46:54", "remaining_time": "3:49:49"}
{"current_steps": 1280, "total_steps": 4000, "loss": 0.345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.411705852926463e-05, "epoch": 1.6, "percentage": 32.0, "elapsed_time": "1:47:46", "remaining_time": "3:49:00"}
{"current_steps": 1290, "total_steps": 4000, "loss": 0.3432, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.3991995997999e-05, "epoch": 1.61, "percentage": 32.25, "elapsed_time": "1:48:37", "remaining_time": "3:48:12"}
{"current_steps": 1300, "total_steps": 4000, "loss": 0.3643, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.386693346673337e-05, "epoch": 1.62, "percentage": 32.5, "elapsed_time": "1:49:29", "remaining_time": "3:47:23"}
{"current_steps": 1310, "total_steps": 4000, "loss": 0.3488, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.3741870935467735e-05, "epoch": 1.64, "percentage": 32.75, "elapsed_time": "1:50:20", "remaining_time": "3:46:34"}
{"current_steps": 1320, "total_steps": 4000, "loss": 0.3505, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.3616808404202105e-05, "epoch": 1.65, "percentage": 33.0, "elapsed_time": "1:51:11", "remaining_time": "3:45:46"}
{"current_steps": 1330, "total_steps": 4000, "loss": 0.3577, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.349174587293647e-05, "epoch": 1.66, "percentage": 33.25, "elapsed_time": "1:52:03", "remaining_time": "3:44:57"}
{"current_steps": 1340, "total_steps": 4000, "loss": 0.3471, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.336668334167083e-05, "epoch": 1.68, "percentage": 33.5, "elapsed_time": "1:52:54", "remaining_time": "3:44:08"}
{"current_steps": 1350, "total_steps": 4000, "loss": 0.3489, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.324162081040521e-05, "epoch": 1.69, "percentage": 33.75, "elapsed_time": "1:53:47", "remaining_time": "3:43:22"}
{"current_steps": 1360, "total_steps": 4000, "loss": 0.3362, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.311655827913957e-05, "epoch": 1.7, "percentage": 34.0, "elapsed_time": "1:54:39", "remaining_time": "3:42:33"}
{"current_steps": 1370, "total_steps": 4000, "loss": 0.3496, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.299149574787394e-05, "epoch": 1.71, "percentage": 34.25, "elapsed_time": "1:55:30", "remaining_time": "3:41:44"}
{"current_steps": 1380, "total_steps": 4000, "loss": 0.3565, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.2866433216608305e-05, "epoch": 1.73, "percentage": 34.5, "elapsed_time": "1:56:21", "remaining_time": "3:40:55"}
{"current_steps": 1390, "total_steps": 4000, "loss": 0.3419, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.274137068534267e-05, "epoch": 1.74, "percentage": 34.75, "elapsed_time": "1:57:13", "remaining_time": "3:40:05"}
{"current_steps": 1400, "total_steps": 4000, "loss": 0.3368, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.261630815407704e-05, "epoch": 1.75, "percentage": 35.0, "elapsed_time": "1:58:04", "remaining_time": "3:39:16"}
{"current_steps": 1410, "total_steps": 4000, "loss": 0.34, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.249124562281141e-05, "epoch": 1.76, "percentage": 35.25, "elapsed_time": "1:58:55", "remaining_time": "3:38:27"}
{"current_steps": 1420, "total_steps": 4000, "loss": 0.346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.236618309154578e-05, "epoch": 1.77, "percentage": 35.5, "elapsed_time": "1:59:47", "remaining_time": "3:37:38"}
{"current_steps": 1430, "total_steps": 4000, "loss": 0.3422, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.224112056028014e-05, "epoch": 1.79, "percentage": 35.75, "elapsed_time": "2:00:38", "remaining_time": "3:36:49"}
{"current_steps": 1440, "total_steps": 4000, "loss": 0.3457, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.2116058029014505e-05, "epoch": 1.8, "percentage": 36.0, "elapsed_time": "2:01:30", "remaining_time": "3:36:00"}
{"current_steps": 1450, "total_steps": 4000, "loss": 0.3428, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.1990995497748875e-05, "epoch": 1.81, "percentage": 36.25, "elapsed_time": "2:02:22", "remaining_time": "3:35:12"}
{"current_steps": 1460, "total_steps": 4000, "loss": 0.3423, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.1865932966483245e-05, "epoch": 1.82, "percentage": 36.5, "elapsed_time": "2:03:13", "remaining_time": "3:34:23"}
{"current_steps": 1470, "total_steps": 4000, "loss": 0.3353, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.1740870435217615e-05, "epoch": 1.84, "percentage": 36.75, "elapsed_time": "2:04:04", "remaining_time": "3:33:33"}
{"current_steps": 1480, "total_steps": 4000, "loss": 0.3313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.161580790395198e-05, "epoch": 1.85, "percentage": 37.0, "elapsed_time": "2:04:56", "remaining_time": "3:32:44"}
{"current_steps": 1490, "total_steps": 4000, "loss": 0.3448, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.149074537268634e-05, "epoch": 1.86, "percentage": 37.25, "elapsed_time": "2:05:48", "remaining_time": "3:31:56"}
{"current_steps": 1500, "total_steps": 4000, "loss": 0.3515, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.136568284142071e-05, "epoch": 1.88, "percentage": 37.5, "elapsed_time": "2:06:39", "remaining_time": "3:31:05"}
{"current_steps": 1510, "total_steps": 4000, "loss": 0.3462, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.1240620310155075e-05, "epoch": 1.89, "percentage": 37.75, "elapsed_time": "2:07:30", "remaining_time": "3:30:15"}
{"current_steps": 1520, "total_steps": 4000, "loss": 0.3593, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.111555777888945e-05, "epoch": 1.9, "percentage": 38.0, "elapsed_time": "2:08:21", "remaining_time": "3:29:25"}
{"current_steps": 1530, "total_steps": 4000, "loss": 0.3467, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0990495247623815e-05, "epoch": 1.91, "percentage": 38.25, "elapsed_time": "2:09:12", "remaining_time": "3:28:35"}
{"current_steps": 1540, "total_steps": 4000, "loss": 0.3447, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.086543271635818e-05, "epoch": 1.93, "percentage": 38.5, "elapsed_time": "2:10:03", "remaining_time": "3:27:45"}
{"current_steps": 1550, "total_steps": 4000, "loss": 0.3575, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.074037018509255e-05, "epoch": 1.94, "percentage": 38.75, "elapsed_time": "2:10:54", "remaining_time": "3:26:55"}
{"current_steps": 1560, "total_steps": 4000, "loss": 0.3392, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.061530765382691e-05, "epoch": 1.95, "percentage": 39.0, "elapsed_time": "2:11:45", "remaining_time": "3:26:04"}
{"current_steps": 1570, "total_steps": 4000, "loss": 0.341, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0490245122561285e-05, "epoch": 1.96, "percentage": 39.25, "elapsed_time": "2:12:36", "remaining_time": "3:25:15"}
{"current_steps": 1580, "total_steps": 4000, "loss": 0.3337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0365182591295648e-05, "epoch": 1.98, "percentage": 39.5, "elapsed_time": "2:13:28", "remaining_time": "3:24:26"}
{"current_steps": 1590, "total_steps": 4000, "loss": 0.3352, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0240120060030014e-05, "epoch": 1.99, "percentage": 39.75, "elapsed_time": "2:14:19", "remaining_time": "3:23:36"}
{"current_steps": 1600, "total_steps": 4000, "loss": 0.338, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0115057528764385e-05, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "2:15:10", "remaining_time": "3:22:46"}
{"current_steps": 1610, "total_steps": 4000, "loss": 0.1203, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.9989994997498748e-05, "epoch": 2.01, "percentage": 40.25, "elapsed_time": "2:16:02", "remaining_time": "3:21:56"}
{"current_steps": 1620, "total_steps": 4000, "loss": 0.1226, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.986493246623312e-05, "epoch": 2.02, "percentage": 40.5, "elapsed_time": "2:16:50", "remaining_time": "3:21:02"}
{"current_steps": 1630, "total_steps": 4000, "loss": 0.1236, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.9739869934967484e-05, "epoch": 2.04, "percentage": 40.75, "elapsed_time": "2:17:38", "remaining_time": "3:20:07"}
{"current_steps": 1640, "total_steps": 4000, "loss": 0.1242, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.961480740370185e-05, "epoch": 2.05, "percentage": 41.0, "elapsed_time": "2:18:26", "remaining_time": "3:19:13"}
{"current_steps": 1650, "total_steps": 4000, "loss": 0.1243, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.948974487243622e-05, "epoch": 2.06, "percentage": 41.25, "elapsed_time": "2:19:14", "remaining_time": "3:18:19"}
{"current_steps": 1660, "total_steps": 4000, "loss": 0.1235, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.9364682341170584e-05, "epoch": 2.08, "percentage": 41.5, "elapsed_time": "2:20:02", "remaining_time": "3:17:24"}
{"current_steps": 1670, "total_steps": 4000, "loss": 0.1226, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.9239619809904954e-05, "epoch": 2.09, "percentage": 41.75, "elapsed_time": "2:20:51", "remaining_time": "3:16:31"}
{"current_steps": 1680, "total_steps": 4000, "loss": 0.1207, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.911455727863932e-05, "epoch": 2.1, "percentage": 42.0, "elapsed_time": "2:21:39", "remaining_time": "3:15:36"}
{"current_steps": 1690, "total_steps": 4000, "loss": 0.1324, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8989494747373684e-05, "epoch": 2.11, "percentage": 42.25, "elapsed_time": "2:22:27", "remaining_time": "3:14:43"}
{"current_steps": 1700, "total_steps": 4000, "loss": 0.132, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8864432216108054e-05, "epoch": 2.12, "percentage": 42.5, "elapsed_time": "2:23:16", "remaining_time": "3:13:50"}
{"current_steps": 1710, "total_steps": 4000, "loss": 0.1264, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.873936968484242e-05, "epoch": 2.14, "percentage": 42.75, "elapsed_time": "2:24:04", "remaining_time": "3:12:56"}
{"current_steps": 1720, "total_steps": 4000, "loss": 0.1366, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.861430715357679e-05, "epoch": 2.15, "percentage": 43.0, "elapsed_time": "2:24:52", "remaining_time": "3:12:02"}
{"current_steps": 1730, "total_steps": 4000, "loss": 0.1377, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8489244622311158e-05, "epoch": 2.16, "percentage": 43.25, "elapsed_time": "2:25:40", "remaining_time": "3:11:08"}
{"current_steps": 1740, "total_steps": 4000, "loss": 0.1225, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.836418209104552e-05, "epoch": 2.17, "percentage": 43.5, "elapsed_time": "2:26:29", "remaining_time": "3:10:15"}
{"current_steps": 1750, "total_steps": 4000, "loss": 0.1466, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.823911955977989e-05, "epoch": 2.19, "percentage": 43.75, "elapsed_time": "2:27:17", "remaining_time": "3:09:22"}
{"current_steps": 1760, "total_steps": 4000, "loss": 0.1415, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8114057028514258e-05, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "2:28:06", "remaining_time": "3:08:30"}
{"current_steps": 1770, "total_steps": 4000, "loss": 0.1309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7988994497248628e-05, "epoch": 2.21, "percentage": 44.25, "elapsed_time": "2:28:55", "remaining_time": "3:07:38"}
{"current_steps": 1780, "total_steps": 4000, "loss": 0.1432, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.786393196598299e-05, "epoch": 2.23, "percentage": 44.5, "elapsed_time": "2:29:44", "remaining_time": "3:06:45"}
{"current_steps": 1790, "total_steps": 4000, "loss": 0.1366, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7738869434717364e-05, "epoch": 2.24, "percentage": 44.75, "elapsed_time": "2:30:32", "remaining_time": "3:05:52"}
{"current_steps": 1800, "total_steps": 4000, "loss": 0.1408, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7613806903451728e-05, "epoch": 2.25, "percentage": 45.0, "elapsed_time": "2:31:20", "remaining_time": "3:04:58"}
{"current_steps": 1810, "total_steps": 4000, "loss": 0.1474, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7488744372186094e-05, "epoch": 2.26, "percentage": 45.25, "elapsed_time": "2:32:08", "remaining_time": "3:04:05"}
{"current_steps": 1820, "total_steps": 4000, "loss": 0.1393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7363681840920464e-05, "epoch": 2.27, "percentage": 45.5, "elapsed_time": "2:32:56", "remaining_time": "3:03:11"}
{"current_steps": 1830, "total_steps": 4000, "loss": 0.1271, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7238619309654828e-05, "epoch": 2.29, "percentage": 45.75, "elapsed_time": "2:33:44", "remaining_time": "3:02:18"}
{"current_steps": 1840, "total_steps": 4000, "loss": 0.1401, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7113556778389198e-05, "epoch": 2.3, "percentage": 46.0, "elapsed_time": "2:34:32", "remaining_time": "3:01:24"}
{"current_steps": 1850, "total_steps": 4000, "loss": 0.1363, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6988494247123564e-05, "epoch": 2.31, "percentage": 46.25, "elapsed_time": "2:35:19", "remaining_time": "3:00:30"}
{"current_steps": 1860, "total_steps": 4000, "loss": 0.1346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6863431715857928e-05, "epoch": 2.33, "percentage": 46.5, "elapsed_time": "2:36:08", "remaining_time": "2:59:38"}
{"current_steps": 1870, "total_steps": 4000, "loss": 0.1341, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6738369184592298e-05, "epoch": 2.34, "percentage": 46.75, "elapsed_time": "2:36:57", "remaining_time": "2:58:46"}
{"current_steps": 1880, "total_steps": 4000, "loss": 0.1365, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6613306653326664e-05, "epoch": 2.35, "percentage": 47.0, "elapsed_time": "2:37:45", "remaining_time": "2:57:53"}
{"current_steps": 1890, "total_steps": 4000, "loss": 0.1302, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6488244122061034e-05, "epoch": 2.36, "percentage": 47.25, "elapsed_time": "2:38:34", "remaining_time": "2:57:02"}
{"current_steps": 1900, "total_steps": 4000, "loss": 0.1437, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.63631815907954e-05, "epoch": 2.38, "percentage": 47.5, "elapsed_time": "2:39:22", "remaining_time": "2:56:09"}
{"current_steps": 1910, "total_steps": 4000, "loss": 0.1329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6238119059529764e-05, "epoch": 2.39, "percentage": 47.75, "elapsed_time": "2:40:10", "remaining_time": "2:55:16"}
{"current_steps": 1920, "total_steps": 4000, "loss": 0.1307, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6113056528264134e-05, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "2:40:58", "remaining_time": "2:54:23"}
{"current_steps": 1930, "total_steps": 4000, "loss": 0.1345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.59879939969985e-05, "epoch": 2.41, "percentage": 48.25, "elapsed_time": "2:41:47", "remaining_time": "2:53:31"}
{"current_steps": 1940, "total_steps": 4000, "loss": 0.134, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.586293146573287e-05, "epoch": 2.42, "percentage": 48.5, "elapsed_time": "2:42:35", "remaining_time": "2:52:39"}
{"current_steps": 1950, "total_steps": 4000, "loss": 0.1287, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.5737868934467234e-05, "epoch": 2.44, "percentage": 48.75, "elapsed_time": "2:43:23", "remaining_time": "2:51:46"}
{"current_steps": 1960, "total_steps": 4000, "loss": 0.157, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.56128064032016e-05, "epoch": 2.45, "percentage": 49.0, "elapsed_time": "2:44:11", "remaining_time": "2:50:53"}
{"current_steps": 1970, "total_steps": 4000, "loss": 0.124, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.548774387193597e-05, "epoch": 2.46, "percentage": 49.25, "elapsed_time": "2:45:00", "remaining_time": "2:50:02"}
{"current_steps": 1980, "total_steps": 4000, "loss": 0.1403, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.5362681340670334e-05, "epoch": 2.48, "percentage": 49.5, "elapsed_time": "2:45:48", "remaining_time": "2:49:09"}
{"current_steps": 1990, "total_steps": 4000, "loss": 0.1422, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.5237618809404708e-05, "epoch": 2.49, "percentage": 49.75, "elapsed_time": "2:46:36", "remaining_time": "2:48:16"}
{"current_steps": 2000, "total_steps": 4000, "loss": 0.1326, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.511255627813907e-05, "epoch": 2.5, "percentage": 50.0, "elapsed_time": "2:47:23", "remaining_time": "2:47:23"}
{"current_steps": 2010, "total_steps": 4000, "loss": 0.1295, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4987493746873438e-05, "epoch": 2.51, "percentage": 50.25, "elapsed_time": "2:48:12", "remaining_time": "2:46:31"}
{"current_steps": 2020, "total_steps": 4000, "loss": 0.1314, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4862431215607804e-05, "epoch": 2.52, "percentage": 50.5, "elapsed_time": "2:49:00", "remaining_time": "2:45:39"}
{"current_steps": 2030, "total_steps": 4000, "loss": 0.1346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.473736868434217e-05, "epoch": 2.54, "percentage": 50.75, "elapsed_time": "2:49:48", "remaining_time": "2:44:47"}
{"current_steps": 2040, "total_steps": 4000, "loss": 0.134, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.461230615307654e-05, "epoch": 2.55, "percentage": 51.0, "elapsed_time": "2:50:36", "remaining_time": "2:43:55"}
{"current_steps": 2050, "total_steps": 4000, "loss": 0.1237, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4487243621810908e-05, "epoch": 2.56, "percentage": 51.25, "elapsed_time": "2:51:25", "remaining_time": "2:43:03"}
{"current_steps": 2060, "total_steps": 4000, "loss": 0.1374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4362181090545274e-05, "epoch": 2.58, "percentage": 51.5, "elapsed_time": "2:52:14", "remaining_time": "2:42:12"}
{"current_steps": 2070, "total_steps": 4000, "loss": 0.1375, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.423711855927964e-05, "epoch": 2.59, "percentage": 51.75, "elapsed_time": "2:53:02", "remaining_time": "2:41:20"}
{"current_steps": 2080, "total_steps": 4000, "loss": 0.1392, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4112056028014007e-05, "epoch": 2.6, "percentage": 52.0, "elapsed_time": "2:53:50", "remaining_time": "2:40:27"}
{"current_steps": 2090, "total_steps": 4000, "loss": 0.1218, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3986993496748374e-05, "epoch": 2.61, "percentage": 52.25, "elapsed_time": "2:54:38", "remaining_time": "2:39:36"}
{"current_steps": 2100, "total_steps": 4000, "loss": 0.1304, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3861930965482744e-05, "epoch": 2.62, "percentage": 52.5, "elapsed_time": "2:55:26", "remaining_time": "2:38:43"}
{"current_steps": 2110, "total_steps": 4000, "loss": 0.1278, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.373686843421711e-05, "epoch": 2.64, "percentage": 52.75, "elapsed_time": "2:56:14", "remaining_time": "2:37:51"}
{"current_steps": 2120, "total_steps": 4000, "loss": 0.1297, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3611805902951477e-05, "epoch": 2.65, "percentage": 53.0, "elapsed_time": "2:57:02", "remaining_time": "2:36:59"}
{"current_steps": 2130, "total_steps": 4000, "loss": 0.1203, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3486743371685844e-05, "epoch": 2.66, "percentage": 53.25, "elapsed_time": "2:57:49", "remaining_time": "2:36:07"}
{"current_steps": 2140, "total_steps": 4000, "loss": 0.118, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.336168084042021e-05, "epoch": 2.67, "percentage": 53.5, "elapsed_time": "2:58:37", "remaining_time": "2:35:15"}
{"current_steps": 2150, "total_steps": 4000, "loss": 0.132, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3236618309154577e-05, "epoch": 2.69, "percentage": 53.75, "elapsed_time": "2:59:24", "remaining_time": "2:34:22"}
{"current_steps": 2160, "total_steps": 4000, "loss": 0.137, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3111555777888947e-05, "epoch": 2.7, "percentage": 54.0, "elapsed_time": "3:00:12", "remaining_time": "2:33:30"}
{"current_steps": 2170, "total_steps": 4000, "loss": 0.1359, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2986493246623314e-05, "epoch": 2.71, "percentage": 54.25, "elapsed_time": "3:01:01", "remaining_time": "2:32:40"}
{"current_steps": 2180, "total_steps": 4000, "loss": 0.1264, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2861430715357677e-05, "epoch": 2.73, "percentage": 54.5, "elapsed_time": "3:01:49", "remaining_time": "2:31:48"}
{"current_steps": 2190, "total_steps": 4000, "loss": 0.1251, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2736368184092047e-05, "epoch": 2.74, "percentage": 54.75, "elapsed_time": "3:02:37", "remaining_time": "2:30:56"}
{"current_steps": 2200, "total_steps": 4000, "loss": 0.1296, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2611305652826414e-05, "epoch": 2.75, "percentage": 55.0, "elapsed_time": "3:03:25", "remaining_time": "2:30:04"}
{"current_steps": 2210, "total_steps": 4000, "loss": 0.1247, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.248624312156078e-05, "epoch": 2.76, "percentage": 55.25, "elapsed_time": "3:04:13", "remaining_time": "2:29:13"}
{"current_steps": 2220, "total_steps": 4000, "loss": 0.1303, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.236118059029515e-05, "epoch": 2.77, "percentage": 55.5, "elapsed_time": "3:05:02", "remaining_time": "2:28:21"}
{"current_steps": 2230, "total_steps": 4000, "loss": 0.131, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2236118059029514e-05, "epoch": 2.79, "percentage": 55.75, "elapsed_time": "3:05:49", "remaining_time": "2:27:29"}
{"current_steps": 2240, "total_steps": 4000, "loss": 0.1427, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2111055527763884e-05, "epoch": 2.8, "percentage": 56.0, "elapsed_time": "3:06:38", "remaining_time": "2:26:38"}
{"current_steps": 2250, "total_steps": 4000, "loss": 0.1313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.198599299649825e-05, "epoch": 2.81, "percentage": 56.25, "elapsed_time": "3:07:26", "remaining_time": "2:25:47"}
{"current_steps": 2260, "total_steps": 4000, "loss": 0.1306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1860930465232617e-05, "epoch": 2.83, "percentage": 56.5, "elapsed_time": "3:08:15", "remaining_time": "2:24:56"}
{"current_steps": 2270, "total_steps": 4000, "loss": 0.127, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1735867933966987e-05, "epoch": 2.84, "percentage": 56.75, "elapsed_time": "3:09:03", "remaining_time": "2:24:04"}
{"current_steps": 2280, "total_steps": 4000, "loss": 0.1191, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.161080540270135e-05, "epoch": 2.85, "percentage": 57.0, "elapsed_time": "3:09:51", "remaining_time": "2:23:13"}
{"current_steps": 2290, "total_steps": 4000, "loss": 0.1256, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1485742871435717e-05, "epoch": 2.86, "percentage": 57.25, "elapsed_time": "3:10:39", "remaining_time": "2:22:22"}
{"current_steps": 2300, "total_steps": 4000, "loss": 0.1238, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1360680340170087e-05, "epoch": 2.88, "percentage": 57.5, "elapsed_time": "3:11:29", "remaining_time": "2:21:32"}
{"current_steps": 2310, "total_steps": 4000, "loss": 0.1271, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1235617808904454e-05, "epoch": 2.89, "percentage": 57.75, "elapsed_time": "3:12:17", "remaining_time": "2:20:40"}
{"current_steps": 2320, "total_steps": 4000, "loss": 0.1255, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.111055527763882e-05, "epoch": 2.9, "percentage": 58.0, "elapsed_time": "3:13:05", "remaining_time": "2:19:49"}
{"current_steps": 2330, "total_steps": 4000, "loss": 0.1291, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0985492746373187e-05, "epoch": 2.91, "percentage": 58.25, "elapsed_time": "3:13:52", "remaining_time": "2:18:57"}
{"current_steps": 2340, "total_steps": 4000, "loss": 0.137, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0860430215107554e-05, "epoch": 2.92, "percentage": 58.5, "elapsed_time": "3:14:40", "remaining_time": "2:18:06"}
{"current_steps": 2350, "total_steps": 4000, "loss": 0.1274, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.073536768384192e-05, "epoch": 2.94, "percentage": 58.75, "elapsed_time": "3:15:28", "remaining_time": "2:17:14"}
{"current_steps": 2360, "total_steps": 4000, "loss": 0.121, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.061030515257629e-05, "epoch": 2.95, "percentage": 59.0, "elapsed_time": "3:16:16", "remaining_time": "2:16:23"}
{"current_steps": 2370, "total_steps": 4000, "loss": 0.1221, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0485242621310657e-05, "epoch": 2.96, "percentage": 59.25, "elapsed_time": "3:17:04", "remaining_time": "2:15:32"}
{"current_steps": 2380, "total_steps": 4000, "loss": 0.1274, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0360180090045024e-05, "epoch": 2.98, "percentage": 59.5, "elapsed_time": "3:17:52", "remaining_time": "2:14:41"}
{"current_steps": 2390, "total_steps": 4000, "loss": 0.1161, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.023511755877939e-05, "epoch": 2.99, "percentage": 59.75, "elapsed_time": "3:18:40", "remaining_time": "2:13:50"}
{"current_steps": 2400, "total_steps": 4000, "loss": 0.1261, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0110055027513757e-05, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "3:19:28", "remaining_time": "2:12:59"}
{"current_steps": 2410, "total_steps": 4000, "loss": 0.0474, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9984992496248124e-05, "epoch": 3.01, "percentage": 60.25, "elapsed_time": "3:20:16", "remaining_time": "2:12:07"}
{"current_steps": 2420, "total_steps": 4000, "loss": 0.0443, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9859929964982494e-05, "epoch": 3.02, "percentage": 60.5, "elapsed_time": "3:21:03", "remaining_time": "2:11:16"}
{"current_steps": 2430, "total_steps": 4000, "loss": 0.0424, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9734867433716857e-05, "epoch": 3.04, "percentage": 60.75, "elapsed_time": "3:21:51", "remaining_time": "2:10:25"}
{"current_steps": 2440, "total_steps": 4000, "loss": 0.0545, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9609804902451227e-05, "epoch": 3.05, "percentage": 61.0, "elapsed_time": "3:22:39", "remaining_time": "2:09:34"}
{"current_steps": 2450, "total_steps": 4000, "loss": 0.0539, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9484742371185594e-05, "epoch": 3.06, "percentage": 61.25, "elapsed_time": "3:23:27", "remaining_time": "2:08:43"}
{"current_steps": 2460, "total_steps": 4000, "loss": 0.0516, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.935967983991996e-05, "epoch": 3.08, "percentage": 61.5, "elapsed_time": "3:24:14", "remaining_time": "2:07:51"}
{"current_steps": 2470, "total_steps": 4000, "loss": 0.0496, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.923461730865433e-05, "epoch": 3.09, "percentage": 61.75, "elapsed_time": "3:25:02", "remaining_time": "2:07:00"}
{"current_steps": 2480, "total_steps": 4000, "loss": 0.048, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9109554777388694e-05, "epoch": 3.1, "percentage": 62.0, "elapsed_time": "3:25:50", "remaining_time": "2:06:09"}
{"current_steps": 2490, "total_steps": 4000, "loss": 0.054, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.898449224612306e-05, "epoch": 3.11, "percentage": 62.25, "elapsed_time": "3:26:38", "remaining_time": "2:05:18"}
{"current_steps": 2500, "total_steps": 4000, "loss": 0.06, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.885942971485743e-05, "epoch": 3.12, "percentage": 62.5, "elapsed_time": "3:27:26", "remaining_time": "2:04:28"}
{"current_steps": 2510, "total_steps": 4000, "loss": 0.056, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8734367183591797e-05, "epoch": 3.14, "percentage": 62.75, "elapsed_time": "3:28:14", "remaining_time": "2:03:37"}
{"current_steps": 2520, "total_steps": 4000, "loss": 0.0558, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8609304652326164e-05, "epoch": 3.15, "percentage": 63.0, "elapsed_time": "3:29:03", "remaining_time": "2:02:46"}
{"current_steps": 2530, "total_steps": 4000, "loss": 0.0541, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.848424212106053e-05, "epoch": 3.16, "percentage": 63.25, "elapsed_time": "3:29:51", "remaining_time": "2:01:55"}
{"current_steps": 2540, "total_steps": 4000, "loss": 0.0586, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8359179589794897e-05, "epoch": 3.17, "percentage": 63.5, "elapsed_time": "3:30:38", "remaining_time": "2:01:04"}
{"current_steps": 2550, "total_steps": 4000, "loss": 0.05, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8234117058529264e-05, "epoch": 3.19, "percentage": 63.75, "elapsed_time": "3:31:26", "remaining_time": "2:00:14"}
{"current_steps": 2560, "total_steps": 4000, "loss": 0.0578, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8109054527263634e-05, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "3:32:14", "remaining_time": "1:59:23"}
{"current_steps": 2570, "total_steps": 4000, "loss": 0.0524, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7983991995998e-05, "epoch": 3.21, "percentage": 64.25, "elapsed_time": "3:33:02", "remaining_time": "1:58:32"}
{"current_steps": 2580, "total_steps": 4000, "loss": 0.0481, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7858929464732367e-05, "epoch": 3.23, "percentage": 64.5, "elapsed_time": "3:33:50", "remaining_time": "1:57:41"}
{"current_steps": 2590, "total_steps": 4000, "loss": 0.0475, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7733866933466734e-05, "epoch": 3.24, "percentage": 64.75, "elapsed_time": "3:34:39", "remaining_time": "1:56:51"}
{"current_steps": 2600, "total_steps": 4000, "loss": 0.0522, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.76088044022011e-05, "epoch": 3.25, "percentage": 65.0, "elapsed_time": "3:35:27", "remaining_time": "1:56:00"}
{"current_steps": 2610, "total_steps": 4000, "loss": 0.0541, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.748374187093547e-05, "epoch": 3.26, "percentage": 65.25, "elapsed_time": "3:36:15", "remaining_time": "1:55:10"}
{"current_steps": 2620, "total_steps": 4000, "loss": 0.0507, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7358679339669837e-05, "epoch": 3.27, "percentage": 65.5, "elapsed_time": "3:37:03", "remaining_time": "1:54:19"}
{"current_steps": 2630, "total_steps": 4000, "loss": 0.0485, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.72336168084042e-05, "epoch": 3.29, "percentage": 65.75, "elapsed_time": "3:37:51", "remaining_time": "1:53:29"}
{"current_steps": 2640, "total_steps": 4000, "loss": 0.0532, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.710855427713857e-05, "epoch": 3.3, "percentage": 66.0, "elapsed_time": "3:38:39", "remaining_time": "1:52:38"}
{"current_steps": 2650, "total_steps": 4000, "loss": 0.0577, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6983491745872937e-05, "epoch": 3.31, "percentage": 66.25, "elapsed_time": "3:39:26", "remaining_time": "1:51:47"}
{"current_steps": 2660, "total_steps": 4000, "loss": 0.0456, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6858429214607304e-05, "epoch": 3.33, "percentage": 66.5, "elapsed_time": "3:40:14", "remaining_time": "1:50:56"}
{"current_steps": 2670, "total_steps": 4000, "loss": 0.0546, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6733366683341674e-05, "epoch": 3.34, "percentage": 66.75, "elapsed_time": "3:41:02", "remaining_time": "1:50:06"}
{"current_steps": 2680, "total_steps": 4000, "loss": 0.0535, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.660830415207604e-05, "epoch": 3.35, "percentage": 67.0, "elapsed_time": "3:41:50", "remaining_time": "1:49:15"}
{"current_steps": 2690, "total_steps": 4000, "loss": 0.0451, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6483241620810404e-05, "epoch": 3.36, "percentage": 67.25, "elapsed_time": "3:42:38", "remaining_time": "1:48:25"}
{"current_steps": 2700, "total_steps": 4000, "loss": 0.0547, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6358179089544774e-05, "epoch": 3.38, "percentage": 67.5, "elapsed_time": "3:43:26", "remaining_time": "1:47:34"}
{"current_steps": 2710, "total_steps": 4000, "loss": 0.0545, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.623311655827914e-05, "epoch": 3.39, "percentage": 67.75, "elapsed_time": "3:44:14", "remaining_time": "1:46:44"}
{"current_steps": 2720, "total_steps": 4000, "loss": 0.048, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6108054027013507e-05, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "3:45:02", "remaining_time": "1:45:54"}
{"current_steps": 2730, "total_steps": 4000, "loss": 0.0508, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5982991495747877e-05, "epoch": 3.41, "percentage": 68.25, "elapsed_time": "3:45:51", "remaining_time": "1:45:04"}
{"current_steps": 2740, "total_steps": 4000, "loss": 0.048, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.585792896448224e-05, "epoch": 3.42, "percentage": 68.5, "elapsed_time": "3:46:38", "remaining_time": "1:44:13"}
{"current_steps": 2750, "total_steps": 4000, "loss": 0.0535, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.573286643321661e-05, "epoch": 3.44, "percentage": 68.75, "elapsed_time": "3:47:27", "remaining_time": "1:43:23"}
{"current_steps": 2760, "total_steps": 4000, "loss": 0.0511, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5607803901950977e-05, "epoch": 3.45, "percentage": 69.0, "elapsed_time": "3:48:16", "remaining_time": "1:42:33"}
{"current_steps": 2770, "total_steps": 4000, "loss": 0.0492, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5482741370685344e-05, "epoch": 3.46, "percentage": 69.25, "elapsed_time": "3:49:04", "remaining_time": "1:41:42"}
{"current_steps": 2780, "total_steps": 4000, "loss": 0.0508, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.535767883941971e-05, "epoch": 3.48, "percentage": 69.5, "elapsed_time": "3:49:52", "remaining_time": "1:40:52"}
{"current_steps": 2790, "total_steps": 4000, "loss": 0.0515, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5232616308154077e-05, "epoch": 3.49, "percentage": 69.75, "elapsed_time": "3:50:40", "remaining_time": "1:40:02"}
{"current_steps": 2800, "total_steps": 4000, "loss": 0.0469, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5107553776888445e-05, "epoch": 3.5, "percentage": 70.0, "elapsed_time": "3:51:29", "remaining_time": "1:39:12"}
{"current_steps": 2810, "total_steps": 4000, "loss": 0.0424, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4982491245622812e-05, "epoch": 3.51, "percentage": 70.25, "elapsed_time": "3:52:18", "remaining_time": "1:38:22"}
{"current_steps": 2820, "total_steps": 4000, "loss": 0.0452, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.485742871435718e-05, "epoch": 3.52, "percentage": 70.5, "elapsed_time": "3:53:06", "remaining_time": "1:37:32"}
{"current_steps": 2830, "total_steps": 4000, "loss": 0.054, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4732366183091547e-05, "epoch": 3.54, "percentage": 70.75, "elapsed_time": "3:53:54", "remaining_time": "1:36:42"}
{"current_steps": 2840, "total_steps": 4000, "loss": 0.05, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4607303651825912e-05, "epoch": 3.55, "percentage": 71.0, "elapsed_time": "3:54:41", "remaining_time": "1:35:51"}
{"current_steps": 2850, "total_steps": 4000, "loss": 0.0484, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.448224112056028e-05, "epoch": 3.56, "percentage": 71.25, "elapsed_time": "3:55:29", "remaining_time": "1:35:01"}
{"current_steps": 2860, "total_steps": 4000, "loss": 0.0495, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4357178589294649e-05, "epoch": 3.58, "percentage": 71.5, "elapsed_time": "3:56:20", "remaining_time": "1:34:12"}
{"current_steps": 2870, "total_steps": 4000, "loss": 0.0449, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4232116058029015e-05, "epoch": 3.59, "percentage": 71.75, "elapsed_time": "3:57:11", "remaining_time": "1:33:23"}
{"current_steps": 2880, "total_steps": 4000, "loss": 0.0535, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4107053526763384e-05, "epoch": 3.6, "percentage": 72.0, "elapsed_time": "3:58:03", "remaining_time": "1:32:34"}
{"current_steps": 2890, "total_steps": 4000, "loss": 0.0497, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3981990995497749e-05, "epoch": 3.61, "percentage": 72.25, "elapsed_time": "3:58:53", "remaining_time": "1:31:45"}
{"current_steps": 2900, "total_steps": 4000, "loss": 0.0479, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3856928464232117e-05, "epoch": 3.62, "percentage": 72.5, "elapsed_time": "3:59:44", "remaining_time": "1:30:56"}
{"current_steps": 2910, "total_steps": 4000, "loss": 0.0456, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3731865932966484e-05, "epoch": 3.64, "percentage": 72.75, "elapsed_time": "4:00:36", "remaining_time": "1:30:07"}
{"current_steps": 2920, "total_steps": 4000, "loss": 0.0581, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3606803401700852e-05, "epoch": 3.65, "percentage": 73.0, "elapsed_time": "4:01:27", "remaining_time": "1:29:18"}
{"current_steps": 2930, "total_steps": 4000, "loss": 0.0467, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.348174087043522e-05, "epoch": 3.66, "percentage": 73.25, "elapsed_time": "4:02:18", "remaining_time": "1:28:29"}
{"current_steps": 2940, "total_steps": 4000, "loss": 0.0427, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3356678339169585e-05, "epoch": 3.67, "percentage": 73.5, "elapsed_time": "4:03:10", "remaining_time": "1:27:40"}
{"current_steps": 2950, "total_steps": 4000, "loss": 0.0451, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3231615807903952e-05, "epoch": 3.69, "percentage": 73.75, "elapsed_time": "4:04:01", "remaining_time": "1:26:51"}
{"current_steps": 2960, "total_steps": 4000, "loss": 0.0478, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.310655327663832e-05, "epoch": 3.7, "percentage": 74.0, "elapsed_time": "4:04:52", "remaining_time": "1:26:02"}
{"current_steps": 2970, "total_steps": 4000, "loss": 0.0468, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2981490745372687e-05, "epoch": 3.71, "percentage": 74.25, "elapsed_time": "4:05:43", "remaining_time": "1:25:13"}
{"current_steps": 2980, "total_steps": 4000, "loss": 0.0433, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2856428214107055e-05, "epoch": 3.73, "percentage": 74.5, "elapsed_time": "4:06:35", "remaining_time": "1:24:24"}
{"current_steps": 2990, "total_steps": 4000, "loss": 0.0491, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.273136568284142e-05, "epoch": 3.74, "percentage": 74.75, "elapsed_time": "4:07:27", "remaining_time": "1:23:35"}
{"current_steps": 3000, "total_steps": 4000, "loss": 0.0441, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2606303151575788e-05, "epoch": 3.75, "percentage": 75.0, "elapsed_time": "4:08:18", "remaining_time": "1:22:46"}
{"current_steps": 3010, "total_steps": 4000, "loss": 0.0442, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2481240620310155e-05, "epoch": 3.76, "percentage": 75.25, "elapsed_time": "4:09:10", "remaining_time": "1:21:57"}
{"current_steps": 3020, "total_steps": 4000, "loss": 0.0438, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2356178089044523e-05, "epoch": 3.77, "percentage": 75.5, "elapsed_time": "4:10:01", "remaining_time": "1:21:07"}
{"current_steps": 3030, "total_steps": 4000, "loss": 0.05, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.223111555777889e-05, "epoch": 3.79, "percentage": 75.75, "elapsed_time": "4:10:52", "remaining_time": "1:20:18"}
{"current_steps": 3040, "total_steps": 4000, "loss": 0.0442, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2106053026513257e-05, "epoch": 3.8, "percentage": 76.0, "elapsed_time": "4:11:44", "remaining_time": "1:19:29"}
{"current_steps": 3050, "total_steps": 4000, "loss": 0.0453, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1980990495247623e-05, "epoch": 3.81, "percentage": 76.25, "elapsed_time": "4:12:35", "remaining_time": "1:18:40"}
{"current_steps": 3060, "total_steps": 4000, "loss": 0.0444, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1855927963981992e-05, "epoch": 3.83, "percentage": 76.5, "elapsed_time": "4:13:26", "remaining_time": "1:17:51"}
{"current_steps": 3070, "total_steps": 4000, "loss": 0.0408, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1730865432716358e-05, "epoch": 3.84, "percentage": 76.75, "elapsed_time": "4:14:17", "remaining_time": "1:17:01"}
{"current_steps": 3080, "total_steps": 4000, "loss": 0.0392, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1605802901450725e-05, "epoch": 3.85, "percentage": 77.0, "elapsed_time": "4:15:07", "remaining_time": "1:16:12"}
{"current_steps": 3090, "total_steps": 4000, "loss": 0.0388, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1480740370185093e-05, "epoch": 3.86, "percentage": 77.25, "elapsed_time": "4:15:58", "remaining_time": "1:15:23"}
{"current_steps": 3100, "total_steps": 4000, "loss": 0.0432, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1355677838919462e-05, "epoch": 3.88, "percentage": 77.5, "elapsed_time": "4:16:49", "remaining_time": "1:14:33"}
{"current_steps": 3110, "total_steps": 4000, "loss": 0.0441, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1230615307653827e-05, "epoch": 3.89, "percentage": 77.75, "elapsed_time": "4:17:41", "remaining_time": "1:13:44"}
{"current_steps": 3120, "total_steps": 4000, "loss": 0.0475, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1105552776388195e-05, "epoch": 3.9, "percentage": 78.0, "elapsed_time": "4:18:32", "remaining_time": "1:12:55"}
{"current_steps": 3130, "total_steps": 4000, "loss": 0.0398, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0980490245122562e-05, "epoch": 3.91, "percentage": 78.25, "elapsed_time": "4:19:24", "remaining_time": "1:12:06"}
{"current_steps": 3140, "total_steps": 4000, "loss": 0.0471, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0855427713856928e-05, "epoch": 3.92, "percentage": 78.5, "elapsed_time": "4:20:15", "remaining_time": "1:11:16"}
{"current_steps": 3150, "total_steps": 4000, "loss": 0.0443, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0730365182591297e-05, "epoch": 3.94, "percentage": 78.75, "elapsed_time": "4:21:06", "remaining_time": "1:10:27"}
{"current_steps": 3160, "total_steps": 4000, "loss": 0.0472, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0605302651325663e-05, "epoch": 3.95, "percentage": 79.0, "elapsed_time": "4:21:57", "remaining_time": "1:09:38"}
{"current_steps": 3170, "total_steps": 4000, "loss": 0.0433, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0480240120060032e-05, "epoch": 3.96, "percentage": 79.25, "elapsed_time": "4:22:49", "remaining_time": "1:08:49"}
{"current_steps": 3180, "total_steps": 4000, "loss": 0.0383, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0355177588794397e-05, "epoch": 3.98, "percentage": 79.5, "elapsed_time": "4:23:41", "remaining_time": "1:07:59"}
{"current_steps": 3190, "total_steps": 4000, "loss": 0.0459, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0230115057528765e-05, "epoch": 3.99, "percentage": 79.75, "elapsed_time": "4:24:34", "remaining_time": "1:07:10"}
{"current_steps": 3200, "total_steps": 4000, "loss": 0.0419, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0105052526263133e-05, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "4:25:25", "remaining_time": "1:06:21"}
{"current_steps": 3210, "total_steps": 4000, "loss": 0.0166, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.979989994997498e-06, "epoch": 4.01, "percentage": 80.25, "elapsed_time": "4:26:18", "remaining_time": "1:05:32"}
{"current_steps": 3220, "total_steps": 4000, "loss": 0.0147, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.854927463731867e-06, "epoch": 4.03, "percentage": 80.5, "elapsed_time": "4:27:09", "remaining_time": "1:04:42"}
{"current_steps": 3230, "total_steps": 4000, "loss": 0.0157, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.729864932466233e-06, "epoch": 4.04, "percentage": 80.75, "elapsed_time": "4:28:01", "remaining_time": "1:03:53"}
{"current_steps": 3240, "total_steps": 4000, "loss": 0.0188, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.604802401200602e-06, "epoch": 4.05, "percentage": 81.0, "elapsed_time": "4:28:51", "remaining_time": "1:03:04"}
{"current_steps": 3250, "total_steps": 4000, "loss": 0.0133, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.479739869934968e-06, "epoch": 4.06, "percentage": 81.25, "elapsed_time": "4:29:43", "remaining_time": "1:02:14"}
{"current_steps": 3260, "total_steps": 4000, "loss": 0.0139, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.354677338669335e-06, "epoch": 4.08, "percentage": 81.5, "elapsed_time": "4:30:35", "remaining_time": "1:01:25"}
{"current_steps": 3270, "total_steps": 4000, "loss": 0.0178, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.229614807403703e-06, "epoch": 4.09, "percentage": 81.75, "elapsed_time": "4:31:25", "remaining_time": "1:00:35"}
{"current_steps": 3280, "total_steps": 4000, "loss": 0.0166, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.104552276138068e-06, "epoch": 4.1, "percentage": 82.0, "elapsed_time": "4:32:17", "remaining_time": "0:59:46"}
{"current_steps": 3290, "total_steps": 4000, "loss": 0.0126, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.979489744872437e-06, "epoch": 4.11, "percentage": 82.25, "elapsed_time": "4:33:09", "remaining_time": "0:58:56"}
{"current_steps": 3300, "total_steps": 4000, "loss": 0.0194, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.854427213606805e-06, "epoch": 4.12, "percentage": 82.5, "elapsed_time": "4:34:00", "remaining_time": "0:58:07"}
{"current_steps": 3310, "total_steps": 4000, "loss": 0.0185, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.72936468234117e-06, "epoch": 4.14, "percentage": 82.75, "elapsed_time": "4:34:52", "remaining_time": "0:57:18"}
{"current_steps": 3320, "total_steps": 4000, "loss": 0.0127, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.604302151075538e-06, "epoch": 4.15, "percentage": 83.0, "elapsed_time": "4:35:43", "remaining_time": "0:56:28"}
{"current_steps": 3330, "total_steps": 4000, "loss": 0.0153, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.479239619809905e-06, "epoch": 4.16, "percentage": 83.25, "elapsed_time": "4:36:35", "remaining_time": "0:55:39"}
{"current_steps": 3340, "total_steps": 4000, "loss": 0.0196, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.354177088544273e-06, "epoch": 4.17, "percentage": 83.5, "elapsed_time": "4:37:27", "remaining_time": "0:54:49"}
{"current_steps": 3350, "total_steps": 4000, "loss": 0.0157, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.22911455727864e-06, "epoch": 4.19, "percentage": 83.75, "elapsed_time": "4:38:18", "remaining_time": "0:54:00"}
{"current_steps": 3360, "total_steps": 4000, "loss": 0.0161, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.104052026013006e-06, "epoch": 4.2, "percentage": 84.0, "elapsed_time": "4:39:10", "remaining_time": "0:53:10"}
{"current_steps": 3370, "total_steps": 4000, "loss": 0.0147, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.978989494747375e-06, "epoch": 4.21, "percentage": 84.25, "elapsed_time": "4:40:02", "remaining_time": "0:52:21"}
{"current_steps": 3380, "total_steps": 4000, "loss": 0.0133, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.85392696348174e-06, "epoch": 4.22, "percentage": 84.5, "elapsed_time": "4:40:53", "remaining_time": "0:51:31"}
{"current_steps": 3390, "total_steps": 4000, "loss": 0.0148, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.728864432216108e-06, "epoch": 4.24, "percentage": 84.75, "elapsed_time": "4:41:44", "remaining_time": "0:50:41"}
{"current_steps": 3400, "total_steps": 4000, "loss": 0.0142, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.603801900950476e-06, "epoch": 4.25, "percentage": 85.0, "elapsed_time": "4:42:36", "remaining_time": "0:49:52"}
{"current_steps": 3410, "total_steps": 4000, "loss": 0.016, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.478739369684842e-06, "epoch": 4.26, "percentage": 85.25, "elapsed_time": "4:43:27", "remaining_time": "0:49:02"}
{"current_steps": 3420, "total_steps": 4000, "loss": 0.0144, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.35367683841921e-06, "epoch": 4.28, "percentage": 85.5, "elapsed_time": "4:44:18", "remaining_time": "0:48:13"}
{"current_steps": 3430, "total_steps": 4000, "loss": 0.0145, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.228614307153578e-06, "epoch": 4.29, "percentage": 85.75, "elapsed_time": "4:45:10", "remaining_time": "0:47:23"}
{"current_steps": 3440, "total_steps": 4000, "loss": 0.0144, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.103551775887944e-06, "epoch": 4.3, "percentage": 86.0, "elapsed_time": "4:46:01", "remaining_time": "0:46:33"}
{"current_steps": 3450, "total_steps": 4000, "loss": 0.0134, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.978489244622312e-06, "epoch": 4.31, "percentage": 86.25, "elapsed_time": "4:46:53", "remaining_time": "0:45:44"}
{"current_steps": 3460, "total_steps": 4000, "loss": 0.0136, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.853426713356678e-06, "epoch": 4.33, "percentage": 86.5, "elapsed_time": "4:47:44", "remaining_time": "0:44:54"}
{"current_steps": 3470, "total_steps": 4000, "loss": 0.017, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.7283641820910456e-06, "epoch": 4.34, "percentage": 86.75, "elapsed_time": "4:48:35", "remaining_time": "0:44:04"}
{"current_steps": 3480, "total_steps": 4000, "loss": 0.0138, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.603301650825414e-06, "epoch": 4.35, "percentage": 87.0, "elapsed_time": "4:49:26", "remaining_time": "0:43:15"}
{"current_steps": 3490, "total_steps": 4000, "loss": 0.0131, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.47823911955978e-06, "epoch": 4.36, "percentage": 87.25, "elapsed_time": "4:50:18", "remaining_time": "0:42:25"}
{"current_steps": 3500, "total_steps": 4000, "loss": 0.0152, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.353176588294148e-06, "epoch": 4.38, "percentage": 87.5, "elapsed_time": "4:51:09", "remaining_time": "0:41:35"}
{"current_steps": 3510, "total_steps": 4000, "loss": 0.0136, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.228114057028515e-06, "epoch": 4.39, "percentage": 87.75, "elapsed_time": "4:52:00", "remaining_time": "0:40:45"}
{"current_steps": 3520, "total_steps": 4000, "loss": 0.0158, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.103051525762881e-06, "epoch": 4.4, "percentage": 88.0, "elapsed_time": "4:52:52", "remaining_time": "0:39:56"}
{"current_steps": 3530, "total_steps": 4000, "loss": 0.0143, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.977988994497249e-06, "epoch": 4.41, "percentage": 88.25, "elapsed_time": "4:53:43", "remaining_time": "0:39:06"}
{"current_steps": 3540, "total_steps": 4000, "loss": 0.0133, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.8529264632316155e-06, "epoch": 4.42, "percentage": 88.5, "elapsed_time": "4:54:34", "remaining_time": "0:38:16"}
{"current_steps": 3550, "total_steps": 4000, "loss": 0.0154, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.727863931965984e-06, "epoch": 4.44, "percentage": 88.75, "elapsed_time": "4:55:25", "remaining_time": "0:37:26"}
{"current_steps": 3560, "total_steps": 4000, "loss": 0.0114, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.6028014007003505e-06, "epoch": 4.45, "percentage": 89.0, "elapsed_time": "4:56:16", "remaining_time": "0:36:37"}
{"current_steps": 3570, "total_steps": 4000, "loss": 0.0135, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.477738869434718e-06, "epoch": 4.46, "percentage": 89.25, "elapsed_time": "4:57:05", "remaining_time": "0:35:47"}
{"current_steps": 3580, "total_steps": 4000, "loss": 0.0131, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.352676338169085e-06, "epoch": 4.47, "percentage": 89.5, "elapsed_time": "4:57:53", "remaining_time": "0:34:56"}
{"current_steps": 3590, "total_steps": 4000, "loss": 0.0128, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.227613806903451e-06, "epoch": 4.49, "percentage": 89.75, "elapsed_time": "4:58:41", "remaining_time": "0:34:06"}
{"current_steps": 3600, "total_steps": 4000, "loss": 0.0112, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.10255127563782e-06, "epoch": 4.5, "percentage": 90.0, "elapsed_time": "4:59:29", "remaining_time": "0:33:16"}
{"current_steps": 3610, "total_steps": 4000, "loss": 0.0154, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.977488744372186e-06, "epoch": 4.51, "percentage": 90.25, "elapsed_time": "5:00:17", "remaining_time": "0:32:26"}
{"current_steps": 3620, "total_steps": 4000, "loss": 0.0131, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.852426213106554e-06, "epoch": 4.53, "percentage": 90.5, "elapsed_time": "5:01:05", "remaining_time": "0:31:36"}
{"current_steps": 3630, "total_steps": 4000, "loss": 0.0152, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7273636818409205e-06, "epoch": 4.54, "percentage": 90.75, "elapsed_time": "5:01:54", "remaining_time": "0:30:46"}
{"current_steps": 3640, "total_steps": 4000, "loss": 0.01, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.602301150575288e-06, "epoch": 4.55, "percentage": 91.0, "elapsed_time": "5:02:42", "remaining_time": "0:29:56"}
{"current_steps": 3650, "total_steps": 4000, "loss": 0.0158, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.4772386193096554e-06, "epoch": 4.56, "percentage": 91.25, "elapsed_time": "5:03:30", "remaining_time": "0:29:06"}
{"current_steps": 3660, "total_steps": 4000, "loss": 0.0137, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.352176088044022e-06, "epoch": 4.58, "percentage": 91.5, "elapsed_time": "5:04:19", "remaining_time": "0:28:16"}
{"current_steps": 3670, "total_steps": 4000, "loss": 0.0108, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.22711355677839e-06, "epoch": 4.59, "percentage": 91.75, "elapsed_time": "5:05:07", "remaining_time": "0:27:26"}
{"current_steps": 3680, "total_steps": 4000, "loss": 0.0125, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.102051025512756e-06, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "5:05:55", "remaining_time": "0:26:36"}
{"current_steps": 3690, "total_steps": 4000, "loss": 0.0157, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.976988494247124e-06, "epoch": 4.61, "percentage": 92.25, "elapsed_time": "5:06:43", "remaining_time": "0:25:46"}
{"current_steps": 3700, "total_steps": 4000, "loss": 0.0109, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.851925962981491e-06, "epoch": 4.62, "percentage": 92.5, "elapsed_time": "5:07:31", "remaining_time": "0:24:56"}
{"current_steps": 3710, "total_steps": 4000, "loss": 0.012, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.726863431715858e-06, "epoch": 4.64, "percentage": 92.75, "elapsed_time": "5:08:20", "remaining_time": "0:24:06"}
{"current_steps": 3720, "total_steps": 4000, "loss": 0.0118, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.601800900450225e-06, "epoch": 4.65, "percentage": 93.0, "elapsed_time": "5:09:08", "remaining_time": "0:23:16"}
{"current_steps": 3730, "total_steps": 4000, "loss": 0.0136, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.476738369184592e-06, "epoch": 4.66, "percentage": 93.25, "elapsed_time": "5:09:56", "remaining_time": "0:22:26"}
{"current_steps": 3740, "total_steps": 4000, "loss": 0.0162, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.35167583791896e-06, "epoch": 4.67, "percentage": 93.5, "elapsed_time": "5:10:44", "remaining_time": "0:21:36"}
{"current_steps": 3750, "total_steps": 4000, "loss": 0.0115, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.226613306653327e-06, "epoch": 4.69, "percentage": 93.75, "elapsed_time": "5:11:32", "remaining_time": "0:20:46"}
{"current_steps": 3760, "total_steps": 4000, "loss": 0.0096, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.101550775387694e-06, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "5:12:20", "remaining_time": "0:19:56"}
{"current_steps": 3770, "total_steps": 4000, "loss": 0.0172, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.976488244122061e-06, "epoch": 4.71, "percentage": 94.25, "elapsed_time": "5:13:08", "remaining_time": "0:19:06"}
{"current_steps": 3780, "total_steps": 4000, "loss": 0.0123, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8514257128564283e-06, "epoch": 4.72, "percentage": 94.5, "elapsed_time": "5:13:55", "remaining_time": "0:18:16"}
{"current_steps": 3790, "total_steps": 4000, "loss": 0.0111, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7263631815907953e-06, "epoch": 4.74, "percentage": 94.75, "elapsed_time": "5:14:43", "remaining_time": "0:17:26"}
{"current_steps": 3800, "total_steps": 4000, "loss": 0.0143, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.601300650325163e-06, "epoch": 4.75, "percentage": 95.0, "elapsed_time": "5:15:32", "remaining_time": "0:16:36"}
{"current_steps": 3810, "total_steps": 4000, "loss": 0.0106, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.47623811905953e-06, "epoch": 4.76, "percentage": 95.25, "elapsed_time": "5:16:20", "remaining_time": "0:15:46"}
{"current_steps": 3820, "total_steps": 4000, "loss": 0.0103, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.351175587793897e-06, "epoch": 4.78, "percentage": 95.5, "elapsed_time": "5:17:09", "remaining_time": "0:14:56"}
{"current_steps": 3830, "total_steps": 4000, "loss": 0.0112, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.226113056528264e-06, "epoch": 4.79, "percentage": 95.75, "elapsed_time": "5:17:57", "remaining_time": "0:14:06"}
{"current_steps": 3840, "total_steps": 4000, "loss": 0.0136, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1010505252626315e-06, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "5:18:45", "remaining_time": "0:13:16"}
{"current_steps": 3850, "total_steps": 4000, "loss": 0.0143, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9759879939969986e-06, "epoch": 4.81, "percentage": 96.25, "elapsed_time": "5:19:34", "remaining_time": "0:12:27"}
{"current_steps": 3860, "total_steps": 4000, "loss": 0.0121, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8509254627313657e-06, "epoch": 4.83, "percentage": 96.5, "elapsed_time": "5:20:23", "remaining_time": "0:11:37"}
{"current_steps": 3870, "total_steps": 4000, "loss": 0.0134, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.725862931465733e-06, "epoch": 4.84, "percentage": 96.75, "elapsed_time": "5:21:11", "remaining_time": "0:10:47"}
{"current_steps": 3880, "total_steps": 4000, "loss": 0.0117, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6008004002001e-06, "epoch": 4.85, "percentage": 97.0, "elapsed_time": "5:21:58", "remaining_time": "0:09:57"}
{"current_steps": 3890, "total_steps": 4000, "loss": 0.0117, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4757378689344673e-06, "epoch": 4.86, "percentage": 97.25, "elapsed_time": "5:22:46", "remaining_time": "0:09:07"}
{"current_steps": 3900, "total_steps": 4000, "loss": 0.0104, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3506753376688344e-06, "epoch": 4.88, "percentage": 97.5, "elapsed_time": "5:23:35", "remaining_time": "0:08:17"}
{"current_steps": 3910, "total_steps": 4000, "loss": 0.0127, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2256128064032017e-06, "epoch": 4.89, "percentage": 97.75, "elapsed_time": "5:24:22", "remaining_time": "0:07:27"}
{"current_steps": 3920, "total_steps": 4000, "loss": 0.0108, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1005502751375688e-06, "epoch": 4.9, "percentage": 98.0, "elapsed_time": "5:25:10", "remaining_time": "0:06:38"}
{"current_steps": 3930, "total_steps": 4000, "loss": 0.0114, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.75487743871936e-07, "epoch": 4.91, "percentage": 98.25, "elapsed_time": "5:25:58", "remaining_time": "0:05:48"}
{"current_steps": 3940, "total_steps": 4000, "loss": 0.0103, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.504252126063032e-07, "epoch": 4.92, "percentage": 98.5, "elapsed_time": "5:26:46", "remaining_time": "0:04:58"}
{"current_steps": 3950, "total_steps": 4000, "loss": 0.0129, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.253626813406703e-07, "epoch": 4.94, "percentage": 98.75, "elapsed_time": "5:27:35", "remaining_time": "0:04:08"}
{"current_steps": 3960, "total_steps": 4000, "loss": 0.0147, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.003001500750376e-07, "epoch": 4.95, "percentage": 99.0, "elapsed_time": "5:28:23", "remaining_time": "0:03:19"}
{"current_steps": 3970, "total_steps": 4000, "loss": 0.0138, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7523761880940473e-07, "epoch": 4.96, "percentage": 99.25, "elapsed_time": "5:29:11", "remaining_time": "0:02:29"}
{"current_steps": 3980, "total_steps": 4000, "loss": 0.0121, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.501750875437719e-07, "epoch": 4.97, "percentage": 99.5, "elapsed_time": "5:29:59", "remaining_time": "0:01:39"}
{"current_steps": 3990, "total_steps": 4000, "loss": 0.0102, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2511255627813906e-07, "epoch": 4.99, "percentage": 99.75, "elapsed_time": "5:30:48", "remaining_time": "0:00:49"}
{"current_steps": 4000, "total_steps": 4000, "loss": 0.0094, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0005002501250625e-07, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "5:31:35", "remaining_time": "0:00:00"}
{"current_steps": 4000, "total_steps": 4000, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "5:31:35", "remaining_time": "0:00:00"}