Training in progress, step 200000

Browse files

Files changed (9) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +123 -3
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
training_args.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bdf19b8ac1ef38105671f7e3ed466178582ff690b2e4244bda799fabd849a44a
 size 893439185

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e4e20c1ef2ac6843c886418e98a47bae638ea7d617febd310a65b1910a8f8e4
 size 893439185

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:34cdc450f36015ade18e6cf8d347ba98eed346e9fca052902560b578799df39f
 size 449471589

 version https://git-lfs.github.com/spec/v1
+oid sha256:65fa8e0f8a447fcc5954aa678e61448bcfe8f8387d2caed08d0f1179f60750d7
 size 449471589

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e2a05b33f27bc07e845ac5ddf394e12d5aa9e01cff4a464ac84d19c70049e32
 size 15587

 version https://git-lfs.github.com/spec/v1
+oid sha256:fc8cc6cb0c14f159f66977ee3dfa2ab864df7c0e19869ebf5c6d7b0393c02b8d
 size 15587

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09ac2f6b5dab3c2f241653e24158eb8e5933ba687a501a1fa916c1b82a746b90
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0c7a6adc45a0eea76cb785076f51f02ab2ddc692d12cb942437e9bf8e23bc08
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2639f53746eae2335e88ed02acce8977dcbe3ece7ab8cbccde5b25d715fd5406
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:de21128fb4d2d9fbd6335f650a62e3e1299cfe449b8f64957937f253cda36cc0
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.2,
-  "global_step": 190000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2446,11 +2446,131 @@
       "learning_rate": 1.0566893240808188e-05,
       "loss": 0.3743,
       "step": 190000
     }
   ],
   "max_steps": 200000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 4.4743682799304704e+21,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.05,
+  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.0566893240808188e-05,
       "loss": 0.3743,
       "step": 190000
+    },
+    {
+      "epoch": 0.0,
+      "learning_rate": 1.0512109659997981e-05,
+      "loss": 0.3673,
+      "step": 190500
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 1.0460094397410629e-05,
+      "loss": 0.3658,
+      "step": 191000
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 1.041085066159254e-05,
+      "loss": 0.3661,
+      "step": 191500
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 1.036447165752325e-05,
+      "loss": 0.3648,
+      "step": 192000
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 1.03207743592438e-05,
+      "loss": 0.3649,
+      "step": 192500
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 1.0279936239738395e-05,
+      "loss": 0.3645,
+      "step": 193000
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 1.0241796139099991e-05,
+      "loss": 0.3646,
+      "step": 193500
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 1.0206441030895691e-05,
+      "loss": 0.3652,
+      "step": 194000
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 1.0173873095995124e-05,
+      "loss": 0.3659,
+      "step": 194500
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 1.0144094343341912e-05,
+      "loss": 0.3645,
+      "step": 195000
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 1.011715779872454e-05,
+      "loss": 0.3676,
+      "step": 195500
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 1.0092957162169376e-05,
+      "loss": 0.3673,
+      "step": 196000
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 1.0071550699137517e-05,
+      "loss": 0.3674,
+      "step": 196500
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 1.0052939730080435e-05,
+      "loss": 0.3678,
+      "step": 197000
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 1.0037125403010368e-05,
+      "loss": 0.3688,
+      "step": 197500
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 1.0024108693429497e-05,
+      "loss": 0.3676,
+      "step": 198000
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 1.0013890404269793e-05,
+      "loss": 0.3685,
+      "step": 198500
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 1.0006471165843453e-05,
+      "loss": 0.3664,
+      "step": 199000
+    },
+    {
+      "epoch": 0.05,
+      "learning_rate": 1.000185143580406e-05,
+      "loss": 0.3678,
+      "step": 199500
+    },
+    {
+      "epoch": 0.05,
+      "learning_rate": 1.0000031499118314e-05,
+      "loss": 0.3682,
+      "step": 200000
     }
   ],
   "max_steps": 200000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 4.709861347295232e+21,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:818b7ad8f2aec69753e6ae13a5e403ef3686da3a5de695a9abc49d9951fcd73b
 size 5551

 version https://git-lfs.github.com/spec/v1
+oid sha256:53c18b4efeb50055b9df3de46e48e5ef92c97dea961e5c1e8f4076e024c3c1db
 size 5551

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:34cdc450f36015ade18e6cf8d347ba98eed346e9fca052902560b578799df39f
 size 449471589

 version https://git-lfs.github.com/spec/v1
+oid sha256:65fa8e0f8a447fcc5954aa678e61448bcfe8f8387d2caed08d0f1179f60750d7
 size 449471589

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:818b7ad8f2aec69753e6ae13a5e403ef3686da3a5de695a9abc49d9951fcd73b
 size 5551

 version https://git-lfs.github.com/spec/v1
+oid sha256:53c18b4efeb50055b9df3de46e48e5ef92c97dea961e5c1e8f4076e024c3c1db
 size 5551