Training in progress, step 8000

Files changed (7) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5c136ff0e9cb20c7463cf837c57a825a4e61457ecc99effe498b8cec7d902776
 size 2847145157

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce02a884cff9c0c33b9ea0be5dabed04223f7b92e622f67dd75b20a294f4957c
 size 2847145157

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89e09ba7644b8ce1be54b5d151fb88c54f7af6e3f93b2834943e87018320b472
 size 1524261149

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1a06359204895a2b4ac4327b2ba9b58a11a645bfab8dc5dc5c1f33cc4c56b05
 size 1524261149

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89f2ea1099f73d4771d0adfcd2464d3b79ddc8be7baf6cb50692837d58a8a048
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:35d8ee4e99967dfddcdbfa3f701d7c423f15993ec9569b899109556fcf23f606
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:14808219b4a7001cd7bd7967362505aa479b3e57cd0120b221d6370031f10450
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8da528fd7f428de97e2b07202a1629e295196c693ae8d5d2bf4e84b9478cdc3
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.501750875437719,
-  "global_step": 7000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -146,11 +146,31 @@
       "eval_samples_per_second": 15.917,
       "eval_steps_per_second": 2.654,
       "step": 7000
     }
   ],
   "max_steps": 9995,
   "num_train_epochs": 5,
-  "total_flos": 1.980744450048e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4.00200100050025,
+  "global_step": 8000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 15.917,
       "eval_steps_per_second": 2.654,
       "step": 7000
+    },
+    {
+      "epoch": 3.75,
+      "learning_rate": 4.992496248124062e-06,
+      "loss": 2.8219,
+      "step": 7500
+    },
+    {
+      "epoch": 4.0,
+      "learning_rate": 3.991995997999e-06,
+      "loss": 2.8267,
+      "step": 8000
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 3.085977077484131,
+      "eval_runtime": 133.3062,
+      "eval_samples_per_second": 15.881,
+      "eval_steps_per_second": 2.648,
+      "step": 8000
     }
   ],
   "max_steps": 9995,
   "num_train_epochs": 5,
+  "total_flos": 2.263707942912e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89e09ba7644b8ce1be54b5d151fb88c54f7af6e3f93b2834943e87018320b472
 size 1524261149

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1a06359204895a2b4ac4327b2ba9b58a11a645bfab8dc5dc5c1f33cc4c56b05
 size 1524261149

runs/Mar25_07-47-44_6e686009e3a0/events.out.tfevents.1679730482.6e686009e3a0.183.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:187a073febbce9d08c947a3283b5e8e473950f162a4dbd8c354fd7f957611812
-size 4813

 version https://git-lfs.github.com/spec/v1
+oid sha256:98d16bcaeb6710ed70950d0fec4cd75f9d753b93f3c01047572a1c783a9b6d19
+size 5398