HealthTeam
/

mt5-small-finetuned-MultiHead-230207-finetuned-MultiHead-230210-finetuned-MultiHead-230214

HealthTeam committed on Feb 14, 2023

Commit

e55d09d

•

1 Parent(s): 27ca8bc

Training in progress, step 44192

Browse files

Files changed (8) hide show

last-checkpoint/generation_config.json +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +144 -3
pytorch_model.bin +1 -1
runs/Feb14_18-29-07_39730b194efc/events.out.tfevents.1676399391.39730b194efc.3664.0 +2 -2

last-checkpoint/generation_config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "_from_model_config": true,
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
-  "max_length": 300,
   "pad_token_id": 0,
   "transformers_version": "4.26.1"
 }

   "_from_model_config": true,
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
+  "max_length": 1024,
   "pad_token_id": 0,
   "transformers_version": "4.26.1"
 }

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1d04c124647d72d3fc65dfa5db54a576cf67715bb9d9b3adc80890d34fcf2ec
 size 2401461253

 version https://git-lfs.github.com/spec/v1
+oid sha256:735d18dafec0eb0d88dc8f14c6729fbeaedd8e691030fc2db5b2412727e9aee7
 size 2401461253

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46eba11efcb2f8397d7585a4be3b76d5c6a48fe6fa0c51c3fd0f692262a0214c
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:34ff48fe0ad9782c0ff82a7ab7cbb2a6863c809cb138abf98a7aebec9da7688d
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:469b203b30517b41378464133ae500974ade0c5b2d4180972b0a524ae758b0fe
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:9985ba16d61e95c50d1b9cec08c60d6a3a483569fabd9a37aabc0a1c5f05bc9b
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a14d07d4b77ce7ca47e32ae34b2ecdda9856c350be4e59018afeb5af45fac27
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:932a3fd2a2c6fac0cf60b74f87ec91fc889b1355ae07661a0816ca1fa6dd613f
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9861057391925263,
-  "global_step": 33144,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -402,11 +402,152 @@
       "learning_rate": 1.3454523816607659e-05,
       "loss": 2.4452,
       "step": 33000
     }
   ],
   "max_steps": 100833,
   "num_train_epochs": 3,
-  "total_flos": 8.921229210825523e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.3148076522567016,
+  "global_step": 44192,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.3454523816607659e-05,
       "loss": 2.4452,
       "step": 33000
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 1.3355349935041108e-05,
+      "loss": 2.4438,
+      "step": 33500
+    },
+    {
+      "epoch": 1.0,
+      "eval_bleu": 16.655484084216944,
+      "eval_loss": 2.04453706741333,
+      "eval_runtime": 4558.2525,
+      "eval_samples_per_second": 8.87,
+      "eval_steps_per_second": 0.277,
+      "step": 33611
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 1.3256176053474558e-05,
+      "loss": 2.44,
+      "step": 34000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 1.3157002171908007e-05,
+      "loss": 2.4188,
+      "step": 34500
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 1.3057828290341456e-05,
+      "loss": 2.4264,
+      "step": 35000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 1.2958654408774906e-05,
+      "loss": 2.4337,
+      "step": 35500
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 1.2859480527208354e-05,
+      "loss": 2.433,
+      "step": 36000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 1.2760306645641804e-05,
+      "loss": 2.4277,
+      "step": 36500
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 1.2661132764075254e-05,
+      "loss": 2.43,
+      "step": 37000
+    },
+    {
+      "epoch": 1.12,
+      "learning_rate": 1.2561958882508702e-05,
+      "loss": 2.4343,
+      "step": 37500
+    },
+    {
+      "epoch": 1.13,
+      "learning_rate": 1.2462785000942152e-05,
+      "loss": 2.4278,
+      "step": 38000
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 1.2363611119375602e-05,
+      "loss": 2.4462,
+      "step": 38500
+    },
+    {
+      "epoch": 1.16,
+      "learning_rate": 1.2264437237809052e-05,
+      "loss": 2.4115,
+      "step": 39000
+    },
+    {
+      "epoch": 1.18,
+      "learning_rate": 1.21652633562425e-05,
+      "loss": 2.426,
+      "step": 39500
+    },
+    {
+      "epoch": 1.19,
+      "learning_rate": 1.206608947467595e-05,
+      "loss": 2.4384,
+      "step": 40000
+    },
+    {
+      "epoch": 1.2,
+      "learning_rate": 1.19669155931094e-05,
+      "loss": 2.418,
+      "step": 40500
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 1.1867741711542848e-05,
+      "loss": 2.4409,
+      "step": 41000
+    },
+    {
+      "epoch": 1.23,
+      "learning_rate": 1.1768567829976298e-05,
+      "loss": 2.4147,
+      "step": 41500
+    },
+    {
+      "epoch": 1.25,
+      "learning_rate": 1.1669393948409748e-05,
+      "loss": 2.4325,
+      "step": 42000
+    },
+    {
+      "epoch": 1.26,
+      "learning_rate": 1.1570220066843196e-05,
+      "loss": 2.4317,
+      "step": 42500
+    },
+    {
+      "epoch": 1.28,
+      "learning_rate": 1.1471046185276646e-05,
+      "loss": 2.4253,
+      "step": 43000
+    },
+    {
+      "epoch": 1.29,
+      "learning_rate": 1.1371872303710096e-05,
+      "loss": 2.4249,
+      "step": 43500
+    },
+    {
+      "epoch": 1.31,
+      "learning_rate": 1.1272698422143544e-05,
+      "loss": 2.4322,
+      "step": 44000
     }
   ],
   "max_steps": 100833,
   "num_train_epochs": 3,
+  "total_flos": 1.1901350172465562e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46eba11efcb2f8397d7585a4be3b76d5c6a48fe6fa0c51c3fd0f692262a0214c
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:34ff48fe0ad9782c0ff82a7ab7cbb2a6863c809cb138abf98a7aebec9da7688d
 size 1200739717

runs/Feb14_18-29-07_39730b194efc/events.out.tfevents.1676399391.39730b194efc.3664.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:56e2e8efcb7cc8ee42e9a2730685187108f9f744f485a7c006151d8a13539954
-size 14827

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d9dfbf22943453ae081381839560fdfbdba7c8a881a29e0a7f925e30d18ae48
+size 18672