Dmitriy007
commited on
Commit
•
b38615c
1
Parent(s):
0dfc9d5
Training in progress, step 14000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +23 -3
- pytorch_model.bin +1 -1
- runs/Mar21_22-11-09_493485ec0ec3/events.out.tfevents.1679436700.493485ec0ec3.312.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2847145157
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a6059da0754c3f17d7b81253296560efa12f0d685a2c0911aa4fd5935bf2af4
|
3 |
size 2847145157
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88287f1f90b5ae42a8b989aa8afbb43dc5e525cfb096255ee7d9d1f34294e5e9
|
3 |
size 1524261149
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7d5ebe29bda3aea662c901096bf015abd470cd995bf114bbd127dda875bb86d
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:011be71b07f286a4bba8ba4eb6190e0fe248d987c19e0913a71c4dd7aa7c7cbb
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 3.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -266,11 +266,31 @@
|
|
266 |
"eval_samples_per_second": 14.744,
|
267 |
"eval_steps_per_second": 4.917,
|
268 |
"step": 13000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
269 |
}
|
270 |
],
|
271 |
"max_steps": 19990,
|
272 |
"num_train_epochs": 5,
|
273 |
-
"total_flos": 1.
|
274 |
"trial_name": null,
|
275 |
"trial_params": null
|
276 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.501750875437719,
|
5 |
+
"global_step": 14000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
266 |
"eval_samples_per_second": 14.744,
|
267 |
"eval_steps_per_second": 4.917,
|
268 |
"step": 13000
|
269 |
+
},
|
270 |
+
{
|
271 |
+
"epoch": 3.38,
|
272 |
+
"learning_rate": 6.493246623311657e-06,
|
273 |
+
"loss": 2.5079,
|
274 |
+
"step": 13500
|
275 |
+
},
|
276 |
+
{
|
277 |
+
"epoch": 3.5,
|
278 |
+
"learning_rate": 5.992996498249125e-06,
|
279 |
+
"loss": 2.535,
|
280 |
+
"step": 14000
|
281 |
+
},
|
282 |
+
{
|
283 |
+
"epoch": 3.5,
|
284 |
+
"eval_loss": 3.154937267303467,
|
285 |
+
"eval_runtime": 143.3545,
|
286 |
+
"eval_samples_per_second": 14.768,
|
287 |
+
"eval_steps_per_second": 4.925,
|
288 |
+
"step": 14000
|
289 |
}
|
290 |
],
|
291 |
"max_steps": 19990,
|
292 |
"num_train_epochs": 5,
|
293 |
+
"total_flos": 1.980744450048e+16,
|
294 |
"trial_name": null,
|
295 |
"trial_params": null
|
296 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88287f1f90b5ae42a8b989aa8afbb43dc5e525cfb096255ee7d9d1f34294e5e9
|
3 |
size 1524261149
|
runs/Mar21_22-11-09_493485ec0ec3/events.out.tfevents.1679436700.493485ec0ec3.312.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:828c9f35897ab8c1d539a901d22a2d7a6c2175f79660c815eaae302d4f745dec
|
3 |
+
size 6552
|