diogopaes10 committed on
Commit
8eb03d2
•
1 Parent(s): 11288fe

Training in progress, epoch 13

Browse files
Files changed (26) hide show
  1. {checkpoint-2000 → checkpoint-3000}/added_tokens.json +0 -0
  2. {checkpoint-2000 → checkpoint-3000}/config.json +0 -0
  3. {checkpoint-2000 → checkpoint-3000}/optimizer.pt +1 -1
  4. {checkpoint-2250 → checkpoint-3000}/pytorch_model.bin +1 -1
  5. {checkpoint-2250 → checkpoint-3000}/rng_state.pth +1 -1
  6. {checkpoint-2250 → checkpoint-3000}/scheduler.pt +1 -1
  7. {checkpoint-2000 → checkpoint-3000}/special_tokens_map.json +0 -0
  8. {checkpoint-2000 → checkpoint-3000}/spm.model +0 -0
  9. {checkpoint-2000 → checkpoint-3000}/tokenizer.json +0 -0
  10. {checkpoint-2000 → checkpoint-3000}/tokenizer_config.json +0 -0
  11. {checkpoint-2250 → checkpoint-3000}/trainer_state.json +107 -3
  12. {checkpoint-2000 → checkpoint-3000}/training_args.bin +0 -0
  13. {checkpoint-2250 → checkpoint-3250}/added_tokens.json +0 -0
  14. {checkpoint-2250 → checkpoint-3250}/config.json +0 -0
  15. {checkpoint-2250 → checkpoint-3250}/optimizer.pt +1 -1
  16. {checkpoint-2000 → checkpoint-3250}/pytorch_model.bin +1 -1
  17. {checkpoint-2000 → checkpoint-3250}/rng_state.pth +1 -1
  18. {checkpoint-2000 → checkpoint-3250}/scheduler.pt +1 -1
  19. {checkpoint-2250 → checkpoint-3250}/special_tokens_map.json +0 -0
  20. {checkpoint-2250 → checkpoint-3250}/spm.model +0 -0
  21. {checkpoint-2250 → checkpoint-3250}/tokenizer.json +0 -0
  22. {checkpoint-2250 → checkpoint-3250}/tokenizer_config.json +0 -0
  23. {checkpoint-2000 → checkpoint-3250}/trainer_state.json +185 -3
  24. {checkpoint-2250 → checkpoint-3250}/training_args.bin +0 -0
  25. pytorch_model.bin +1 -1
  26. runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690060770.ab4276e44fca.659.0 +2 -2
{checkpoint-2000 → checkpoint-3000}/added_tokens.json RENAMED
File without changes
{checkpoint-2000 → checkpoint-3000}/config.json RENAMED
File without changes
{checkpoint-2000 → checkpoint-3000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81f3216586a58d2085a7f37ca95117d6c10fbcd3dc9c70f034b94e35fd6e9149
3
  size 1475557125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a06836e74e2ee556f75e4f728cb07fd38bf7dca4688b3915aab2696b9adac99
3
  size 1475557125
{checkpoint-2250 → checkpoint-3000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:627070829ce397286a4c2e3016e3ade6fbe191d90b64283878e08c51320b3b27
3
  size 737788917
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c95f2d92d432e839ff645f87515fc248494db36dac837cae703842d2cbf775e5
3
  size 737788917
{checkpoint-2250 → checkpoint-3000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5e45bb5a3782239e1b011180d84487acde3e428af09ac96bbf315bcb54dd611
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30675d1e37d339cae6e3dc477927b70e39062f0910613a7d90db6c1671bca5bc
3
  size 14575
{checkpoint-2250 → checkpoint-3000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a4113c70550b7a4ade899ac1f4a91272bb6bdc8dc785c5c4e5e342583232813
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68cbe85bad4e57d93e8caf9830d7003e889867d2bc1bdf97b16703437df161a3
3
  size 627
{checkpoint-2000 → checkpoint-3000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-2000 → checkpoint-3000}/spm.model RENAMED
File without changes
{checkpoint-2000 → checkpoint-3000}/tokenizer.json RENAMED
File without changes
{checkpoint-2000 → checkpoint-3000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-2250 → checkpoint-3000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 9.0,
5
- "global_step": 2250,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -298,11 +298,115 @@
298
  "eval_system_ram_total": 83.48074722290039,
299
  "eval_system_ram_used": 4.219398498535156,
300
  "step": 2068
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
301
  }
302
  ],
303
  "max_steps": 3750,
304
  "num_train_epochs": 15,
305
- "total_flos": 4334831263537536.0,
306
  "trial_name": null,
307
  "trial_params": null
308
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 12.0,
5
+ "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
298
  "eval_system_ram_total": 83.48074722290039,
299
  "eval_system_ram_used": 4.219398498535156,
300
  "step": 2068
301
+ },
302
+ {
303
+ "epoch": 9.02,
304
+ "learning_rate": 7.978666666666667e-06,
305
+ "loss": 0.1505,
306
+ "step": 2256
307
+ },
308
+ {
309
+ "epoch": 9.02,
310
+ "eval_accuracy": 0.7075,
311
+ "eval_disk_space_total": 78.1898422241211,
312
+ "eval_disk_space_used": 35.827659606933594,
313
+ "eval_f1": 0.709341703450241,
314
+ "eval_gpu_ram_allocated": 2.0897817611694336,
315
+ "eval_gpu_ram_cached": 25.85546875,
316
+ "eval_gpu_ram_total": 39.56402587890625,
317
+ "eval_gpu_utilization": 48,
318
+ "eval_loss": 1.4310206174850464,
319
+ "eval_precision": 0.7133423622104005,
320
+ "eval_recall": 0.7075,
321
+ "eval_runtime": 2.4471,
322
+ "eval_samples_per_second": 817.29,
323
+ "eval_steps_per_second": 25.745,
324
+ "eval_system_ram_total": 83.48074722290039,
325
+ "eval_system_ram_used": 4.2417755126953125,
326
+ "step": 2256
327
+ },
328
+ {
329
+ "epoch": 9.78,
330
+ "learning_rate": 6.976000000000001e-06,
331
+ "loss": 0.1132,
332
+ "step": 2444
333
+ },
334
+ {
335
+ "epoch": 9.78,
336
+ "eval_accuracy": 0.7045,
337
+ "eval_disk_space_total": 78.1898422241211,
338
+ "eval_disk_space_used": 35.827754974365234,
339
+ "eval_f1": 0.705265213679387,
340
+ "eval_gpu_ram_allocated": 2.089801788330078,
341
+ "eval_gpu_ram_cached": 25.85546875,
342
+ "eval_gpu_ram_total": 39.56402587890625,
343
+ "eval_gpu_utilization": 48,
344
+ "eval_loss": 1.5454399585723877,
345
+ "eval_precision": 0.7097494768850874,
346
+ "eval_recall": 0.7045,
347
+ "eval_runtime": 2.5035,
348
+ "eval_samples_per_second": 798.873,
349
+ "eval_steps_per_second": 25.165,
350
+ "eval_system_ram_total": 83.48074722290039,
351
+ "eval_system_ram_used": 4.293117523193359,
352
+ "step": 2444
353
+ },
354
+ {
355
+ "epoch": 10.53,
356
+ "learning_rate": 5.973333333333334e-06,
357
+ "loss": 0.0979,
358
+ "step": 2632
359
+ },
360
+ {
361
+ "epoch": 10.53,
362
+ "eval_accuracy": 0.708,
363
+ "eval_disk_space_total": 78.1898422241211,
364
+ "eval_disk_space_used": 35.82805252075195,
365
+ "eval_f1": 0.7090322597492875,
366
+ "eval_gpu_ram_allocated": 2.089801788330078,
367
+ "eval_gpu_ram_cached": 25.85546875,
368
+ "eval_gpu_ram_total": 39.56402587890625,
369
+ "eval_gpu_utilization": 45,
370
+ "eval_loss": 1.64204740524292,
371
+ "eval_precision": 0.7171054872018443,
372
+ "eval_recall": 0.708,
373
+ "eval_runtime": 2.5339,
374
+ "eval_samples_per_second": 789.29,
375
+ "eval_steps_per_second": 24.863,
376
+ "eval_system_ram_total": 83.48074722290039,
377
+ "eval_system_ram_used": 4.279300689697266,
378
+ "step": 2632
379
+ },
380
+ {
381
+ "epoch": 11.28,
382
+ "learning_rate": 4.976e-06,
383
+ "loss": 0.0818,
384
+ "step": 2820
385
+ },
386
+ {
387
+ "epoch": 11.28,
388
+ "eval_accuracy": 0.7065,
389
+ "eval_disk_space_total": 78.1898422241211,
390
+ "eval_disk_space_used": 35.828128814697266,
391
+ "eval_f1": 0.706242034421972,
392
+ "eval_gpu_ram_allocated": 2.0898447036743164,
393
+ "eval_gpu_ram_cached": 25.85546875,
394
+ "eval_gpu_ram_total": 39.56402587890625,
395
+ "eval_gpu_utilization": 49,
396
+ "eval_loss": 1.686875820159912,
397
+ "eval_precision": 0.7102028476355108,
398
+ "eval_recall": 0.7065,
399
+ "eval_runtime": 2.4408,
400
+ "eval_samples_per_second": 819.396,
401
+ "eval_steps_per_second": 25.811,
402
+ "eval_system_ram_total": 83.48074722290039,
403
+ "eval_system_ram_used": 4.2822418212890625,
404
+ "step": 2820
405
  }
406
  ],
407
  "max_steps": 3750,
408
  "num_train_epochs": 15,
409
+ "total_flos": 5780526048262272.0,
410
  "trial_name": null,
411
  "trial_params": null
412
  }
{checkpoint-2000 → checkpoint-3000}/training_args.bin RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/added_tokens.json RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/config.json RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d092da6a86e9d3fddf667c0e8cc73377daca3a3d8630e425531f34eb77545eea
3
  size 1475557125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f17eacaf5376c0fabb8aeff03d05e59319e7a180e3c00d273c966e5a26d33f06
3
  size 1475557125
{checkpoint-2000 → checkpoint-3250}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b71e7c7798b6760f8be8c551b4e8951ebe3dfa93da41d1460b9cb33fd0d6f86
3
  size 737788917
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab87f1854f930634513326e51246eb456af5e9a20373ec512925553c65de13d4
3
  size 737788917
{checkpoint-2000 → checkpoint-3250}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96ffa685fc4010a50b57e506b086e0167e48b18c5d9de223e06893b4aa16c22a
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9318169f07f11cd9456a08a8554cc70b98429bd8764cb326d58f8d40bc05005
3
  size 14575
{checkpoint-2000 → checkpoint-3250}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:626c1ac2df61838775a74a9749f04b4d515724a3ccd7da9a914227a50ae26d2d
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b6692caff16315b18091d72ba55872cc98f8a135dd4601d0a933fafdf6b6bcd
3
  size 627
{checkpoint-2250 → checkpoint-3250}/special_tokens_map.json RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/spm.model RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/tokenizer.json RENAMED
File without changes
{checkpoint-2250 → checkpoint-3250}/tokenizer_config.json RENAMED
File without changes
{checkpoint-2000 → checkpoint-3250}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 8.0,
5
- "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -272,11 +272,193 @@
272
  "eval_system_ram_total": 83.48074722290039,
273
  "eval_system_ram_used": 4.224781036376953,
274
  "step": 1880
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
275
  }
276
  ],
277
  "max_steps": 3750,
278
  "num_train_epochs": 15,
279
- "total_flos": 3850219425648384.0,
280
  "trial_name": null,
281
  "trial_params": null
282
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 13.0,
5
+ "global_step": 3250,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
272
  "eval_system_ram_total": 83.48074722290039,
273
  "eval_system_ram_used": 4.224781036376953,
274
  "step": 1880
275
+ },
276
+ {
277
+ "epoch": 8.27,
278
+ "learning_rate": 8.981333333333333e-06,
279
+ "loss": 0.197,
280
+ "step": 2068
281
+ },
282
+ {
283
+ "epoch": 8.27,
284
+ "eval_accuracy": 0.712,
285
+ "eval_disk_space_total": 78.1898422241211,
286
+ "eval_disk_space_used": 33.7657470703125,
287
+ "eval_f1": 0.7097931257647566,
288
+ "eval_gpu_ram_allocated": 2.0897903442382812,
289
+ "eval_gpu_ram_cached": 25.85546875,
290
+ "eval_gpu_ram_total": 39.56402587890625,
291
+ "eval_gpu_utilization": 45,
292
+ "eval_loss": 1.3960117101669312,
293
+ "eval_precision": 0.7137187449926237,
294
+ "eval_recall": 0.712,
295
+ "eval_runtime": 2.3878,
296
+ "eval_samples_per_second": 837.604,
297
+ "eval_steps_per_second": 26.385,
298
+ "eval_system_ram_total": 83.48074722290039,
299
+ "eval_system_ram_used": 4.219398498535156,
300
+ "step": 2068
301
+ },
302
+ {
303
+ "epoch": 9.02,
304
+ "learning_rate": 7.978666666666667e-06,
305
+ "loss": 0.1505,
306
+ "step": 2256
307
+ },
308
+ {
309
+ "epoch": 9.02,
310
+ "eval_accuracy": 0.7075,
311
+ "eval_disk_space_total": 78.1898422241211,
312
+ "eval_disk_space_used": 35.827659606933594,
313
+ "eval_f1": 0.709341703450241,
314
+ "eval_gpu_ram_allocated": 2.0897817611694336,
315
+ "eval_gpu_ram_cached": 25.85546875,
316
+ "eval_gpu_ram_total": 39.56402587890625,
317
+ "eval_gpu_utilization": 48,
318
+ "eval_loss": 1.4310206174850464,
319
+ "eval_precision": 0.7133423622104005,
320
+ "eval_recall": 0.7075,
321
+ "eval_runtime": 2.4471,
322
+ "eval_samples_per_second": 817.29,
323
+ "eval_steps_per_second": 25.745,
324
+ "eval_system_ram_total": 83.48074722290039,
325
+ "eval_system_ram_used": 4.2417755126953125,
326
+ "step": 2256
327
+ },
328
+ {
329
+ "epoch": 9.78,
330
+ "learning_rate": 6.976000000000001e-06,
331
+ "loss": 0.1132,
332
+ "step": 2444
333
+ },
334
+ {
335
+ "epoch": 9.78,
336
+ "eval_accuracy": 0.7045,
337
+ "eval_disk_space_total": 78.1898422241211,
338
+ "eval_disk_space_used": 35.827754974365234,
339
+ "eval_f1": 0.705265213679387,
340
+ "eval_gpu_ram_allocated": 2.089801788330078,
341
+ "eval_gpu_ram_cached": 25.85546875,
342
+ "eval_gpu_ram_total": 39.56402587890625,
343
+ "eval_gpu_utilization": 48,
344
+ "eval_loss": 1.5454399585723877,
345
+ "eval_precision": 0.7097494768850874,
346
+ "eval_recall": 0.7045,
347
+ "eval_runtime": 2.5035,
348
+ "eval_samples_per_second": 798.873,
349
+ "eval_steps_per_second": 25.165,
350
+ "eval_system_ram_total": 83.48074722290039,
351
+ "eval_system_ram_used": 4.293117523193359,
352
+ "step": 2444
353
+ },
354
+ {
355
+ "epoch": 10.53,
356
+ "learning_rate": 5.973333333333334e-06,
357
+ "loss": 0.0979,
358
+ "step": 2632
359
+ },
360
+ {
361
+ "epoch": 10.53,
362
+ "eval_accuracy": 0.708,
363
+ "eval_disk_space_total": 78.1898422241211,
364
+ "eval_disk_space_used": 35.82805252075195,
365
+ "eval_f1": 0.7090322597492875,
366
+ "eval_gpu_ram_allocated": 2.089801788330078,
367
+ "eval_gpu_ram_cached": 25.85546875,
368
+ "eval_gpu_ram_total": 39.56402587890625,
369
+ "eval_gpu_utilization": 45,
370
+ "eval_loss": 1.64204740524292,
371
+ "eval_precision": 0.7171054872018443,
372
+ "eval_recall": 0.708,
373
+ "eval_runtime": 2.5339,
374
+ "eval_samples_per_second": 789.29,
375
+ "eval_steps_per_second": 24.863,
376
+ "eval_system_ram_total": 83.48074722290039,
377
+ "eval_system_ram_used": 4.279300689697266,
378
+ "step": 2632
379
+ },
380
+ {
381
+ "epoch": 11.28,
382
+ "learning_rate": 4.976e-06,
383
+ "loss": 0.0818,
384
+ "step": 2820
385
+ },
386
+ {
387
+ "epoch": 11.28,
388
+ "eval_accuracy": 0.7065,
389
+ "eval_disk_space_total": 78.1898422241211,
390
+ "eval_disk_space_used": 35.828128814697266,
391
+ "eval_f1": 0.706242034421972,
392
+ "eval_gpu_ram_allocated": 2.0898447036743164,
393
+ "eval_gpu_ram_cached": 25.85546875,
394
+ "eval_gpu_ram_total": 39.56402587890625,
395
+ "eval_gpu_utilization": 49,
396
+ "eval_loss": 1.686875820159912,
397
+ "eval_precision": 0.7102028476355108,
398
+ "eval_recall": 0.7065,
399
+ "eval_runtime": 2.4408,
400
+ "eval_samples_per_second": 819.396,
401
+ "eval_steps_per_second": 25.811,
402
+ "eval_system_ram_total": 83.48074722290039,
403
+ "eval_system_ram_used": 4.2822418212890625,
404
+ "step": 2820
405
+ },
406
+ {
407
+ "epoch": 12.03,
408
+ "learning_rate": 3.973333333333333e-06,
409
+ "loss": 0.062,
410
+ "step": 3008
411
+ },
412
+ {
413
+ "epoch": 12.03,
414
+ "eval_accuracy": 0.701,
415
+ "eval_disk_space_total": 78.1898422241211,
416
+ "eval_disk_space_used": 35.82817459106445,
417
+ "eval_f1": 0.704316965060789,
418
+ "eval_gpu_ram_allocated": 2.0900821685791016,
419
+ "eval_gpu_ram_cached": 25.85546875,
420
+ "eval_gpu_ram_total": 39.56402587890625,
421
+ "eval_gpu_utilization": 50,
422
+ "eval_loss": 1.781833291053772,
423
+ "eval_precision": 0.7122852239266858,
424
+ "eval_recall": 0.701,
425
+ "eval_runtime": 2.3858,
426
+ "eval_samples_per_second": 838.291,
427
+ "eval_steps_per_second": 26.406,
428
+ "eval_system_ram_total": 83.48074722290039,
429
+ "eval_system_ram_used": 4.286445617675781,
430
+ "step": 3008
431
+ },
432
+ {
433
+ "epoch": 12.78,
434
+ "learning_rate": 2.970666666666667e-06,
435
+ "loss": 0.0433,
436
+ "step": 3196
437
+ },
438
+ {
439
+ "epoch": 12.78,
440
+ "eval_accuracy": 0.707,
441
+ "eval_disk_space_total": 78.1898422241211,
442
+ "eval_disk_space_used": 35.82823181152344,
443
+ "eval_f1": 0.70799964440731,
444
+ "eval_gpu_ram_allocated": 2.089794635772705,
445
+ "eval_gpu_ram_cached": 25.85546875,
446
+ "eval_gpu_ram_total": 39.56402587890625,
447
+ "eval_gpu_utilization": 49,
448
+ "eval_loss": 1.7981120347976685,
449
+ "eval_precision": 0.7109713384315803,
450
+ "eval_recall": 0.707,
451
+ "eval_runtime": 2.4151,
452
+ "eval_samples_per_second": 828.137,
453
+ "eval_steps_per_second": 26.086,
454
+ "eval_system_ram_total": 83.48074722290039,
455
+ "eval_system_ram_used": 4.266563415527344,
456
+ "step": 3196
457
  }
458
  ],
459
  "max_steps": 3750,
460
  "num_train_epochs": 15,
461
+ "total_flos": 6259743625357056.0,
462
  "trial_name": null,
463
  "trial_params": null
464
  }
{checkpoint-2250 → checkpoint-3250}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:627070829ce397286a4c2e3016e3ade6fbe191d90b64283878e08c51320b3b27
3
  size 737788917
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab87f1854f930634513326e51246eb456af5e9a20373ec512925553c65de13d4
3
  size 737788917
runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690060770.ab4276e44fca.659.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9480f7c1ae50fb4afe8f904897ca584d0ecad3a73621bc2257b9e47e566bf68b
3
- size 17242
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0676d7575783045c7b0b81b3dac8f9748e1362dd10f8ada9768f991e63e7691
3
+ size 23854