{
    "epoch": 0.9999558635300348,
    "eval_accuracy": 0.5028267330154123,
    "eval_loss": 2.4378154277801514,
    "eval_runtime": 6.9896,
    "eval_samples": 318,
    "eval_samples_per_second": 45.496,
    "eval_steps_per_second": 0.429,
    "perplexity": 11.448004413502517,
    "total_flos": 1.9775705361382638e+20,
    "train_loss": 2.5878285095516573,
    "train_runtime": 23032.3399,
    "train_samples": 2900094,
    "train_samples_per_second": 125.914,
    "train_steps_per_second": 0.492
}