{ | |
"epoch": 0.9999558635300348, | |
"eval_accuracy": 0.5114566774944134, | |
"eval_loss": 2.3657422065734863, | |
"eval_runtime": 6.976, | |
"eval_samples": 318, | |
"eval_samples_per_second": 45.585, | |
"eval_steps_per_second": 0.43, | |
"perplexity": 10.651941825558275, | |
"total_flos": 2.202782600225295e+20, | |
"train_loss": 2.520355888510828, | |
"train_runtime": 24592.232, | |
"train_samples": 2900094, | |
"train_samples_per_second": 117.927, | |
"train_steps_per_second": 0.461 | |
} |