{ | |
"epoch": 0.9999558635300348, | |
"eval_accuracy": 0.4982767756352662, | |
"eval_loss": 2.483206033706665, | |
"eval_runtime": 6.8799, | |
"eval_samples": 318, | |
"eval_samples_per_second": 46.221, | |
"eval_steps_per_second": 0.436, | |
"perplexity": 11.979609949761807, | |
"total_flos": 1.9775705361382638e+20, | |
"train_loss": 2.636019475715982, | |
"train_runtime": 23008.8845, | |
"train_samples": 2900094, | |
"train_samples_per_second": 126.042, | |
"train_steps_per_second": 0.492 | |
} |