{ "epoch": 3.0, "eval_accuracy": 0.8990638351115062, "eval_loss": 0.4193418025970459, "eval_runtime": 3750.3751, "eval_samples": 600753, "eval_samples_per_second": 160.185, "eval_steps_per_second": 5.006, "perplexity": 1.5209601340780117, "total_flos": 8.947355434270848e+18, "train_loss": 0.5702250743976136, "train_runtime": 431071.4094, "train_samples": 11319535, "train_samples_per_second": 78.777, "train_steps_per_second": 2.462 }