longt5_xl_sfd_memsum_30 / all_results.json
learn3r's picture
End of training
68d715b verified
{
"epoch": 29.22,
"eval_loss": 5.132218360900879,
"eval_runtime": 14.2345,
"eval_samples": 338,
"eval_samples_per_second": 23.745,
"eval_steps_per_second": 3.021,
"train_loss": 0.5600467140298514,
"train_runtime": 18789.4517,
"train_samples": 3673,
"train_samples_per_second": 5.864,
"train_steps_per_second": 0.022
}