File size: 1,510 Bytes
8509db4 7998b00 8509db4 7998b00 8509db4 7998b00 aa08ade 8509db4 7998b00 aa08ade 8509db4 7998b00 aa08ade 8509db4 7998b00 aa08ade 7998b00 8509db4 aa08ade 7998b00 8509db4 7998b00 aa08ade 7998b00 8509db4 7998b00 8509db4 7998b00 66e1cfc 8509db4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.0,
"eval_steps": 500,
"global_step": 22,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.05,
"learning_rate": 6.666666666666667e-05,
"loss": 1.1782,
"step": 1
},
{
"epoch": 0.23,
"learning_rate": 0.00019458172417006347,
"loss": 1.1528,
"step": 5
},
{
"epoch": 0.45,
"learning_rate": 0.00014016954246529696,
"loss": 1.0601,
"step": 10
},
{
"epoch": 0.68,
"learning_rate": 5.983045753470308e-05,
"loss": 1.0094,
"step": 15
},
{
"epoch": 0.91,
"learning_rate": 5.418275829936537e-06,
"loss": 1.0053,
"step": 20
},
{
"epoch": 1.0,
"eval_loss": 0.9987491965293884,
"eval_runtime": 10.4464,
"eval_samples_per_second": 14.742,
"eval_steps_per_second": 0.957,
"step": 22
},
{
"epoch": 1.0,
"step": 22,
"total_flos": 1.2907203290936115e+17,
"train_loss": 1.0528897643089294,
"train_runtime": 330.7732,
"train_samples_per_second": 4.181,
"train_steps_per_second": 0.067
}
],
"logging_steps": 5,
"max_steps": 22,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 100,
"total_flos": 1.2907203290936115e+17,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}
|