File size: 1,510 Bytes
8509db4
 
 
 
 
7998b00
8509db4
 
 
 
 
7998b00
 
 
8509db4
 
 
7998b00
 
aa08ade
8509db4
 
 
7998b00
 
aa08ade
8509db4
 
 
7998b00
 
aa08ade
8509db4
 
7998b00
 
 
aa08ade
7998b00
 
8509db4
 
aa08ade
 
 
 
7998b00
8509db4
 
 
7998b00
 
aa08ade
 
 
7998b00
8509db4
 
 
7998b00
8509db4
 
 
7998b00
66e1cfc
8509db4
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 1.0,
  "eval_steps": 500,
  "global_step": 22,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.05,
      "learning_rate": 6.666666666666667e-05,
      "loss": 1.1782,
      "step": 1
    },
    {
      "epoch": 0.23,
      "learning_rate": 0.00019458172417006347,
      "loss": 1.1528,
      "step": 5
    },
    {
      "epoch": 0.45,
      "learning_rate": 0.00014016954246529696,
      "loss": 1.0601,
      "step": 10
    },
    {
      "epoch": 0.68,
      "learning_rate": 5.983045753470308e-05,
      "loss": 1.0094,
      "step": 15
    },
    {
      "epoch": 0.91,
      "learning_rate": 5.418275829936537e-06,
      "loss": 1.0053,
      "step": 20
    },
    {
      "epoch": 1.0,
      "eval_loss": 0.9987491965293884,
      "eval_runtime": 10.4464,
      "eval_samples_per_second": 14.742,
      "eval_steps_per_second": 0.957,
      "step": 22
    },
    {
      "epoch": 1.0,
      "step": 22,
      "total_flos": 1.2907203290936115e+17,
      "train_loss": 1.0528897643089294,
      "train_runtime": 330.7732,
      "train_samples_per_second": 4.181,
      "train_steps_per_second": 0.067
    }
  ],
  "logging_steps": 5,
  "max_steps": 22,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 100,
  "total_flos": 1.2907203290936115e+17,
  "train_batch_size": 32,
  "trial_name": null,
  "trial_params": null
}