adamjweintraut committed on
Commit
e7b6293
1 Parent(s): ece8ddb

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/generation_config.json CHANGED
@@ -1,13 +1,24 @@
1
  {
2
- "_from_model_config": true,
3
  "bos_token_id": 0,
 
4
  "decoder_start_token_id": 2,
 
5
  "early_stopping": true,
6
  "eos_token_id": 2,
7
  "forced_bos_token_id": 0,
8
  "forced_eos_token_id": 2,
9
- "no_repeat_ngram_size": 3,
 
 
10
  "num_beams": 4,
11
- "pad_token_id": 1,
12
- "transformers_version": "4.38.2"
 
 
 
 
 
 
 
 
13
  }
 
1
  {
 
2
  "bos_token_id": 0,
3
+ "clean_up_tokenization_spaces": true,
4
  "decoder_start_token_id": 2,
5
+ "do_sample": true,
6
  "early_stopping": true,
7
  "eos_token_id": 2,
8
  "forced_bos_token_id": 0,
9
  "forced_eos_token_id": 2,
10
+ "max_new_tokens": 64,
11
+ "n_examples": null,
12
+ "no_repeat_ngram_size": 2,
13
  "num_beams": 4,
14
+ "pad_to_max_length": true,
15
+ "pad_token_id": 2,
16
+ "padding": "max_length",
17
+ "renormalize_logits": true,
18
+ "skip_special_tokens": true,
19
+ "temperature": 0.85,
20
+ "top_k": 0,
21
+ "top_p": 0.9,
22
+ "transformers_version": "4.38.2",
23
+ "truncation": true
24
  }
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:659581b09e5435748aa277550674f0f183b697f5746c508d9651061cf462dbdc
3
  size 1625545896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ba30ac64371eeec3bd9f7d0012d18ad31fd4368aa5d5c706726544da918373
3
  size 1625545896
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f8c99e5062570ad4317ac2151da95c1bd97ba41c7778e5f6b3e94ba9039c805
3
  size 3250997519
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3511177efc1c7eb3119fc64d63abdc1a1ca2b56b0204fccca0ec090d4b49e3b7
3
  size 3250997519
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16834af344003484ce1ba6dc7abd13a4095886a927379926cec2957d37a23fe9
3
  size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36c96bc430eb6a2b1f5305099d0805f117cad183edcf598d7c9e7eefabcd26d1
3
  size 14308
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd5799947fee402d2d731ff73eaff922e4f5de0fe21f2d43fabaefdb89f537da
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1474d57875cd322d43d7b30e8e912f7e2d36108fe51ad2985da2b427239c760
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,42 +1,72 @@
1
  {
2
- "best_metric": 0.4577435553073883,
3
- "best_model_checkpoint": "/content/drive/MyDrive/W210 Capstone - Lyric Generation with Melody/loaf/models/kwsylgen/bart/bart-finetuned-kwsylgen-64/checkpoint-1000",
4
- "epoch": 0.6954102920723226,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.35,
13
- "grad_norm": 0.605933427810669,
14
  "learning_rate": 4.5679763560500696e-05,
15
- "loss": 0.476,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.35,
20
- "eval_loss": 0.4631631374359131,
21
- "eval_runtime": 98.3831,
22
- "eval_samples_per_second": 129.128,
23
- "eval_steps_per_second": 2.023,
24
  "step": 500
25
  },
26
  {
27
  "epoch": 0.7,
28
- "grad_norm": 0.46590879559516907,
29
  "learning_rate": 4.133344923504868e-05,
30
- "loss": 0.3918,
31
  "step": 1000
32
  },
33
  {
34
  "epoch": 0.7,
35
- "eval_loss": 0.4577435553073883,
36
- "eval_runtime": 102.7478,
37
- "eval_samples_per_second": 123.643,
38
- "eval_steps_per_second": 1.937,
39
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 500,
@@ -44,7 +74,7 @@
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 4,
46
  "save_steps": 500,
47
- "total_flos": 8668418408448000.0,
48
  "train_batch_size": 64,
49
  "trial_name": null,
50
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.45656052231788635,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/W210 Capstone - Lyric Generation with Melody/loaf/models/kwsylgen/bart/bart-finetuned-kwsylgen-64/checkpoint-2000",
4
+ "epoch": 1.3908205841446453,
5
  "eval_steps": 500,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.35,
13
+ "grad_norm": 0.5149683952331543,
14
  "learning_rate": 4.5679763560500696e-05,
15
+ "loss": 0.4749,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.35,
20
+ "eval_loss": 0.4616529643535614,
21
+ "eval_runtime": 93.1578,
22
+ "eval_samples_per_second": 136.371,
23
+ "eval_steps_per_second": 2.136,
24
  "step": 500
25
  },
26
  {
27
  "epoch": 0.7,
28
+ "grad_norm": 0.5068113207817078,
29
  "learning_rate": 4.133344923504868e-05,
30
+ "loss": 0.3922,
31
  "step": 1000
32
  },
33
  {
34
  "epoch": 0.7,
35
+ "eval_loss": 0.4581904709339142,
36
+ "eval_runtime": 93.9811,
37
+ "eval_samples_per_second": 135.176,
38
+ "eval_steps_per_second": 2.117,
39
  "step": 1000
40
+ },
41
+ {
42
+ "epoch": 1.04,
43
+ "grad_norm": 0.6911681890487671,
44
+ "learning_rate": 3.698713490959667e-05,
45
+ "loss": 0.3655,
46
+ "step": 1500
47
+ },
48
+ {
49
+ "epoch": 1.04,
50
+ "eval_loss": 0.4568086564540863,
51
+ "eval_runtime": 93.8201,
52
+ "eval_samples_per_second": 135.408,
53
+ "eval_steps_per_second": 2.121,
54
+ "step": 1500
55
+ },
56
+ {
57
+ "epoch": 1.39,
58
+ "grad_norm": 0.5658309459686279,
59
+ "learning_rate": 3.2640820584144646e-05,
60
+ "loss": 0.3455,
61
+ "step": 2000
62
+ },
63
+ {
64
+ "epoch": 1.39,
65
+ "eval_loss": 0.45656052231788635,
66
+ "eval_runtime": 94.4047,
67
+ "eval_samples_per_second": 134.57,
68
+ "eval_steps_per_second": 2.108,
69
+ "step": 2000
70
  }
71
  ],
72
  "logging_steps": 500,
 
74
  "num_input_tokens_seen": 0,
75
  "num_train_epochs": 4,
76
  "save_steps": 500,
77
+ "total_flos": 1.7334669712293888e+16,
78
  "train_batch_size": 64,
79
  "trial_name": null,
80
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a49400ed8744cf57f1a96430857f2cb498143627b7bf3e102c3bef48e432100f
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17e6869522a097ec64314dcf3fed02e0d24916c5cedb8b01b2170c098b079f8a
3
  size 5368