derekngo committed
Commit 2561944 • 1 Parent(s): fa75fc5

Training in progress, epoch 1

adapter_config.json CHANGED
@@ -1,11 +1,12 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "meta-llama/Llama-2-70b-chat-hf",
+  "base_model_name_or_path": "codellama/CodeLlama-7b-hf",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
+  "layer_replication": null,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
@@ -19,14 +20,15 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "up_proj",
-    "gate_proj",
-    "k_proj",
-    "down_proj",
     "q_proj",
+    "gate_proj",
+    "up_proj",
     "v_proj",
-    "o_proj"
+    "o_proj",
+    "down_proj",
+    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
+  "use_dora": false,
   "use_rslora": false
 }
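
Net effect of this file: the adapter is rebased from meta-llama/Llama-2-70b-chat-hf onto codellama/CodeLlama-7b-hf, and target_modules now covers all seven attention/MLP projections. A minimal loading sketch with PEFT follows; the adapter repo id is a placeholder, not taken from this commit.

```python
# Sketch: attach this LoRA adapter to its new base model.
# ADAPTER_REPO is hypothetical; substitute the actual Hub repo id.
from transformers import AutoModelForCausalLM
from peft import PeftModel

ADAPTER_REPO = "derekngo/your-adapter-repo"  # placeholder

base = AutoModelForCausalLM.from_pretrained("codellama/CodeLlama-7b-hf")
# Reads adapter_config.json and adapter_model.safetensors from the repo.
model = PeftModel.from_pretrained(base, ADAPTER_REPO)
model.eval()
```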
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7792242ad6910a3fe13188098a0853647a383d646ab538d1f420b57220b8a144
-size 7675798384
+oid sha256:07a893ac183c68eb13b07e8b5ae88538e555554e96b59a93c4da8575b7bc4f77
+size 1803907984
runs/Sep16_04-58-39_8PYKQ04/events.out.tfevents.1726462726.8PYKQ04.4374.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6aa52afdab18e66d68cf899a46938dd5a0d6ba41c774dc63c1a42be276594098
+size 9214
special_tokens_map.json CHANGED
@@ -1,14 +1,14 @@
 {
   "additional_special_tokens": [
     {
-      "content": "<|im_end|>",
+      "content": "<|im_start|>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false
     },
     {
-      "content": "<|im_start|>",
+      "content": "<|im_end|>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
tokenizer.json CHANGED
@@ -31,8 +31,26 @@
       "special": true
     },
     {
-      "id": 32000,
-      "content": "<|im_end|>",
+      "id": 32007,
+      "content": "▁<PRE>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32008,
+      "content": "▁<SUF>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32009,
+      "content": "▁<MID>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -40,13 +58,31 @@
       "special": true
     },
     {
-      "id": 32001,
+      "id": 32010,
+      "content": "▁<EOT>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32016,
       "content": "<|im_start|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "normalized": false,
       "special": true
+    },
+    {
+      "id": 32017,
+      "content": "<|im_end|>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
     }
   ],
   "normalizer": {
@@ -152,6 +188,7 @@
     "end_of_word_suffix": null,
     "fuse_unk": true,
     "byte_fallback": true,
+    "ignore_merges": false,
     "vocab": {
       "<unk>": 0,
       "<s>": 1,
@@ -32152,7 +32189,23 @@
       "왕": 31996,
       "收": 31997,
       "弘": 31998,
-      "给": 31999
+      "给": 31999,
+      "▁<SU": 32000,
+      "▁<SUF": 32001,
+      "▁<PRE": 32002,
+      "▁<M": 32003,
+      "▁<MID": 32004,
+      "▁<E": 32005,
+      "▁<EOT": 32006,
+      "▁<PRE>": 32007,
+      "▁<SUF>": 32008,
+      "▁<MID>": 32009,
+      "▁<EOT>": 32010,
+      "▁<EOT><EOT>": 32011,
+      "▁<EOT><EOT><EOT>": 32012,
+      "▁<EOT><EOT><EOT><EOT>": 32013,
+      "▁<EOT><EOT><EOT><EOT><EOT>": 32014,
+      "▁<EOT><EOT><EOT><EOT><EOT><EOT>": 32015
     },
     "merges": [
       "▁ t",
@@ -93403,7 +93456,18 @@
       "▁▁▁▁▁▁▁▁▁ ▁▁▁▁▁▁",
       "▁▁▁▁▁▁▁ ▁▁▁▁▁▁▁▁",
       "▁▁▁▁▁▁▁▁▁▁▁ ▁▁▁▁",
-      "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁"
+      "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
+      "▁< SU",
+      "▁<SU F",
+      "▁< PRE",
+      "▁< M",
+      "▁<M ID",
+      "▁< E",
+      "▁<E OT",
+      "▁<PRE >",
+      "▁<SUF >",
+      "▁<MID >",
+      "▁<EOT >"
     ]
   }
 }
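
These hunks restore CodeLlama's fill-in-the-middle vocabulary (▁<PRE>/▁<SUF>/▁<MID>/▁<EOT> at ids 32007-32010, plus the merge fragments at 32000-32015) and move the ChatML markers to ids 32016/32017. With transformers' CodeLlamaTokenizer, infilling is normally driven through the <FILL_ME> fill token; a hedged sketch against the stock base checkpoint:

```python
# Sketch: CodeLlama fill-in-the-middle via the <FILL_ME> fill token.
# The tokenizer expands <FILL_ME> into the PRE/SUF/MID layout restored
# by this commit; the model then generates the missing middle span.
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("codellama/CodeLlama-7b-hf")
model = AutoModelForCausalLM.from_pretrained("codellama/CodeLlama-7b-hf")

prompt = 'def remove_non_ascii(s: str) -> str:\n    """<FILL_ME>\n    return result'
input_ids = tokenizer(prompt, return_tensors="pt").input_ids
out = model.generate(input_ids, max_new_tokens=64)
middle = tokenizer.batch_decode(out[:, input_ids.shape[1]:], skip_special_tokens=True)[0]
print(prompt.replace("<FILL_ME>", middle))
```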
tokenizer_config.json CHANGED
@@ -26,37 +26,73 @@
       "single_word": false,
       "special": true
     },
-    "32000": {
-      "content": "<|im_end|>",
+    "32007": {
+      "content": "▁<PRE>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32008": {
+      "content": "▁<SUF>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32009": {
+      "content": "▁<MID>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "32001": {
+    "32010": {
+      "content": "▁<EOT>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32016": {
       "content": "<|im_start|>",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
+    },
+    "32017": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
     }
   },
   "additional_special_tokens": [
-    "<|im_end|>",
-    "<|im_start|>"
+    "<|im_start|>",
+    "<|im_end|>"
   ],
   "bos_token": "<|im_start|>",
   "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|im_end|>",
-  "legacy": false,
+  "eot_token": "▁<EOT>",
+  "fill_token": "<FILL_ME>",
+  "legacy": null,
+  "middle_token": "▁<MID>",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|im_end|>",
-  "padding_side": "right",
+  "prefix_token": "▁<PRE>",
   "sp_model_kwargs": {},
-  "tokenizer_class": "LlamaTokenizer",
+  "suffix_token": "▁<SUF>",
+  "tokenizer_class": "CodeLlamaTokenizer",
   "unk_token": "<unk>",
   "use_default_system_prompt": false
 }
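
The chat_template itself is unchanged ChatML; this file mainly re-registers the special tokens at their new ids and switches to CodeLlamaTokenizer with its FIM token fields. Rendering the template goes through the standard apply_chat_template API; the repo id is again a placeholder:

```python
# Sketch: render the ChatML chat_template from this tokenizer_config.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("derekngo/your-adapter-repo")  # placeholder
messages = [{"role": "user", "content": "Reverse a string in Python."}]
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(prompt)
# <|im_start|>user
# Reverse a string in Python.<|im_end|>
# <|im_start|>assistant
```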
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc46b03d6ce07cc11851cace10a01050c91e0e15a9614e93960b87d32a361063
-size 4728
+oid sha256:0b28848c5969bf7d9f57b05e7b1ca571441f8d8d211f3ed305ccb3d8e71a791a
+size 5048