ABerlanga committed on
Commit
ed6e170
•
1 Parent(s): ec96793

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "codellama/CodeLlama-7b-hf",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -19,13 +19,13 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "v_proj",
23
  "up_proj",
24
- "q_proj",
25
  "k_proj",
26
- "gate_proj",
27
  "o_proj",
28
- "down_proj"
 
 
 
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_rslora": false
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "up_proj",
 
23
  "k_proj",
 
24
  "o_proj",
25
+ "v_proj",
26
+ "gate_proj",
27
+ "down_proj",
28
+ "q_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22ec15eca907a9a930db73a5dcd34181aa729faebb5ea1fdeb0fe525d959d08f
3
- size 1803907984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f3db0b893795693946784b261fe7a80ab48a8a714e8e17eb0753d9a8262f97b
3
+ size 1803645840
runs/Jan31_21-15-26_08f61ef6f9b6/events.out.tfevents.1706735860.08f61ef6f9b6.416.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e52617808e03bd71af428423e3c00c6121dae6ef28f969206b30af7804b0515
3
+ size 15559
tokenizer.json CHANGED
@@ -31,43 +31,7 @@
31
  "special": true
32
  },
33
  {
34
- "id": 32007,
35
- "content": "▁<PRE>",
36
- "single_word": false,
37
- "lstrip": false,
38
- "rstrip": false,
39
- "normalized": false,
40
- "special": true
41
- },
42
- {
43
- "id": 32008,
44
- "content": "▁<SUF>",
45
- "single_word": false,
46
- "lstrip": false,
47
- "rstrip": false,
48
- "normalized": false,
49
- "special": true
50
- },
51
- {
52
- "id": 32009,
53
- "content": "▁<MID>",
54
- "single_word": false,
55
- "lstrip": false,
56
- "rstrip": false,
57
- "normalized": false,
58
- "special": true
59
- },
60
- {
61
- "id": 32010,
62
- "content": "▁<EOT>",
63
- "single_word": false,
64
- "lstrip": false,
65
- "rstrip": false,
66
- "normalized": false,
67
- "special": true
68
- },
69
- {
70
- "id": 32016,
71
  "content": "<|im_end|>",
72
  "single_word": false,
73
  "lstrip": false,
@@ -76,7 +40,7 @@
76
  "special": true
77
  },
78
  {
79
- "id": 32017,
80
  "content": "<|im_start|>",
81
  "single_word": false,
82
  "lstrip": false,
@@ -32188,23 +32152,7 @@
32188
  "왕": 31996,
32189
  "收": 31997,
32190
  "弘": 31998,
32191
- "给": 31999,
32192
- "▁<SU": 32000,
32193
- "▁<SUF": 32001,
32194
- "▁<PRE": 32002,
32195
- "▁<M": 32003,
32196
- "▁<MID": 32004,
32197
- "▁<E": 32005,
32198
- "▁<EOT": 32006,
32199
- "▁<PRE>": 32007,
32200
- "▁<SUF>": 32008,
32201
- "▁<MID>": 32009,
32202
- "▁<EOT>": 32010,
32203
- "▁<EOT><EOT>": 32011,
32204
- "▁<EOT><EOT><EOT>": 32012,
32205
- "▁<EOT><EOT><EOT><EOT>": 32013,
32206
- "▁<EOT><EOT><EOT><EOT><EOT>": 32014,
32207
- "▁<EOT><EOT><EOT><EOT><EOT><EOT>": 32015
32208
  },
32209
  "merges": [
32210
  "▁ t",
@@ -93455,18 +93403,7 @@
93455
  "▁▁▁▁▁▁▁▁▁ ▁▁▁▁▁▁",
93456
  "▁▁▁▁▁▁▁ ▁▁▁▁▁▁▁▁",
93457
  "▁▁▁▁▁▁▁▁▁▁▁ ▁▁▁▁",
93458
- "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
93459
- "▁< SU",
93460
- "▁<SU F",
93461
- "▁< PRE",
93462
- "▁< M",
93463
- "▁<M ID",
93464
- "▁< E",
93465
- "▁<E OT",
93466
- "▁<PRE >",
93467
- "▁<SUF >",
93468
- "▁<MID >",
93469
- "▁<EOT >"
93470
  ]
93471
  }
93472
  }
 
31
  "special": true
32
  },
33
  {
34
+ "id": 32000,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  "content": "<|im_end|>",
36
  "single_word": false,
37
  "lstrip": false,
 
40
  "special": true
41
  },
42
  {
43
+ "id": 32001,
44
  "content": "<|im_start|>",
45
  "single_word": false,
46
  "lstrip": false,
 
32152
  "왕": 31996,
32153
  "收": 31997,
32154
  "弘": 31998,
32155
+ "给": 31999
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32156
  },
32157
  "merges": [
32158
  "▁ t",
 
93403
  "▁▁▁▁▁▁▁▁▁ ▁▁▁▁▁▁",
93404
  "▁▁▁▁▁▁▁ ▁▁▁▁▁▁▁▁",
93405
  "▁▁▁▁▁▁▁▁▁▁▁ ▁▁▁▁",
93406
+ "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁"
 
 
 
 
 
 
 
 
 
 
 
93407
  ]
93408
  }
93409
  }
tokenizer_config.json CHANGED
@@ -26,39 +26,7 @@
26
  "single_word": false,
27
  "special": true
28
  },
29
- "32007": {
30
- "content": "▁<PRE>",
31
- "lstrip": false,
32
- "normalized": false,
33
- "rstrip": false,
34
- "single_word": false,
35
- "special": true
36
- },
37
- "32008": {
38
- "content": "▁<SUF>",
39
- "lstrip": false,
40
- "normalized": false,
41
- "rstrip": false,
42
- "single_word": false,
43
- "special": true
44
- },
45
- "32009": {
46
- "content": "▁<MID>",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false,
51
- "special": true
52
- },
53
- "32010": {
54
- "content": "▁<EOT>",
55
- "lstrip": false,
56
- "normalized": false,
57
- "rstrip": false,
58
- "single_word": false,
59
- "special": true
60
- },
61
- "32016": {
62
  "content": "<|im_end|>",
63
  "lstrip": false,
64
  "normalized": false,
@@ -66,7 +34,7 @@
66
  "single_word": false,
67
  "special": true
68
  },
69
- "32017": {
70
  "content": "<|im_start|>",
71
  "lstrip": false,
72
  "normalized": false,
@@ -83,16 +51,12 @@
83
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
84
  "clean_up_tokenization_spaces": false,
85
  "eos_token": "<|im_end|>",
86
- "eot_token": "▁<EOT>",
87
- "fill_token": "<FILL_ME>",
88
- "legacy": null,
89
- "middle_token": "▁<MID>",
90
  "model_max_length": 1000000000000000019884624838656,
91
  "pad_token": "<|im_end|>",
92
- "prefix_token": "▁<PRE>",
93
  "sp_model_kwargs": {},
94
- "suffix_token": "▁<SUF>",
95
- "tokenizer_class": "CodeLlamaTokenizer",
96
  "unk_token": "<unk>",
97
  "use_default_system_prompt": false
98
  }
 
26
  "single_word": false,
27
  "special": true
28
  },
29
+ "32000": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  "content": "<|im_end|>",
31
  "lstrip": false,
32
  "normalized": false,
 
34
  "single_word": false,
35
  "special": true
36
  },
37
+ "32001": {
38
  "content": "<|im_start|>",
39
  "lstrip": false,
40
  "normalized": false,
 
51
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
52
  "clean_up_tokenization_spaces": false,
53
  "eos_token": "<|im_end|>",
54
+ "legacy": false,
 
 
 
55
  "model_max_length": 1000000000000000019884624838656,
56
  "pad_token": "<|im_end|>",
57
+ "padding_side": "right",
58
  "sp_model_kwargs": {},
59
+ "tokenizer_class": "LlamaTokenizer",
 
60
  "unk_token": "<unk>",
61
  "use_default_system_prompt": false
62
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28a45aca5ab35e569815fffefb7d31b0405c5201cdcba8ebe1588feb9626243b
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa1ba59014e4e8e028b8a46ef609bc1bb6f80342b5f1442a0c383b971d6b067
3
  size 4728