xammi committed
Commit 8ac59cb
Parent: b62db11

Training in progress, step 500

adapter_config.json CHANGED
```diff
@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "unsloth/tinyllama-bnb-4bit",
+  "base_model_name_or_path": "unsloth/tinyllama-chat-bnb-4bit",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -15,20 +15,20 @@
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": [
-    "lm_head",
-    "embed_tokens"
+    "embed_tokens",
+    "lm_head"
   ],
   "peft_type": "LORA",
   "r": 128,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
     "down_proj",
     "up_proj",
-    "q_proj",
     "o_proj",
-    "gate_proj",
     "v_proj",
+    "gate_proj",
     "k_proj"
   ],
   "task_type": "CAUSAL_LM",
```
adapter_model.safetensors CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d64a914458ab95accdfd355f2dc697d7291e2119c4006b0752c1f68a3fe77f5
+oid sha256:e347e50d6716cfefb693cc92ebf0a27e1b51aae9d9b114cc1b4bf7daeaeeed28
 size 928031856
```
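Only the Git LFS pointer changes here: the weights themselves live in LFS storage, and the pointer records their sha256 (`oid`) and byte size. A quick integrity check after download, sketched in Python (the local path is an assumption):

```python
# Sketch: verify a downloaded LFS object against the pointer's oid.
# The local path is an assumption; the expected hash is the new oid above.
import hashlib

def sha256_of(path: str) -> str:
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # 1 MiB chunks
            h.update(chunk)
    return h.hexdigest()

expected = "e347e50d6716cfefb693cc92ebf0a27e1b51aae9d9b114cc1b4bf7daeaeeed28"
assert sha256_of("adapter_model.safetensors") == expected, "hash mismatch"
```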
runs/Sep23_18-41-41_sammie/events.out.tfevents.1727138621.sammie.215374.0 ADDED
```diff
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e47aa32c00c7a9db0600c5d45d7fa8e12d03c834b500fa4331275d07d22aa944
+size 7804
```
runs/Sep23_18-47-08_sammie/events.out.tfevents.1727138836.sammie.215374.1 ADDED
```diff
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05eb491eabdcfa5479898053f11455063c46f61132045dc2555b6f8f5cc13529
+size 16237
```
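These tfevents files are TensorBoard event logs written during training. One way to read them programmatically, sketched with TensorBoard's event-processing API (the scalar tag name is an assumption about what the Trainer logged here):

```python
# Sketch: read scalars from the new event files; the tag "train/loss"
# is an assumption -- list Tags() first to see what is actually present.
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

acc = EventAccumulator("runs/Sep23_18-47-08_sammie")
acc.Reload()                    # parse all events from disk
print(acc.Tags()["scalars"])    # scalar tags actually present in the run
for e in acc.Scalars("train/loss"):
    print(e.step, e.value)
```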
tokenizer_config.json CHANGED
```diff
@@ -29,12 +29,13 @@
     }
   },
   "bos_token": "<s>",
+  "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": false,
   "model_max_length": 2048,
   "pad_token": "<unk>",
-  "padding_side": "left",
+  "padding_side": "right",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",
   "unk_token": "<unk>",
```
training_args.bin CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4c89a36a77fa9eebd71816a8911311d820a1b6d5082b97bbfa52d8df84a2916e
+oid sha256:c750b60303af2a2b5c01d7de4b0117c092f04379827ff62731f3912f38b2b0d7
 size 5496
```
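training_args.bin is the Trainer's pickled `TrainingArguments` (same 5496-byte size, new contents). If you trust the checkpoint source, it can be inspected directly; a sketch, with example fields:

```python
# Sketch: inspect the pickled TrainingArguments. Unpickling executes
# code, so only do this for checkpoints you trust; printed fields are
# examples, not values confirmed by this commit.
import torch

args = torch.load("training_args.bin", weights_only=False)
print(type(args).__name__)                   # TrainingArguments
print(args.learning_rate, args.per_device_train_batch_size)
```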