Suparious committed
Commit 582edb4
1 Parent: 049e764

Adding AWQ model

Files changed (3)
  1. config.json +3 -2
  2. generation_config.json +1 -1
  3. tokenizer_config.json +2 -1
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/home/ubuntu/.cache/huggingface/hub/models--Locutusque--Llama-3-Orca-2.0-8B/snapshots/b6a4448cf33dd2c7a729a9ac12791a38a0955d33",
+  "_name_or_path": "/home/ubuntu/.cache/huggingface/hub/models--Locutusque--Llama-3-Orca-2.0-8B/snapshots/ec02fa2b6743bc47c4453bcfe92a0233d1467bd6",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -12,6 +12,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 14336,
   "max_position_embeddings": 8192,
+  "mlp_bias": false,
   "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
@@ -30,7 +31,7 @@
   "rope_theta": 500000.0,
   "tie_word_embeddings": false,
   "torch_dtype": "float16",
-  "transformers_version": "4.40.1",
+  "transformers_version": "4.41.0",
   "use_cache": false,
   "vocab_size": 128256
 }
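
Besides pointing "_name_or_path" at a newer source snapshot, the new config adds "mlp_bias", a Llama config field introduced around transformers 4.41.0, consistent with the "transformers_version" bump. A minimal loading sketch, assuming the AWQ weights are published to a Hugging Face repo and that the autoawq package is installed; the repo id below is a placeholder, not taken from this commit:

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "your-namespace/Llama-3-Orca-2.0-8B-AWQ"  # placeholder, not from this commit

tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModelForCausalLM.from_pretrained(
    repo_id,
    torch_dtype=torch.float16,  # matches "torch_dtype": "float16" in config.json
    device_map="auto",          # requires accelerate; assumption, not from this commit
)
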
generation_config.json CHANGED
@@ -5,5 +5,5 @@
   "max_length": 4096,
   "temperature": 0.6,
   "top_p": 0.9,
-  "transformers_version": "4.40.1"
+  "transformers_version": "4.41.0"
 }
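
The generation defaults themselves are unchanged (temperature 0.6, top_p 0.9, max_length 4096); only the recorded transformers version moves to 4.41.0. A short sketch of generation with these defaults, continuing from the loading sketch above; do_sample=True is passed explicitly because temperature and top_p only apply when sampling, which is an assumption not visible in this hunk:

# `model` and `tokenizer` come from the loading sketch above.
inputs = tokenizer("Explain AWQ quantization in one sentence.", return_tensors="pt").to(model.device)
outputs = model.generate(
    **inputs,
    do_sample=True,      # needed for temperature/top_p to take effect
    max_new_tokens=256,  # overrides max_length from generation_config.json for this call
)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
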
tokenizer_config.json CHANGED
@@ -2050,9 +2050,10 @@
     }
   },
   "bos_token": "<|begin_of_text|>",
+  "chat_template": "{%- set ns = namespace(found=false) -%}{%- for message in messages -%}{%- if message['role'] == 'system' -%}{%- set ns.found = true -%}{%- endif -%}{%- endfor -%}{%- for message in messages %}{%- if message['role'] == 'system' -%}{{- '<|im_start|>system\n' + message['content'].rstrip() + '<|im_end|>\n' -}}{%- else -%}{%- if message['role'] == 'user' -%}{{-'<|im_start|>user\n' + message['content'].rstrip() + '<|im_end|>\n'-}}{%- else -%}{{-'<|im_start|>assistant\n' + message['content'] + '<|im_end|>\n' -}}{%- endif -%}{%- endif -%}{%- endfor -%}{%- if add_generation_prompt -%}{{-'<|im_start|>assistant\n'-}}{%- endif -%}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|end_of_text|>",
-  "max_length": 512,
+  "max_length": 4096,
   "model_input_names": [
     "input_ids",
     "attention_mask"