CharlieFRuan
committed on
Commit
•
f53a857
1
Parent(s):
c889571
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +87 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,87 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q3f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 8192,
|
7 |
+
"intermediate_size": 28672,
|
8 |
+
"num_attention_heads": 64,
|
9 |
+
"num_hidden_layers": 80,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"low_freq_factor": 1.0,
|
17 |
+
"high_freq_factor": 4.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 2048,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"max_batch_size": 80
|
27 |
+
},
|
28 |
+
"vocab_size": 128256,
|
29 |
+
"context_window_size": 131072,
|
30 |
+
"sliding_window_size": -1,
|
31 |
+
"prefill_chunk_size": 2048,
|
32 |
+
"attention_sink_size": -1,
|
33 |
+
"tensor_parallel_shards": 1,
|
34 |
+
"temperature": 0.6,
|
35 |
+
"presence_penalty": 0.0,
|
36 |
+
"frequency_penalty": 0.0,
|
37 |
+
"repetition_penalty": 1.0,
|
38 |
+
"top_p": 0.9,
|
39 |
+
"tokenizer_files": [
|
40 |
+
"tokenizer.json",
|
41 |
+
"tokenizer_config.json"
|
42 |
+
],
|
43 |
+
"tokenizer_info": {
|
44 |
+
"token_postproc_method": "byte_level",
|
45 |
+
"prepend_space_in_encode": false,
|
46 |
+
"strip_space_in_decode": false
|
47 |
+
},
|
48 |
+
"conv_template": {
|
49 |
+
"name": "llama-3_1",
|
50 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
51 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
52 |
+
"system_prefix_token_ids": [
|
53 |
+
128000
|
54 |
+
],
|
55 |
+
"add_role_after_system_message": true,
|
56 |
+
"roles": {
|
57 |
+
"user": "<|start_header_id|>user",
|
58 |
+
"assistant": "<|start_header_id|>assistant"
|
59 |
+
},
|
60 |
+
"role_templates": {
|
61 |
+
"user": "{user_message}",
|
62 |
+
"assistant": "{assistant_message}",
|
63 |
+
"tool": "{tool_message}"
|
64 |
+
},
|
65 |
+
"messages": [],
|
66 |
+
"seps": [
|
67 |
+
"<|eot_id|>"
|
68 |
+
],
|
69 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
70 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
71 |
+
"stop_str": [],
|
72 |
+
"stop_token_ids": [
|
73 |
+
128001,
|
74 |
+
128008,
|
75 |
+
128009
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 128000,
|
82 |
+
"eos_token_id": [
|
83 |
+
128001,
|
84 |
+
128008,
|
85 |
+
128009
|
86 |
+
]
|
87 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea8ea3b8b20efbd30f64dff386633b23ae645356865a39def4eb19f4a5f355a
|
3 |
+
size 420679680
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cedc0b847c7fc518b975ad7f9e73cced0b79637d9a1bcedc79483c7ea8e2abf
|
3 |
+
size 52584960
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d215b245f2b3c5c260fa593d37d3b1f0c73004bf357c129be1494385f3939da4
|
3 |
+
size 23511040
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8b2614d2e8b464d0c8d2fa91009b4fd307d35ae5c64851652feebfa4348d223
|
3 |
+
size 26869760
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38601acf8027626e7865bac95c2b8e140930a948025964e815b7c20199b7f19b
|
3 |
+
size 31100928
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce6a90d09d38b37459295aed7203ebda09f07e494cd33a7dbd2d40569bffec0
|
3 |
+
size 93978624
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa5b535b1e87823a54a0a1b63e9a45dea4a2c97da433949615c3cf93c56c92d2
|
3 |
+
size 188088320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca2fa9fde069460bad2221f91bc59d5ee1b805c723396d424b03bd50fca8e96a
|
3 |
+
size 23511040
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd4625c851c5c89e0b8adcbaa7d9d4889dea59eec0b0594c35c2e88a585a4c91
|
3 |
+
size 33587200
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df5455e0523d67d59f2e7c0d2a707d276451fe2ae2741b9701999bff4caf07d4
|
3 |
+
size 26869760
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b174c2d1ce8dd9db3a6140e8c627b6095ea4d016a8f031a4300ef4fb9e7a2062
|
3 |
+
size 93978624
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb24c0d9217a0be1f13a5062c2c0dccc96d38489e4472838771a032b1916534d
|
3 |
+
size 22712320
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49a0f497034c844e949cd4045ad3074608f0752c153ad38b1de615dcb704937d
|
3 |
+
size 188088320
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7647adea8c531bc05daa6f79918645f778c903391fc925fb142321cd49ca325e
|
3 |
+
size 33587200
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19fdba357bc3eeee1ae3567ffdb9875ef9bd21c8ecc9bdab59146ef8150346df
|
3 |
+
size 23511040
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e46fb2afae0b0eaaf25fa766cd08d6f9cd7f2587c0b127704ba958a622adf4f7
|
3 |
+
size 33587200
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6fd2af7564ccc5955078cd196468a6efec47b3d56d6dd20e4785432092464e1
|
3 |
+
size 26869760
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cd70b218ec53d6fcb7b169f2f10bac191cbfefc6f23335d037835032b4a7c59
|
3 |
+
size 93978624
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276151e11953ec766ec91fa70be215be9ba39eaebed05fd545ad9a15ad7ef08e
|
3 |
+
size 188088320
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ee6c8a7d1c5772095a397ddfcd8d2d5592b87e4d6007da5508fcd2f654d2ec1
|
3 |
+
size 23511040
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5233da288d5e1a58d0d25b71ea5447e765af544d6a2c0b9b48dc3bec07fb448a
|
3 |
+
size 33587200
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b76ce0ff6afb54069ddb584fe596dae4c42ed6fa9bfd958255ac63b3a91352d5
|
3 |
+
size 31100928
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd57709f93dc28cdcc7b5639c9231bd06bf44aab982930e83b877a8d7755680
|
3 |
+
size 31068160
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c2cdf9095edebda0b913618debf1eeba1446c0302037613f406d17684ceecaf
|
3 |
+
size 188088320
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3426bbcde78cca0451a8fa227f166962536a03beb2c9799407ae1e2fe3676aa9
|
3 |
+
size 26869760
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50f6f504a6c899e4575c0f603e1f87a333160c0b05d0b57c5585715c8dee871d
|
3 |
+
size 33587200
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88e3db6caef239d0e6ffbb575228c014894f79c3047893016eb77e7a79067a11
|
3 |
+
size 26869760
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bd230e56d365e56e76da5c5108166c4119005b7967520462e4f13487e3c04d1
|
3 |
+
size 31068160
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93bbc9b99f0cb9f5a3e757b773818a3fb6b85117991f48c030e507eee86e2229
|
3 |
+
size 93978624
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f6970ee56b45be2d8cf2335197c786852f6da5a5171af9646b54e838cb4e24
|
3 |
+
size 93978624
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fbc50bd3be32357897c45fa0e4f608cace143ba7c124ce26cac650a31d02dc0
|
3 |
+
size 188088320
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bb99e0ec4d2ebb024e52a00379c7f2e7bdbb10ec94dd809b0f7ea4647557152
|
3 |
+
size 23511040
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1322381c3c3621cd82da2d3ee8b7e4d34a2ea402e7accf7b1da20574ab7a9154
|
3 |
+
size 33587200
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81b76b71bb2e827659a1009988ecb6fa495bfc0c7ff3369ef5c338b5c9fc0b70
|
3 |
+
size 26869760
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7378af8a43663e27815f580433a0a390318caea6c54968d16eade415c5fa2fcb
|
3 |
+
size 31117312
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:996ea63d4e4eb323a8c5e42a4847e8156eeb5531ff301a7784bf181c904d7a2c
|
3 |
+
size 93978624
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa9ca6b9c07202b7dcc87a36671522bb84be785298a5abf867b8c8f5416d56e9
|
3 |
+
size 93978624
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fce56b5b5fdb29280975d94bc5bfcf52f9972531f3712848c36d789ab7b3c1ab
|
3 |
+
size 188088320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd0ca9521fe8a826457a599c80303c8ef1dfa71d43d09bfa3c6168c46051910f
|
3 |
+
size 23511040
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5380299096c91382d171778736d4429b093feeb781e3d61331ae70115e1c8a1f
|
3 |
+
size 33587200
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72742e961e0f549b94d6c29e283b7edc3923bd0c17c965ad2c9d520face7b5d2
|
3 |
+
size 26869760
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92c901b4778647ef776d30481b179234691be0d124c20e1ca02ff50f878589e1
|
3 |
+
size 188088320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ceb7b97a723bbf26817d4052c847ba6568b9360b5c4a942c05c3fb6f6ba2a78
|
3 |
+
size 23511040
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e4693826ed24a1dbc416a852d56b4fdecb82e728a6f7428e83dd86e3a3f3b00
|
3 |
+
size 33587200
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:961eb4fe1923336410e3dd031597f1b0b88bec5d22a0522895b74900484c42b6
|
3 |
+
size 26869760
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65b1b49af6c494b3017f7a5ad5883ff197fd1d8b404c539d4aaf0fada2a65cab
|
3 |
+
size 93978624
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71138804e567f1748dc96fe852ef70538888c0acca01aaaa78a3ebec31ec6091
|
3 |
+
size 26910720
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6640450085ff75d1b31e93233091281db6a7accf8cbf5929b39a042126e83c09
|
3 |
+
size 30269440
|