CharlieFRuan
committed on
Commit
•
300ae9f
1
Parent(s):
cddce97
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +86 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"low_freq_factor": 1.0,
|
17 |
+
"high_freq_factor": 4.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 2048,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 80
|
28 |
+
},
|
29 |
+
"vocab_size": 128256,
|
30 |
+
"context_window_size": 131072,
|
31 |
+
"sliding_window_size": -1,
|
32 |
+
"prefill_chunk_size": 2048,
|
33 |
+
"attention_sink_size": -1,
|
34 |
+
"tensor_parallel_shards": 1,
|
35 |
+
"pipeline_parallel_stages": 1,
|
36 |
+
"temperature": 0.6,
|
37 |
+
"presence_penalty": 0.0,
|
38 |
+
"frequency_penalty": 0.0,
|
39 |
+
"repetition_penalty": 1.0,
|
40 |
+
"top_p": 0.9,
|
41 |
+
"tokenizer_files": [
|
42 |
+
"tokenizer.json",
|
43 |
+
"tokenizer_config.json"
|
44 |
+
],
|
45 |
+
"tokenizer_info": {
|
46 |
+
"token_postproc_method": "byte_level",
|
47 |
+
"prepend_space_in_encode": false,
|
48 |
+
"strip_space_in_decode": false
|
49 |
+
},
|
50 |
+
"conv_template": {
|
51 |
+
"name": "llama-3_1",
|
52 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
53 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
54 |
+
"system_prefix_token_ids": [
|
55 |
+
128000
|
56 |
+
],
|
57 |
+
"add_role_after_system_message": true,
|
58 |
+
"roles": {
|
59 |
+
"user": "<|start_header_id|>user",
|
60 |
+
"assistant": "<|start_header_id|>assistant",
|
61 |
+
"tool": "<|start_header_id|>ipython"
|
62 |
+
},
|
63 |
+
"role_templates": {
|
64 |
+
"user": "{user_message}",
|
65 |
+
"assistant": "{assistant_message}",
|
66 |
+
"tool": "{tool_message}"
|
67 |
+
},
|
68 |
+
"messages": [],
|
69 |
+
"seps": [
|
70 |
+
"<|eot_id|>"
|
71 |
+
],
|
72 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
73 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
74 |
+
"stop_str": [],
|
75 |
+
"stop_token_ids": [
|
76 |
+
128001,
|
77 |
+
128008,
|
78 |
+
128009
|
79 |
+
],
|
80 |
+
"function_string": "",
|
81 |
+
"use_function_calling": false
|
82 |
+
},
|
83 |
+
"pad_token_id": 0,
|
84 |
+
"bos_token_id": 128000,
|
85 |
+
"eos_token_id": 128001
|
86 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2573a3efeffc45038427e1dbdcdeb68b9a5f5196f9ba3e42eeb5c60a78c7089c
|
3 |
+
size 1050673152
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8282f2e760779a55f43437520ffe20e7ba3427039e0c480b8c735ffbc50d291d
|
3 |
+
size 117440512
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed2f1e6665bbef0a3becb3725224704e553c97e3e67bb1080daa253ddf18f919
|
3 |
+
size 33554432
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c50428d3815ff5f054e15fa1362c1aef9b935176c78dc4ce290eac9d6c72cf8d
|
3 |
+
size 234881024
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af22d13687bcaa3d0d8266ab765faa799922cd56fcff4f66d9de67586ac8004c
|
3 |
+
size 50331648
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75d4bd9451d27d30bf68ba7d37dae70a2392ec8240e84303f026894ae15a7698
|
3 |
+
size 33554432
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f15586edaffc3be1e823ecc4a9d0b6ff56532552e0a7f5288364ba49d246499
|
3 |
+
size 117440512
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d342c428105642ddd5de632b01a4bd94638b9cc60700a2a073b097ef11ba948
|
3 |
+
size 234881024
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ceb77f0318add9a0552ba67b360bbc5879488df5c0d4d09cf2a44572eb6fdb0
|
3 |
+
size 50331648
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b36fe6310cd028ecd88f9f6f15fd42b09554c4a080c5ff08f23536a0bb69a12c
|
3 |
+
size 33554432
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce8982aa3ea3f4d29778c3113012886d7a492da015f0e5a68638c2516203b513
|
3 |
+
size 117440512
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cd8ae1ed4e7cebf60bf81d8644e2ded0466676b08ed888df84328908c0975fb
|
3 |
+
size 234881024
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afe9b5185815b42b505a270a4aa55c136e2ccd4681cec3942609c483db70aeb2
|
3 |
+
size 50331648
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb3a7f912b0df7e873d491754ff106f5d02a5b70a23f30e58cd0f5f58443c6d
|
3 |
+
size 117440512
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc16581455eb0fd60cfbc94b3f9c3bfc267d026c8d59d0463305c9d74bc78787
|
3 |
+
size 33554432
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90adeb94a5869c9acb4a2802b1ae61b1ef0b56660774a3eba1b9045216afabf2
|
3 |
+
size 117440512
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bacde7465ab65265e32f3141220a5c3dd23387d59d6e264aec7837450ae66e3
|
3 |
+
size 234881024
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da63b26137b60eac360bed70117f9797c08f8fb55e75df6e9c53793234c410dd
|
3 |
+
size 50331648
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d308ced6600d40eaf69437557dd137d8e562c7e3af4a4223fd4e6b3f175fa9b
|
3 |
+
size 33554432
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d58688d014e95078d59fc6d92bda51727ba57f9d62ff6822b3fb35d9a46373
|
3 |
+
size 117440512
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:facd2c13abe14a13b3f9be0617ba9d33f0f0e7330e8ae44e2364851b74ebef1c
|
3 |
+
size 234881024
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb9829dbaffe21d50dd8e9d8226d4cc4be24edf0d5a15f98ccd7e6738b3cbe7a
|
3 |
+
size 50331648
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a90e99852dcd2c8dbaba34564b6b7d42451b43998e66d95247e60aedbed9c4f
|
3 |
+
size 33554432
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e3b8717ad5bfdb9beae752a2ea116ac42bb695a72444fc1ae544a4a6f19ca07
|
3 |
+
size 117440512
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1a6fe30338654fc0d8e430219ae6adc9caf3d367f94808a8f4c659760507601
|
3 |
+
size 234881024
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:250e856e608c6116b1b08aefb8ce33fa9105da885dd2a793ac8f3c047f7e0421
|
3 |
+
size 234881024
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23aa3c0ac6ca0b03a466bc7148da9a3ac6d4b2fde031db9d7003d774d547e418
|
3 |
+
size 50331648
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bc5bb74dcce3425198ed7c2411bf4c041dbbd36abb53621a93c621b252f292c
|
3 |
+
size 33554432
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:387c9b2e7ca617872677ce15b6efbcf19d95ca0d4d16aaaddbbf82e17af38b5c
|
3 |
+
size 117440512
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d0d80f3899c1b3f4580333e662e1e9efcd8c790b5778aaf6fa039070b0eda2a
|
3 |
+
size 234881024
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8454a4b69ae3ba401c00fbc5d33dafdcd5fec25b754d1f920eb56f44d3cc549
|
3 |
+
size 50331648
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fd429bab7ebfd9992c68ad6d9d3df2d8fa4c36ceda6496a697a108693fec7a5
|
3 |
+
size 33554432
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2fb125af9dc183997da50e554a75f813856f229d59946393115cd544cdcb187
|
3 |
+
size 234881024
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bf74439e2a0d78249523af702eab4ed9e958fbb62f603670494e852d064a151
|
3 |
+
size 50331648
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d810740d8e0bb29c50abab8f6f7c0b1f700b73e64dc244791da3c9173864786
|
3 |
+
size 33554432
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e750027aa404e2eeb4e5c9dd9acdedee4ce61f992a0b646bca466e8805ed9c5a
|
3 |
+
size 50331648
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:812055e6aba2097fe8f0c7af973898f4958e62501bed91321cf9f3dacac7e16f
|
3 |
+
size 532480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1a2b4c37371bb00a52259adade7aedf89158c6a424f3d593f701f01baaf38e6
|
3 |
+
size 33554432
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187ba5769c17eadeaf0fa7fb66f763ba0a076c096622f64efa9fa7584f20f734
|
3 |
+
size 117440512
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8e79a8d5bd9b18a1c91141a00f6f1cc6639032cf9828a3b99ca837a75acfacb
|
3 |
+
size 234881024
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a6b2cfde0e8be952e3e1d4086d92704c1f9a38090026dfd6cee8d22b490ea86
|
3 |
+
size 50331648
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9379f6cddd9dfb9aa8072b3d897834dd0037f9034b6ac8afd9678371204b862
|
3 |
+
size 33554432
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c43157edf03a806be50175a689caacd15841fab4452148676d7d7d1d8b445140
|
3 |
+
size 117440512
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1f60979ed67d6dea5906bcd5939cf043a595a7bd5dc82572d7741591afc2d08
|
3 |
+
size 1050673152
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50b4c1f5b31210acead1568f4f0d945c5b0ac748d0e5592032387d2135ffa268
|
3 |
+
size 234881024
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6db4e3978f24942805c59b6ce7211f962acc4a0ab0ac9cba30a8d4bf5170422e
|
3 |
+
size 50331648
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3d37de8d6032ba387fdf2bc0bc6eb4ec04bc14ce50650f40a45ca2b41e2a5aa
|
3 |
+
size 33554432
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3ef8295589d5ced1dbd7befe6b791e1366c60ba6175638535f5c4420a95285e
|
3 |
+
size 117440512
|