CharlieFRuan
committed on
Commit
•
f4027ef
1
Parent(s):
9da0214
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +86 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": {
|
15 |
+
"factor": 8.0,
|
16 |
+
"low_freq_factor": 1.0,
|
17 |
+
"high_freq_factor": 4.0,
|
18 |
+
"original_max_position_embeddings": 8192,
|
19 |
+
"rope_type": "llama3"
|
20 |
+
},
|
21 |
+
"context_window_size": 131072,
|
22 |
+
"prefill_chunk_size": 2048,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"head_dim": 128,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"pipeline_parallel_stages": 1,
|
27 |
+
"max_batch_size": 80
|
28 |
+
},
|
29 |
+
"vocab_size": 128256,
|
30 |
+
"context_window_size": 131072,
|
31 |
+
"sliding_window_size": -1,
|
32 |
+
"prefill_chunk_size": 2048,
|
33 |
+
"attention_sink_size": -1,
|
34 |
+
"tensor_parallel_shards": 1,
|
35 |
+
"pipeline_parallel_stages": 1,
|
36 |
+
"temperature": 0.6,
|
37 |
+
"presence_penalty": 0.0,
|
38 |
+
"frequency_penalty": 0.0,
|
39 |
+
"repetition_penalty": 1.0,
|
40 |
+
"top_p": 0.9,
|
41 |
+
"tokenizer_files": [
|
42 |
+
"tokenizer.json",
|
43 |
+
"tokenizer_config.json"
|
44 |
+
],
|
45 |
+
"tokenizer_info": {
|
46 |
+
"token_postproc_method": "byte_level",
|
47 |
+
"prepend_space_in_encode": false,
|
48 |
+
"strip_space_in_decode": false
|
49 |
+
},
|
50 |
+
"conv_template": {
|
51 |
+
"name": "llama-3_1",
|
52 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
53 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
54 |
+
"system_prefix_token_ids": [
|
55 |
+
128000
|
56 |
+
],
|
57 |
+
"add_role_after_system_message": true,
|
58 |
+
"roles": {
|
59 |
+
"user": "<|start_header_id|>user",
|
60 |
+
"assistant": "<|start_header_id|>assistant",
|
61 |
+
"tool": "<|start_header_id|>ipython"
|
62 |
+
},
|
63 |
+
"role_templates": {
|
64 |
+
"user": "{user_message}",
|
65 |
+
"assistant": "{assistant_message}",
|
66 |
+
"tool": "{tool_message}"
|
67 |
+
},
|
68 |
+
"messages": [],
|
69 |
+
"seps": [
|
70 |
+
"<|eot_id|>"
|
71 |
+
],
|
72 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
73 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
74 |
+
"stop_str": [],
|
75 |
+
"stop_token_ids": [
|
76 |
+
128001,
|
77 |
+
128008,
|
78 |
+
128009
|
79 |
+
],
|
80 |
+
"function_string": "",
|
81 |
+
"use_function_calling": false
|
82 |
+
},
|
83 |
+
"pad_token_id": 0,
|
84 |
+
"bos_token_id": 128000,
|
85 |
+
"eos_token_id": 128001
|
86 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c475522c845b2532b3bf900c60501e396a775edb908b2ff743bb6562cde8eae3
|
3 |
+
size 262668288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b2139d9ac66a515404fbe14cbeaef07b010fdbaa62f760dcc3ed4aee5acb66d
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d48f708686d64fbdbb71783517b023a84879f828d795386ca47e793bf785f697
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c513fee59bf8af40162dc4d0fbfc17076dfcc92f189405340a5f60dfe85b603
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b47815223b4f9ca4782c0e00c992e98f15ae542a33eac68e8e6c6c1623191b4
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd610bba7c90c85a961e40a7d7514daec7b8c7787c32a1d8db749119e9ba2abf
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b33797ce8ae3132be02bd0ce985f5848e504593ef372d953385329d1482269cb
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7d1f26e4741404952ce9aab89097b0b7807247649462dfc23eeee1570750016
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb70247b445f57abff6c9aa72fad0ca93ee144723b703865474d00010694c2f3
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ffcfe4e51edb22a24261508fbb690f135115ec379637a414f9cdc2746cd51ab
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd129a6246243304b18a4e628927a4d4f3e6581bddcb43e25624f43fa1a59c55
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6255a9bd0597c15a6e9f02e61e84b07754537f7bc1da41f6fbb812c8429386aa
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bac7c1c8559893b33dc95867596f10c6e826412667f3cb5fa53c3b85e32905c
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33744dab02da4d0ba9f95b13491968aab017b00d1f2ff1d3510e850b2132c7af
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a86066fc78b7d0429c81df10118f873fb655aa7e0d60162b6697bf5300d77e31
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:284e690b76450d0c67d18d43b27d3f3d7c53e3b7ee613747f3c43caf4766ddae
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a1c0cb21fdc12e466f067fbcea368247879f842dbfba99346878e34b5fbea21
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd5caff3f6af2f3f88b43435a502a46c62088272ccd13936c18f5323afb97fcb
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32a2f6fb2d0a4cfe376f94d63b8565c22b9ce389f9ea3019f1a7de29c43151f0
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fad5c5c1d6faaff8c19a98646da9c8f693ab7f061562f13c2a0e00bc6462d7c1
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6128777c06ae20a0ab1a47ddca1a4ac7bb790e64a7397340f24d322692c6fde7
|
3 |
+
size 32841728
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4216c91bf10ed7755b466c131af96b245913588c09b3fac73b0dd4ae7d21bea5
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78bcc10730b953652c4f2d51bf90e499aed6a962008c07bd943c49ac31870638
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb7cd7e0e000e179c7a5e600bcb07c87bb73e144a849057ea3a16490cb10813d
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a29c704a3625e53e111aadf680cc1004dbec3e67f47fcf544566ba5e67a9a388
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2caf02d6fd9dc06e48d84231c4987af4454675650b3c59c3b727100f9b40864a
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c794c29f3eff156461539213a02f7fc6f67a3c781b8eba6990f50f002d9cced
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54110a3d317e839c5bbb038651d9168749efb862c2ca00ced79f6cb3fcbc454e
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87ae251c36572213296108b58f42e6462fd8d0c309cecc2f859eb518d1633319
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d7468ebe6130b7f49f96ba7fc17f28cf742a310536fb7118421c83c03b68377
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95c879c4b98e40ef6aaa84ebd02263e9913659f8cc80c6db57282533ef55cacf
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:692fe5ca8fc987d126db56792f01d6c0e44a64f249cad45c6befe91c30504258
|
3 |
+
size 262668288
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54680316525776da97403078d23a874d435b3693ec85d3e9faca9df5d4714b7b
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a3431cdef0b1b419599cf0e349848d076425250988d9d660bc5e3fe91c201ed
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd1d85121a46a42bde9a1ad4be2c0d8b2b6fd20823602455a95556d0c5c8f486
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d7d2c1a0d6591434684fe89bfb1d31891179e9529570d9d2f9f87696ec6798
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8345c10cd0d7bedf94798e70b37490101c6239b0eebdd9bf184a3d8d02a8aca8
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0b4e1db6f8c19edfc07b09e355864deb464743866eb0b70c872f8dda8dd9aa6
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0632e368cb11a35bd30f6532fafcb64efc621b5f8f68dcd7cff8b971985a5b30
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e77603e74078d45633df71c9d504ac8ded7a79261fa72997fd0842e5b050cdd
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6eb1b7d7bc78f6956a17e4d8e50c78e1fa410ab5bbd58b24854af86bf8d7eef
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09fc6e15f5d5bf8e6f69d319d840ed83f200689b519da7e36524f3d56eac2d50
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8621c6119bc93e20a04e8ae894ba1db7f88aa11e14bc247b9f8b4e07a7e15cf
|
3 |
+
size 32833536
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c8c731d9e4afc93c34216d2c197a43264d8ff2b36ed5d108923e858e1f05193
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8146f83ca268e2ae28a564bb47f47770eb4c21566f46dca3c606ed531cc7dd8
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6131c89af2915f3416c5c15624a4861959961cfebb17c4d5a1da815f28518639
|
3 |
+
size 27271168
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b9246b0e4ec5802095d1f1c0c7a19b9ee43c53ea5149bf0fb34723e3d8ce7fd
|
3 |
+
size 29360128
|