Upload folder using huggingface_hub
#2
by
at676
- opened
- config.json +52 -0
- generation_config.json +12 -0
- model-00001-of-00044.safetensors +3 -0
- model-00002-of-00044.safetensors +3 -0
- model-00003-of-00044.safetensors +3 -0
- model-00004-of-00044.safetensors +3 -0
- model-00005-of-00044.safetensors +3 -0
- model-00006-of-00044.safetensors +3 -0
- model-00007-of-00044.safetensors +3 -0
- model-00008-of-00044.safetensors +3 -0
- model-00009-of-00044.safetensors +3 -0
- model-00010-of-00044.safetensors +3 -0
- model-00011-of-00044.safetensors +3 -0
- model-00012-of-00044.safetensors +3 -0
- model-00013-of-00044.safetensors +3 -0
- model-00014-of-00044.safetensors +3 -0
- model-00015-of-00044.safetensors +3 -0
- model-00016-of-00044.safetensors +3 -0
- model-00017-of-00044.safetensors +3 -0
- model-00018-of-00044.safetensors +3 -0
- model-00019-of-00044.safetensors +3 -0
- model-00020-of-00044.safetensors +3 -0
- model-00021-of-00044.safetensors +3 -0
- model-00022-of-00044.safetensors +3 -0
- model-00023-of-00044.safetensors +3 -0
- model-00024-of-00044.safetensors +3 -0
- model-00025-of-00044.safetensors +3 -0
- model-00026-of-00044.safetensors +3 -0
- model-00027-of-00044.safetensors +3 -0
- model-00028-of-00044.safetensors +3 -0
- model-00029-of-00044.safetensors +3 -0
- model-00030-of-00044.safetensors +3 -0
- model-00031-of-00044.safetensors +3 -0
- model-00032-of-00044.safetensors +3 -0
- model-00033-of-00044.safetensors +3 -0
- model-00034-of-00044.safetensors +3 -0
- model-00035-of-00044.safetensors +3 -0
- model-00036-of-00044.safetensors +3 -0
- model-00037-of-00044.safetensors +3 -0
- model-00038-of-00044.safetensors +3 -0
- model-00039-of-00044.safetensors +3 -0
- model-00040-of-00044.safetensors +3 -0
- model-00041-of-00044.safetensors +3 -0
- model-00042-of-00044.safetensors +3 -0
- model-00043-of-00044.safetensors +3 -0
- model-00044-of-00044.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 16384,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 53248,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 128,
|
23 |
+
"num_hidden_layers": 126,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"quip_params": {
|
27 |
+
"K": 4,
|
28 |
+
"L": 16,
|
29 |
+
"V": 2,
|
30 |
+
"codebook": "bitshift",
|
31 |
+
"codebook_version": 0,
|
32 |
+
"decode_mode": "quantlut_sym",
|
33 |
+
"split_for_tp": true,
|
34 |
+
"td_x": 16,
|
35 |
+
"td_y": 16,
|
36 |
+
"tlut_bits": 9
|
37 |
+
},
|
38 |
+
"rms_norm_eps": 1e-05,
|
39 |
+
"rope_scaling": {
|
40 |
+
"factor": 8.0,
|
41 |
+
"high_freq_factor": 4.0,
|
42 |
+
"low_freq_factor": 1.0,
|
43 |
+
"original_max_position_embeddings": 8192,
|
44 |
+
"rope_type": "llama3"
|
45 |
+
},
|
46 |
+
"rope_theta": 500000.0,
|
47 |
+
"tie_word_embeddings": false,
|
48 |
+
"torch_dtype": "bfloat16",
|
49 |
+
"transformers_version": "4.45.2",
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 128256
|
52 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.45.2"
|
12 |
+
}
|
model-00001-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb853e920c912c15bb8ab443fa85a3b576df35fc8e8a4de0bf5d2239d7356295
|
3 |
+
size 4924644256
|
model-00002-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dd0f7a7f2455adff7ea0a639731150448552665f140e15ce917ffcaa647ce0b
|
3 |
+
size 4784559328
|
model-00003-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:734df5954bca402b4d78aaadb45838c93d92e7c38f6dab699013419e6623aec7
|
3 |
+
size 4784559328
|
model-00004-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59b067068fe8f0901c5c90e40e157625e4b25fa1d09676c067200e0d88da2889
|
3 |
+
size 4784559328
|
model-00005-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cce82a14e1d994c2de72614bbd140d1518b7ca70f4826d148d090499b36c134
|
3 |
+
size 4784559432
|
model-00006-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0650eaeb15263f425d02d2e90282adc9aac9c7f095bfd45892dbf7dbd47d48b6
|
3 |
+
size 4784559440
|
model-00007-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e6de5b0ecabcca7cac410b54c34344f10a0893380e444726d4be33cbd7c25b5
|
3 |
+
size 4784559440
|
model-00008-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2349d4beb027962816aa8ed1db56f02050ec7a57c48688241a68b1125ce6f14
|
3 |
+
size 4784559440
|
model-00009-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bc923acb7a2c379d906fb0c741be85403547408ad7093b0618e0171d61592a4
|
3 |
+
size 4784559440
|
model-00010-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:715d75d8fd437a626351a74b8b792d87bf2be2f63acb9486ea14eb0258844f04
|
3 |
+
size 4784559440
|
model-00011-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45f55b3fb4506c09c5584897129659a1af467bae772804e5e8686f9ff8a29194
|
3 |
+
size 4784559440
|
model-00012-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:070ac6ba6038eaddf3566e13f6d87c13abb1530ddcfe09f4ef47718cabb75c56
|
3 |
+
size 4784559440
|
model-00013-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:199062beeecc7eac2672ca19385c44c8516fd9ec8752e8bd58c8df1fe61992f4
|
3 |
+
size 4784559440
|
model-00014-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:320feefcda9ee6bbf7843567787b8e2187a62c50d81c12a53260bebe9e8de3f6
|
3 |
+
size 4784559440
|
model-00015-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29a8715edfd24f0ef757c88578d0317a8a012f2c40a88bfdc13c51792571fe32
|
3 |
+
size 4784559440
|
model-00016-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f28d9e69c7274e5d9c1ef4cb6109084780427db518e6364c680e8e64ff063780
|
3 |
+
size 4784559440
|
model-00017-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10d8706fcc5536b4ee298b756b820385882e8029d00812e9fa9a509561bddf40
|
3 |
+
size 4784559440
|
model-00018-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80a71d23a392c7c51c80f5790ba04326fff05311e77ced5dfb1fa7d5721b15a5
|
3 |
+
size 4784559440
|
model-00019-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06384a4bba1a5037dc9edae615ab8182b6f1b2be54a810e2e7eaa1381557489e
|
3 |
+
size 4784559440
|
model-00020-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:030313ca91deb44a17e47cfd97606767d0ec55982aef63d9b4ba19517e6385ad
|
3 |
+
size 4784559440
|
model-00021-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5275cef1047bccb0fdc882b6752a32aa2f3c26b6427d4b92c13e1e6e83b1e385
|
3 |
+
size 4784559440
|
model-00022-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddaed62e5aa9ddba18b8923663d46c83153431fe8d5883b2e97609c3aad750ee
|
3 |
+
size 4784559440
|
model-00023-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d85ea44149d6f535a11093f850cb0b4e5d2babc1e12c51e333c2e3ba7e0bc52
|
3 |
+
size 4784559440
|
model-00024-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:534e1d00b14eeac998844d24174bebbd3ee22ed8c1a02d77502dcb6aba77b9c7
|
3 |
+
size 4784559440
|
model-00025-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f312d4c84e05e7c4061f000fabdab1eb66f0e0ccc80173cf092ea993560fa75
|
3 |
+
size 4784559440
|
model-00026-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab8eb73f87d7ec1c8ee92140cf1f479aa2ae02d48016fdc6f11ae8149266bf6a
|
3 |
+
size 4784559440
|
model-00027-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbb8c10de4ba138cb5b75ab1c9178688e0c9dc016bd57446830682e5231f70e3
|
3 |
+
size 4784559440
|
model-00028-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e63e4952f613ae073b5aba84cb0b667df1060d3a257bd3bad674e2cbb763cf06
|
3 |
+
size 4784559440
|
model-00029-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42ddeaddec8bb34d79b0d037eeb58fc198b38911216f08ad94c2bbab328b1844
|
3 |
+
size 4784559440
|
model-00030-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d55738921485b99e0ba422f18263b3b16fb246fa830e38acd609b4e6a39237bb
|
3 |
+
size 4784559440
|
model-00031-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1eb091533a64700e483ca482a9b7a2a196f798fb96ad034054ddf94e8b15035
|
3 |
+
size 4784559440
|
model-00032-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d061e15a2104288a8cdd6c79043815c9a19f110002a1b4147c667230eb73dbd6
|
3 |
+
size 4784559440
|
model-00033-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d97a2a798b8854d202aab917e9e599f4152f69da0ef066f691a541bad5f607fb
|
3 |
+
size 4784559440
|
model-00034-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3db508eea5c86933fcc36f64eaf8ce48ab09b7a91e96985bd2c350fe3515a509
|
3 |
+
size 4784559440
|
model-00035-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:978eadb283a16c0f09de96855cdcc1cb699432d9cdd6842bfa32c1a4ec3e080b
|
3 |
+
size 4784559544
|
model-00036-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:598baee728eb850230af4ceec480bd016727a927c84ce0372454a37b4979e65a
|
3 |
+
size 4784559552
|
model-00037-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2861f7c4ecbab987c1b6223c88f769f825be950653f1aeac183366ab7b3574a7
|
3 |
+
size 4784559552
|
model-00038-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a14300eab5e140f012c8430e7268077174bdc5f64786fc3574bdf0fa58519425
|
3 |
+
size 4784559552
|
model-00039-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c167a62089f3d8846f6e5f2d8a6aebe0c4d88911d1b3877ae860e73022060c1d
|
3 |
+
size 4784559552
|
model-00040-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2396809fffd0accaac360308ccbf1facd2d587b3fe93f15f84a63b0cff5b2e2f
|
3 |
+
size 4784559552
|
model-00041-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cdae08a1ae3b7ef15aa1ebfdd22fc7faafabd18366b110a92d9dc73cf2466c0
|
3 |
+
size 4784559552
|
model-00042-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8266584f0dbec606b412e7b52bb7d27c2d65352dde1b6b24b64dd617b773648
|
3 |
+
size 4784559552
|
model-00043-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00736c83503d93a500a8df46e93d657b5a3154c5812fe58314e8d218dedf53ad
|
3 |
+
size 4062640880
|
model-00044-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
|
3 |
+
size 4202692736
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|