Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- config.json +31 -0
- generation_config.json +6 -0
- model-00001-of-00189.safetensors +3 -0
- model-00002-of-00189.safetensors +3 -0
- model-00003-of-00189.safetensors +3 -0
- model-00004-of-00189.safetensors +3 -0
- model-00005-of-00189.safetensors +3 -0
- model-00006-of-00189.safetensors +3 -0
- model-00007-of-00189.safetensors +3 -0
- model-00008-of-00189.safetensors +3 -0
- model-00009-of-00189.safetensors +3 -0
- model-00010-of-00189.safetensors +3 -0
- model-00011-of-00189.safetensors +3 -0
- model-00012-of-00189.safetensors +3 -0
- model-00013-of-00189.safetensors +3 -0
- model-00014-of-00189.safetensors +3 -0
- model-00015-of-00189.safetensors +3 -0
- model-00016-of-00189.safetensors +3 -0
- model-00017-of-00189.safetensors +3 -0
- model-00018-of-00189.safetensors +3 -0
- model-00019-of-00189.safetensors +3 -0
- model-00020-of-00189.safetensors +3 -0
- model-00021-of-00189.safetensors +3 -0
- model-00022-of-00189.safetensors +3 -0
- model-00023-of-00189.safetensors +3 -0
- model-00024-of-00189.safetensors +3 -0
- model-00025-of-00189.safetensors +3 -0
- model-00026-of-00189.safetensors +3 -0
- model-00027-of-00189.safetensors +3 -0
- model-00028-of-00189.safetensors +3 -0
- model-00029-of-00189.safetensors +3 -0
- model-00030-of-00189.safetensors +3 -0
- model-00031-of-00189.safetensors +3 -0
- model-00032-of-00189.safetensors +3 -0
- model-00033-of-00189.safetensors +3 -0
- model-00034-of-00189.safetensors +3 -0
- model-00035-of-00189.safetensors +3 -0
- model-00036-of-00189.safetensors +3 -0
- model-00037-of-00189.safetensors +3 -0
- model-00038-of-00189.safetensors +3 -0
- model-00039-of-00189.safetensors +3 -0
- model-00040-of-00189.safetensors +3 -0
- model-00041-of-00189.safetensors +3 -0
- model-00042-of-00189.safetensors +3 -0
- model-00043-of-00189.safetensors +3 -0
- model-00044-of-00189.safetensors +3 -0
- model-00045-of-00189.safetensors +3 -0
- model-00046-of-00189.safetensors +3 -0
- model-00047-of-00189.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Nemotron-4-340B-Base-hf",
|
3 |
+
"architectures": [
|
4 |
+
"NemotronForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 2,
|
9 |
+
"eos_token_id": 3,
|
10 |
+
"head_dim": 192,
|
11 |
+
"hidden_act": "relu2",
|
12 |
+
"hidden_size": 18432,
|
13 |
+
"initializer_range": 0.0063,
|
14 |
+
"intermediate_size": 73728,
|
15 |
+
"max_position_embeddings": 4096,
|
16 |
+
"mlp_bias": false,
|
17 |
+
"model_type": "nemotron",
|
18 |
+
"norm_eps": 1e-05,
|
19 |
+
"num_attention_heads": 96,
|
20 |
+
"num_hidden_layers": 96,
|
21 |
+
"num_key_value_heads": 8,
|
22 |
+
"rope_percent": 0.5,
|
23 |
+
"rope_percentage": 0.5,
|
24 |
+
"rope_scaling": null,
|
25 |
+
"rope_theta": 10000,
|
26 |
+
"tie_word_embeddings": false,
|
27 |
+
"torch_dtype": "bfloat16",
|
28 |
+
"transformers_version": "4.43.0.dev0",
|
29 |
+
"use_cache": true,
|
30 |
+
"vocab_size": 256000
|
31 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 2,
|
4 |
+
"eos_token_id": 3,
|
5 |
+
"transformers_version": "4.43.0.dev0"
|
6 |
+
}
|
model-00001-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dd1ac8d1307a622364a2c4a8914f83c6294964ea8957a0ebd5e5a0ab96961b8
|
3 |
+
size 9437184144
|
model-00002-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d8f4f516d62b60c08840fbdc73fa8b921576866fd0d15ea424f2a6462f33de4
|
3 |
+
size 4190110320
|
model-00003-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0a347266866599e7a4a7944ea073e286e424baeb6ab66d48a5ac3e3fc5337c1
|
3 |
+
size 4190258216
|
model-00004-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b3f467b85bdf5949050bfd727a0a4166b39aaeb434af075babdfd23ffa5d276
|
3 |
+
size 2717909144
|
model-00005-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef9ad8c75e523111b8ca4137559bae64170d6cf8684de6c9e7407d1532566d99
|
3 |
+
size 4190258216
|
model-00006-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:609b732f836ded15eef00ae7f17fb577cb532a52cc79edb2ee6b7cb93e4ce5ea
|
3 |
+
size 2717909144
|
model-00007-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e4e0dcec2eb0b9d4bdbb149d1bb7067aeffc9416c0e30a0b6707d2a89c65121
|
3 |
+
size 4190258216
|
model-00008-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cbd8c24383bb377a082d74db6d2df253384d6c2f50ced655529e65aa042d63a
|
3 |
+
size 2717909144
|
model-00009-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f3c8f41c9579ef0b2ffdcdbcdfd08eb50f5dc3c2b0201df6c75a5dc5814d7ee
|
3 |
+
size 4190258216
|
model-00010-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40fb5ed8f19d18a9814a5cb02e34fdf96b2ac1e16b0a4e699d10fcb1ab3d366f
|
3 |
+
size 2717909144
|
model-00011-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ed282a3672baf6d1f6e2b2290b2d1ef3b82df972fe315e153dd1b687c36d1e6
|
3 |
+
size 4190258216
|
model-00012-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:338521ef8885d4c0e8efec5930e5e6bbe15a1b5e23eb65211df5a2ef3c82a2aa
|
3 |
+
size 2717909144
|
model-00013-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c623d9c8c452df9735b68d01876ff1afb10d0afa6482bd17f92fcaf4d4f364e4
|
3 |
+
size 4190258216
|
model-00014-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af5e2ac944ed77b5050cc20f275e3c38243f10e520c8ad52716fb8f84cb41aa2
|
3 |
+
size 2717909144
|
model-00015-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ef68ba06bb8f1f47767fa41de2bdfc4f0aefb4b7dbb9a6a8353aae6f0daf4f8
|
3 |
+
size 4190258216
|
model-00016-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf1683ef00f108e14124d2b819677477103189701bfa203116505c3b246aeba4
|
3 |
+
size 2717909144
|
model-00017-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5f7866f97c8c6851256ba8a4c905271787fa980296aaeb048ba98d2c4054f78
|
3 |
+
size 4190258216
|
model-00018-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cee94093cd02c2f254d94a29640fdfb8e748fcc1279c49e0057833f153cf067
|
3 |
+
size 2717909144
|
model-00019-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55dcc370cf15f7a86400210228d54596542689061b1008cd1fc70c84f7954e1c
|
3 |
+
size 4190258216
|
model-00020-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d773d64572283d7aa290e6884f9b6fa2c06f266e528126141e8752fc4ed3fce
|
3 |
+
size 2717909144
|
model-00021-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2bc142c5b7e15b443d70fd0b406f404fbaf94b1070a8ed0e2f2234a6b748cf1
|
3 |
+
size 4190258240
|
model-00022-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae6dfe5a71fe371c07c96da77584618dd312c60e04960bdbaa63743cbb23079c
|
3 |
+
size 2717909144
|
model-00023-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8e6b9f8ba35273274ce2d8fa44b51a232f63e3c03272770b481fe99ce20b535
|
3 |
+
size 4190258224
|
model-00024-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86a357f0fd41e8afa809103a1dc25a6e79fd2d878a700936624881246b0d8d25
|
3 |
+
size 2717909144
|
model-00025-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c46560584a544ea5ef1f61c2155425fefab7ed92956aa13c1c76368ac4839f9
|
3 |
+
size 4190258224
|
model-00026-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f06d38917bd209c5cb6df48c9305b27ce5bb08f0810d82a1aac0588670ee9e7f
|
3 |
+
size 2717909144
|
model-00027-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0293df2ce250853e3b4ab74fac1cd4c576bf03bd5ffa3645380527c0647c4084
|
3 |
+
size 4190258224
|
model-00028-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad4081110b4b30a8c130d4cc6902bf9ec8aba4526eacbc6affa1b90738ccc58c
|
3 |
+
size 2717909144
|
model-00029-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8ae84974bbf4364d97a2f7f4ba04ba05db660345af2f555f0b9794e3d90ab2f
|
3 |
+
size 4190258224
|
model-00030-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16f031a76b450784c8bf2ddc3b68dd3e939888320c9b6c1ac2aea0a02807e1d4
|
3 |
+
size 2717909144
|
model-00031-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0ef0e92ad95f8158b920bb31c6f5b93e6e5ae3f320a2fc8f8d196cde1638dbf
|
3 |
+
size 4190258224
|
model-00032-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7abff14d106d8c5b69a5551bfdd5a394817d20afffff203e577ee9b7790858c
|
3 |
+
size 2717909144
|
model-00033-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70768b3bfdd969a1855c967c5a33e5419aa95432bf8c45806ce64ffb2d7fd928
|
3 |
+
size 4190258224
|
model-00034-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:520ab1ce3c5c7c1f2fa05e4b4fbbcdef01494baa1873e1428ef21513893137e0
|
3 |
+
size 2717909144
|
model-00035-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cf1280acc1f456ed4eb89f4d3518d4a3c186b63a0f9db16451ec31e8b271c57
|
3 |
+
size 4190258224
|
model-00036-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46c24a8c6ee9bd26823a46eb3938f54207ccb9704b6a4fd25ef633e96fde984f
|
3 |
+
size 2717909144
|
model-00037-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f00ed95a79cae3b805d85be71934a7ee35548e4187a55d943fed69378a40130
|
3 |
+
size 4190258224
|
model-00038-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f67648e61fd81a3c73507faa73e80b04772ff079e15c0f87a0ae2cd40b25ca9
|
3 |
+
size 2717909144
|
model-00039-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eaec9bf68aabc48b5ac5b8fbb674b876c3c4d29f62da4c742d21d92cff63b38
|
3 |
+
size 4190258224
|
model-00040-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2085099d5977b84d5c68819088ce817a5bdc0f3de0fe11eeef28148d8b765a24
|
3 |
+
size 2717909144
|
model-00041-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f86446a4fe46023737ef77230cdcbda17dcabbcd4238bb177b0e6ba3ad78aee6
|
3 |
+
size 4190258224
|
model-00042-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:363be390c21bbd3d1c56b9667a413ec864245d94db6a2d1ae9947d8b997d0293
|
3 |
+
size 2717909144
|
model-00043-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21be53f91f1bafe0a22c41fed68a86a80d58cf6afdfe5199cc7dd005c42ead9c
|
3 |
+
size 4190258224
|
model-00044-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbef384f28a69290e0d7d9284f85713756d5f82bd501b608e11cb3cb66fdb85a
|
3 |
+
size 2717909144
|
model-00045-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9b09709c4ed2f5364edcaf798351ffbd6455aa3a47b72547632c58bb4f871d3
|
3 |
+
size 4190258224
|
model-00046-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8105c9a5238d8990359c4b26e796710f455ea124ea7c0302c16cf0c3acf96f6e
|
3 |
+
size 2717909144
|
model-00047-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2037b00bd90bb81a0c8297b91293813f49a5bd9dd8246d6e63ec10cac88865f
|
3 |
+
size 4190258224
|