mgoin committed on
Commit
92c10ef
1 Parent(s): 1f859fe

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See the raw diff for the complete list.
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. config.json +31 -0
  3. generation_config.json +6 -0
  4. model-00001-of-00189.safetensors +3 -0
  5. model-00002-of-00189.safetensors +3 -0
  6. model-00003-of-00189.safetensors +3 -0
  7. model-00004-of-00189.safetensors +3 -0
  8. model-00005-of-00189.safetensors +3 -0
  9. model-00006-of-00189.safetensors +3 -0
  10. model-00007-of-00189.safetensors +3 -0
  11. model-00008-of-00189.safetensors +3 -0
  12. model-00009-of-00189.safetensors +3 -0
  13. model-00010-of-00189.safetensors +3 -0
  14. model-00011-of-00189.safetensors +3 -0
  15. model-00012-of-00189.safetensors +3 -0
  16. model-00013-of-00189.safetensors +3 -0
  17. model-00014-of-00189.safetensors +3 -0
  18. model-00015-of-00189.safetensors +3 -0
  19. model-00016-of-00189.safetensors +3 -0
  20. model-00017-of-00189.safetensors +3 -0
  21. model-00018-of-00189.safetensors +3 -0
  22. model-00019-of-00189.safetensors +3 -0
  23. model-00020-of-00189.safetensors +3 -0
  24. model-00021-of-00189.safetensors +3 -0
  25. model-00022-of-00189.safetensors +3 -0
  26. model-00023-of-00189.safetensors +3 -0
  27. model-00024-of-00189.safetensors +3 -0
  28. model-00025-of-00189.safetensors +3 -0
  29. model-00026-of-00189.safetensors +3 -0
  30. model-00027-of-00189.safetensors +3 -0
  31. model-00028-of-00189.safetensors +3 -0
  32. model-00029-of-00189.safetensors +3 -0
  33. model-00030-of-00189.safetensors +3 -0
  34. model-00031-of-00189.safetensors +3 -0
  35. model-00032-of-00189.safetensors +3 -0
  36. model-00033-of-00189.safetensors +3 -0
  37. model-00034-of-00189.safetensors +3 -0
  38. model-00035-of-00189.safetensors +3 -0
  39. model-00036-of-00189.safetensors +3 -0
  40. model-00037-of-00189.safetensors +3 -0
  41. model-00038-of-00189.safetensors +3 -0
  42. model-00039-of-00189.safetensors +3 -0
  43. model-00040-of-00189.safetensors +3 -0
  44. model-00041-of-00189.safetensors +3 -0
  45. model-00042-of-00189.safetensors +3 -0
  46. model-00043-of-00189.safetensors +3 -0
  47. model-00044-of-00189.safetensors +3 -0
  48. model-00045-of-00189.safetensors +3 -0
  49. model-00046-of-00189.safetensors +3 -0
  50. model-00047-of-00189.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Nemotron-4-340B-Base-hf",
3
+ "architectures": [
4
+ "NemotronForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 3,
10
+ "head_dim": 192,
11
+ "hidden_act": "relu2",
12
+ "hidden_size": 18432,
13
+ "initializer_range": 0.0063,
14
+ "intermediate_size": 73728,
15
+ "max_position_embeddings": 4096,
16
+ "mlp_bias": false,
17
+ "model_type": "nemotron",
18
+ "norm_eps": 1e-05,
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 96,
21
+ "num_key_value_heads": 8,
22
+ "rope_percent": 0.5,
23
+ "rope_percentage": 0.5,
24
+ "rope_scaling": null,
25
+ "rope_theta": 10000,
26
+ "tie_word_embeddings": false,
27
+ "torch_dtype": "bfloat16",
28
+ "transformers_version": "4.43.0.dev0",
29
+ "use_cache": true,
30
+ "vocab_size": 256000
31
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 3,
5
+ "transformers_version": "4.43.0.dev0"
6
+ }
model-00001-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dd1ac8d1307a622364a2c4a8914f83c6294964ea8957a0ebd5e5a0ab96961b8
3
+ size 9437184144
model-00002-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d8f4f516d62b60c08840fbdc73fa8b921576866fd0d15ea424f2a6462f33de4
3
+ size 4190110320
model-00003-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0a347266866599e7a4a7944ea073e286e424baeb6ab66d48a5ac3e3fc5337c1
3
+ size 4190258216
model-00004-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3f467b85bdf5949050bfd727a0a4166b39aaeb434af075babdfd23ffa5d276
3
+ size 2717909144
model-00005-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef9ad8c75e523111b8ca4137559bae64170d6cf8684de6c9e7407d1532566d99
3
+ size 4190258216
model-00006-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:609b732f836ded15eef00ae7f17fb577cb532a52cc79edb2ee6b7cb93e4ce5ea
3
+ size 2717909144
model-00007-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e4e0dcec2eb0b9d4bdbb149d1bb7067aeffc9416c0e30a0b6707d2a89c65121
3
+ size 4190258216
model-00008-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cbd8c24383bb377a082d74db6d2df253384d6c2f50ced655529e65aa042d63a
3
+ size 2717909144
model-00009-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f3c8f41c9579ef0b2ffdcdbcdfd08eb50f5dc3c2b0201df6c75a5dc5814d7ee
3
+ size 4190258216
model-00010-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40fb5ed8f19d18a9814a5cb02e34fdf96b2ac1e16b0a4e699d10fcb1ab3d366f
3
+ size 2717909144
model-00011-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed282a3672baf6d1f6e2b2290b2d1ef3b82df972fe315e153dd1b687c36d1e6
3
+ size 4190258216
model-00012-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:338521ef8885d4c0e8efec5930e5e6bbe15a1b5e23eb65211df5a2ef3c82a2aa
3
+ size 2717909144
model-00013-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c623d9c8c452df9735b68d01876ff1afb10d0afa6482bd17f92fcaf4d4f364e4
3
+ size 4190258216
model-00014-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af5e2ac944ed77b5050cc20f275e3c38243f10e520c8ad52716fb8f84cb41aa2
3
+ size 2717909144
model-00015-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef68ba06bb8f1f47767fa41de2bdfc4f0aefb4b7dbb9a6a8353aae6f0daf4f8
3
+ size 4190258216
model-00016-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf1683ef00f108e14124d2b819677477103189701bfa203116505c3b246aeba4
3
+ size 2717909144
model-00017-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5f7866f97c8c6851256ba8a4c905271787fa980296aaeb048ba98d2c4054f78
3
+ size 4190258216
model-00018-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cee94093cd02c2f254d94a29640fdfb8e748fcc1279c49e0057833f153cf067
3
+ size 2717909144
model-00019-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55dcc370cf15f7a86400210228d54596542689061b1008cd1fc70c84f7954e1c
3
+ size 4190258216
model-00020-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d773d64572283d7aa290e6884f9b6fa2c06f266e528126141e8752fc4ed3fce
3
+ size 2717909144
model-00021-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2bc142c5b7e15b443d70fd0b406f404fbaf94b1070a8ed0e2f2234a6b748cf1
3
+ size 4190258240
model-00022-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae6dfe5a71fe371c07c96da77584618dd312c60e04960bdbaa63743cbb23079c
3
+ size 2717909144
model-00023-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e6b9f8ba35273274ce2d8fa44b51a232f63e3c03272770b481fe99ce20b535
3
+ size 4190258224
model-00024-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86a357f0fd41e8afa809103a1dc25a6e79fd2d878a700936624881246b0d8d25
3
+ size 2717909144
model-00025-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c46560584a544ea5ef1f61c2155425fefab7ed92956aa13c1c76368ac4839f9
3
+ size 4190258224
model-00026-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f06d38917bd209c5cb6df48c9305b27ce5bb08f0810d82a1aac0588670ee9e7f
3
+ size 2717909144
model-00027-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0293df2ce250853e3b4ab74fac1cd4c576bf03bd5ffa3645380527c0647c4084
3
+ size 4190258224
model-00028-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad4081110b4b30a8c130d4cc6902bf9ec8aba4526eacbc6affa1b90738ccc58c
3
+ size 2717909144
model-00029-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ae84974bbf4364d97a2f7f4ba04ba05db660345af2f555f0b9794e3d90ab2f
3
+ size 4190258224
model-00030-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f031a76b450784c8bf2ddc3b68dd3e939888320c9b6c1ac2aea0a02807e1d4
3
+ size 2717909144
model-00031-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0ef0e92ad95f8158b920bb31c6f5b93e6e5ae3f320a2fc8f8d196cde1638dbf
3
+ size 4190258224
model-00032-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7abff14d106d8c5b69a5551bfdd5a394817d20afffff203e577ee9b7790858c
3
+ size 2717909144
model-00033-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70768b3bfdd969a1855c967c5a33e5419aa95432bf8c45806ce64ffb2d7fd928
3
+ size 4190258224
model-00034-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:520ab1ce3c5c7c1f2fa05e4b4fbbcdef01494baa1873e1428ef21513893137e0
3
+ size 2717909144
model-00035-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf1280acc1f456ed4eb89f4d3518d4a3c186b63a0f9db16451ec31e8b271c57
3
+ size 4190258224
model-00036-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46c24a8c6ee9bd26823a46eb3938f54207ccb9704b6a4fd25ef633e96fde984f
3
+ size 2717909144
model-00037-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f00ed95a79cae3b805d85be71934a7ee35548e4187a55d943fed69378a40130
3
+ size 4190258224
model-00038-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f67648e61fd81a3c73507faa73e80b04772ff079e15c0f87a0ae2cd40b25ca9
3
+ size 2717909144
model-00039-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eaec9bf68aabc48b5ac5b8fbb674b876c3c4d29f62da4c742d21d92cff63b38
3
+ size 4190258224
model-00040-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2085099d5977b84d5c68819088ce817a5bdc0f3de0fe11eeef28148d8b765a24
3
+ size 2717909144
model-00041-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f86446a4fe46023737ef77230cdcbda17dcabbcd4238bb177b0e6ba3ad78aee6
3
+ size 4190258224
model-00042-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:363be390c21bbd3d1c56b9667a413ec864245d94db6a2d1ae9947d8b997d0293
3
+ size 2717909144
model-00043-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21be53f91f1bafe0a22c41fed68a86a80d58cf6afdfe5199cc7dd005c42ead9c
3
+ size 4190258224
model-00044-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbef384f28a69290e0d7d9284f85713756d5f82bd501b608e11cb3cb66fdb85a
3
+ size 2717909144
model-00045-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b09709c4ed2f5364edcaf798351ffbd6455aa3a47b72547632c58bb4f871d3
3
+ size 4190258224
model-00046-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8105c9a5238d8990359c4b26e796710f455ea124ea7c0302c16cf0c3acf96f6e
3
+ size 2717909144
model-00047-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2037b00bd90bb81a0c8297b91293813f49a5bd9dd8246d6e63ec10cac88865f
3
+ size 4190258224