Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +88 -0
generation_config.json +6 -0
onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +132 -0

config.json ADDED Viewed

	@@ -0,0 +1,88 @@

+{
+  "_name_or_path": "apple/OpenELM-270M-Instruct",
+  "activation_fn_name": "swish",
+  "architectures": [
+    "OpenELMForCausalLM"
+  ],
+  "auto_map": {
+    "AutoConfig": "apple/OpenELM-270M-Instruct--configuration_openelm.OpenELMConfig",
+    "AutoModelForCausalLM": "apple/OpenELM-270M-Instruct--modeling_openelm.OpenELMForCausalLM"
+  },
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "ffn_dim_divisor": 256,
+  "ffn_multipliers": [
+    0.5,
+    0.73,
+    0.97,
+    1.2,
+    1.43,
+    1.67,
+    1.9,
+    2.13,
+    2.37,
+    2.6,
+    2.83,
+    3.07,
+    3.3,
+    3.53,
+    3.77,
+    4.0
+  ],
+  "ffn_with_glu": true,
+  "head_dim": 64,
+  "initializer_range": 0.02,
+  "max_context_length": 2048,
+  "model_dim": 1280,
+  "model_type": "openelm",
+  "normalization_layer_name": "rms_norm",
+  "normalize_qk_projections": true,
+  "num_gqa_groups": 4,
+  "num_kv_heads": [
+    3,
+    3,
+    3,
+    3,
+    3,
+    4,
+    4,
+    4,
+    4,
+    4,
+    4,
+    4,
+    5,
+    5,
+    5,
+    5
+  ],
+  "num_query_heads": [
+    12,
+    12,
+    12,
+    12,
+    12,
+    16,
+    16,
+    16,
+    16,
+    16,
+    16,
+    16,
+    20,
+    20,
+    20,
+    20
+  ],
+  "num_transformer_layers": 16,
+  "qkv_multipliers": [
+    0.5,
+    1.0
+  ],
+  "rope_freq_constant": 10000,
+  "rope_max_length": 4096,
+  "share_input_output_layers": true,
+  "transformers_version": "4.38.2",
+  "use_cache": true,
+  "vocab_size": 32000
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.38.2"
+}

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:630b4b8d4aac990e2b169e0928a109bd925e29343da2510f05eedcc28433ad18
+size 1256920099

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:220cb57c43b1e6e33c2cd10a56717babb0f223057245899d52d3be15136151c4
+size 323707915

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:09b3a233192aab4f6837d318009808e3188abba7ae91e5b9c9c776765d764145
+size 631188025

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e05c62d2de6c20bc60d3058a7d93c8924c8a88d7439ab120de03427fd3feaac6
+size 319957458

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2cf69419c4b9fbba0c9fe57bb764f8d205abfc53d1a473759bb3bb6ec8ea94be
+size 340675066

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e05c62d2de6c20bc60d3058a7d93c8924c8a88d7439ab120de03427fd3feaac6
+size 319957458

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d34a694969e060ed90aa0cde42991b12af108c2f08c16cce1e9c27958e256c2
+size 319957487

quantize_config.json ADDED Viewed

	@@ -0,0 +1,132 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}