Trained with Unsloth

Files changed (7) hide show

README.md CHANGED Viewed

@@ -1,11 +1,11 @@
 ---
 library_name: transformers
 tags:
 - unsloth
 - trl
 - sft
 - gita
-license: mit
 pipeline_tag: text-generation
 ---

 ---
+license: mit
 library_name: transformers
 tags:
 - unsloth
 - trl
 - sft
 - gita
 pipeline_tag: text-generation
 ---

config.json CHANGED Viewed

@@ -1,3 +1,28 @@
 {
-    "model_type": "mistral"
-}

 {
+  "_name_or_path": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 14336,
+  "max_position_embeddings": 32768,
+  "model_type": "mistral",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "num_key_value_heads": 8,
+  "pad_token_id": 770,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float16",
+  "transformers_version": "4.41.1",
+  "unsloth_version": "2024.5",
+  "use_cache": true,
+  "vocab_size": 32768
+}

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.40.2"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.41.1"
 }

pytorch_model-00001-of-00003.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:deb7af504efcbdb428e7459d1ec98ab018d3b553690b39c66d3c58e491bc1e1e
-size 4943185632

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb56b08940932622280e73e282ca772b27623d32a0f065c33b4edde55f14117a
+size 4949477088

pytorch_model-00002-of-00003.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f2e2e010ade345070d3751c5cc09875d31eeb2bd84ef80ef3fca2a013533915
-size 4999844040

 version https://git-lfs.github.com/spec/v1
+oid sha256:6b962e76ed33df30882366137508a3c58ec7de9504cbb8cb75be19e4f145a99d
+size 4999844296

pytorch_model-00003-of-00003.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77a8e22e64a7474f5b6bc8c79572f36918bd0869ab5830b501d00da8da6bb88a
-size 4540536454

 version https://git-lfs.github.com/spec/v1
+oid sha256:13f693b0c809a0cfd8df491678932bf8afb58831f69baab7b472fedcd9997e95
+size 4546827910

pytorch_model.bin.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 14483464192
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00003-of-00003.bin",

 {
   "metadata": {
+    "total_size": 14496047104
   },
   "weight_map": {
     "lm_head.weight": "pytorch_model-00003-of-00003.bin",