Upload model trained with Unsloth

Upload model trained with Unsloth 2x faster

Files changed (3) hide show

README.md CHANGED Viewed

@@ -1,18 +1,19 @@
 ---
 language:
 - bn
 license: apache-2.0
 tags:
 - text-generation-inference
 - transformers
 - llama
 - trl
 inference: false
-base_model: unsloth/llama-3-8b-bnb-4bit
-library_name: transformers
-pipeline_tag: question-answering
-datasets:
-- iamshnoo/alpaca-cleaned-bengali
 ---
 Bangla LLaMA is a specialized model for context-based question answering and Bengali retrieval-augmented generation (RAG). It is derived from LLaMA 3 8B and trained on the iamshnoo/alpaca-cleaned-bengali dataset. This model is designed to provide accurate responses in Bengali with relevant contextual information. It is integrated with the transformers library, making it easy to use in projects that need context-based question answering or Bengali retrieval-augmented generation.

 ---
+base_model: unsloth/llama-3-8b-bnb-4bit
+datasets:
+- iamshnoo/alpaca-cleaned-bengali
 language:
 - bn
+library_name: transformers
 license: apache-2.0
+pipeline_tag: question-answering
 tags:
 - text-generation-inference
 - transformers
 - llama
 - trl
+- unsloth
 inference: false
 ---
 Bangla LLaMA is a specialized model for context-based question answering and Bengali retrieval-augmented generation (RAG). It is derived from LLaMA 3 8B and trained on the iamshnoo/alpaca-cleaned-bengali dataset. This model is designed to provide accurate responses in Bengali with relevant contextual information. It is integrated with the transformers library, making it easy to use in projects that need context-based question answering or Bengali retrieval-augmented generation.

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "unsloth/llama-3-8b-bnb-4bit",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -16,17 +16,17 @@
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 16,
   "rank_pattern": {},
-  "revision": "unsloth",
   "target_modules": [
     "gate_proj",
-    "down_proj",
     "o_proj",
     "q_proj",
-    "v_proj",
-    "up_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "unsloth/llama-3.2-1b-bnb-4bit",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 128,
   "rank_pattern": {},
+  "revision": null,
   "target_modules": [
     "gate_proj",
+    "v_proj",
     "o_proj",
+    "k_proj",
     "q_proj",
+    "down_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:623432d23660a6e39de5ee012cbde9514eb93ace77c2c0ef1b471ca8a742256b
-size 167832240

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff2aea5911617b6918e68bd68b077ece7ed739eecccdf89aba2954d9073abfb5
+size 360740440