asif00 committed on
Commit
969e769
1 Parent(s): b1afd5a

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (3) hide show
  1. README.md +6 -5
  2. adapter_config.json +7 -7
  3. adapter_model.safetensors +2 -2
README.md CHANGED
@@ -1,18 +1,19 @@
1
  ---
 
 
 
2
  language:
3
  - bn
 
4
  license: apache-2.0
 
5
  tags:
6
  - text-generation-inference
7
  - transformers
8
  - llama
9
  - trl
 
10
  inference: false
11
- base_model: unsloth/llama-3-8b-bnb-4bit
12
- library_name: transformers
13
- pipeline_tag: question-answering
14
- datasets:
15
- - iamshnoo/alpaca-cleaned-bengali
16
  ---
17
 
18
  Bangla LLaMA is a specialized model for context-based question answering and Bengali retrieval-augmented generation. It is derived from LLaMA 3 8B and trained on the iamshnoo/alpaca-cleaned-bengali dataset. This model is designed to provide accurate responses in Bengali with relevant contextual information. It is integrated with the transformers library, making it easy to use for context-based question answering and Bengali retrieval-augmented generation in projects.
 
1
  ---
2
+ base_model: unsloth/llama-3-8b-bnb-4bit
3
+ datasets:
4
+ - iamshnoo/alpaca-cleaned-bengali
5
  language:
6
  - bn
7
+ library_name: transformers
8
  license: apache-2.0
9
+ pipeline_tag: question-answering
10
  tags:
11
  - text-generation-inference
12
  - transformers
13
  - llama
14
  - trl
15
+ - unsloth
16
  inference: false
 
 
 
 
 
17
  ---
18
 
19
  Bangla LLaMA is a specialized model for context-based question answering and Bengali retrieval-augmented generation. It is derived from LLaMA 3 8B and trained on the iamshnoo/alpaca-cleaned-bengali dataset. This model is designed to provide accurate responses in Bengali with relevant contextual information. It is integrated with the transformers library, making it easy to use for context-based question answering and Bengali retrieval-augmented generation in projects.
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "unsloth/llama-3-8b-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -16,17 +16,17 @@
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 16,
20
  "rank_pattern": {},
21
- "revision": "unsloth",
22
  "target_modules": [
23
  "gate_proj",
24
- "down_proj",
25
  "o_proj",
 
26
  "q_proj",
27
- "v_proj",
28
- "up_proj",
29
- "k_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/llama-3.2-1b-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 128,
20
  "rank_pattern": {},
21
+ "revision": null,
22
  "target_modules": [
23
  "gate_proj",
24
+ "v_proj",
25
  "o_proj",
26
+ "k_proj",
27
  "q_proj",
28
+ "down_proj",
29
+ "up_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:623432d23660a6e39de5ee012cbde9514eb93ace77c2c0ef1b471ca8a742256b
3
- size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2aea5911617b6918e68bd68b077ece7ed739eecccdf89aba2954d9073abfb5
3
+ size 360740440