emeses committed on
Commit
16924a4
·
1 Parent(s): 31a6cd5

Update space

Browse files
Files changed (4) hide show
  1. .build_config +0 -6
  2. README.md +0 -10
  3. app.py +4 -3
  4. requirements.txt +5 -5
.build_config DELETED
@@ -1,6 +0,0 @@
1
- # .build_config
2
- build:
3
- cuda: "11.8"
4
- python_version: "3.10"
5
- system_packages:
6
- - "nvidia-cuda-toolkit"
 
 
 
 
 
 
 
README.md CHANGED
@@ -8,16 +8,6 @@ sdk_version: 4.19.2
8
  app_file: app.py
9
  pinned: false
10
  python_version: "3.10"
11
- cuda: "11.8"
12
- license: "mit"
13
- duplicated_from: unsloth/Llama-3.2-3B-Instruct-bnb-4bit
14
- models:
15
- - unsloth/Llama-3.2-3B-Instruct-bnb-4bit
16
- - emeses/lab2_model
17
- tags:
18
- - llama
19
- - chat
20
- - gradio
21
  ---
22
 
23
  # LLaMA Chat Interface
 
8
  app_file: app.py
9
  pinned: false
10
  python_version: "3.10"
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  # LLaMA Chat Interface
app.py CHANGED
@@ -17,16 +17,17 @@ bnb_config = BitsAndBytesConfig(
17
  load_in_4bit=True,
18
  bnb_4bit_compute_dtype=torch.float16,
19
  bnb_4bit_quant_type="nf4",
20
- bnb_4bit_use_double_quant=True,
21
  )
22
 
23
  # Load model and tokenizer
24
  base_model = AutoModelForCausalLM.from_pretrained(
25
  "unsloth/Llama-3.2-3B-Instruct-bnb-4bit",
 
26
  device_map="auto",
27
- torch_dtype=torch.float16,
28
- quantization_config=bnb_config
29
  )
 
30
  model = PeftModel.from_pretrained(base_model, "emeses/lab2_model")
31
  tokenizer = AutoTokenizer.from_pretrained("unsloth/Llama-3.2-3B-Instruct-bnb-4bit")
32
 
 
17
  load_in_4bit=True,
18
  bnb_4bit_compute_dtype=torch.float16,
19
  bnb_4bit_quant_type="nf4",
20
+ bnb_4bit_use_double_quant=True
21
  )
22
 
23
  # Load model and tokenizer
24
  base_model = AutoModelForCausalLM.from_pretrained(
25
  "unsloth/Llama-3.2-3B-Instruct-bnb-4bit",
26
+ quantization_config=bnb_config,
27
  device_map="auto",
28
+ torch_dtype=torch.float16
 
29
  )
30
+
31
  model = PeftModel.from_pretrained(base_model, "emeses/lab2_model")
32
  tokenizer = AutoTokenizer.from_pretrained("unsloth/Llama-3.2-3B-Instruct-bnb-4bit")
33
 
requirements.txt CHANGED
@@ -1,8 +1,8 @@
1
- huggingface_hub==0.25.2
2
- gradio==4.19.2
3
- transformers
4
- peft==0.7.1
5
  torch==2.1.2
 
6
  accelerate==0.26.1
7
  bitsandbytes==0.41.3
8
- torch==2.1.2
 
 
 
 
 
 
 
 
1
  torch==2.1.2
2
+ transformers==4.36.2
3
  accelerate==0.26.1
4
  bitsandbytes==0.41.3
5
+ peft==0.7.1
6
+ huggingface_hub==0.25.2
7
+ gradio==4.19.2
8
+ sentencepiece