mobinln committed on
Commit
6482c59
1 Parent(s): 654cf40

change to qwen2 0.5B fp16

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -1,10 +1,10 @@
1
  import gradio as gr
2
  from llama_cpp import Llama
3
 
4
- model = "Qwen/Qwen2-7B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
- filename="qwen2-7b-instruct-q4_k_m.gguf",
8
  verbose=True,
9
  use_mmap=False,
10
  use_mlock=True,
 
1
  import gradio as gr
2
  from llama_cpp import Llama
3
 
4
+ model = "Qwen/Qwen2-0.5B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
+ filename="qwen2-0_5b-instruct-fp16.gguf",
8
  verbose=True,
9
  use_mmap=False,
10
  use_mlock=True,