theodotus committed on
Commit
aa251d2
·
1 Parent(s): cf610a7

Use k-quant model

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -19,7 +19,7 @@ def generate(history):
19
  return streamer
20
 
21
 
22
- llm = AutoModelForCausalLM.from_pretrained("theodotus/llama-uk", model_file="model_q4_1.bin", model_type='llama')
23
  end_token = "</s>"
24
 
25
 
 
19
  return streamer
20
 
21
 
22
+ llm = AutoModelForCausalLM.from_pretrained("theodotus/llama-uk", model_file="model.bin", model_type='llama')
23
  end_token = "</s>"
24
 
25