radames committed on
Commit
de33e52
1 Parent(s): b670baa

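Update app.py: switch the default model from the GGML build (TheBloke/Llama-2-7B-Chat-GGML, llama-2-7b-chat.ggmlv3.q5_0.bin) to the GGUF build (TheBloke/Llama-2-7b-Chat-GGUF, llama-2-7b-chat.Q5_0.gguf)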

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -9,8 +9,8 @@ from huggingface_hub import hf_hub_download
9
 
10
  llm = Llama(
11
  model_path=hf_hub_download(
12
- repo_id=os.environ.get("REPO_ID", "TheBloke/Llama-2-7B-Chat-GGML"),
13
- filename=os.environ.get("MODEL_FILE", "llama-2-7b-chat.ggmlv3.q5_0.bin"),
14
  ),
15
  n_ctx=2048,
16
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
 
9
 
10
  llm = Llama(
11
  model_path=hf_hub_download(
12
+ repo_id=os.environ.get("REPO_ID", "TheBloke/Llama-2-7b-Chat-GGUF"),
13
+ filename=os.environ.get("MODEL_FILE", "llama-2-7b-chat.Q5_0.gguf"),
14
  ),
15
  n_ctx=2048,
16
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM