radames committed on
Commit
ae0a725
1 Parent(s): 88cf25d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -1,3 +1,4 @@
 
1
  import gradio as gr
2
  import copy
3
  import time
@@ -8,8 +9,8 @@ from huggingface_hub import hf_hub_download
8
 
9
  llm = Llama(
10
  model_path=hf_hub_download(
11
- repo_id="TheBloke/Llama-2-7B-Chat-GGML",
12
- filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
13
  ),
14
  n_ctx=2048,
15
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
 
1
+ import os
2
  import gradio as gr
3
  import copy
4
  import time
 
9
 
10
  llm = Llama(
11
  model_path=hf_hub_download(
12
+ repo_id=os.environ.get("REPO_ID", "TheBloke/Llama-2-7B-Chat-GGML"),
13
+ filename=os.environ.get("MODEL_FILE", "llama-2-7b-chat.ggmlv3.q5_0.bin"),
14
  ),
15
  n_ctx=2048,
16
  n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM