Yash Sachdeva committed
Commit b63fd3c · 1 Parent(s): 37111b2

download llama

Files changed (2):
  1. Dockerfile +1 -2
  2. question_paper.py +1 -1
Dockerfile CHANGED
@@ -18,8 +18,7 @@ RUN pip install accelerate
 
 # Install hugging face hub to download llama2 model
 RUN pip install --upgrade huggingface_hub
-RUN huggingface-cli download TheBloke/Llama-2-7b-Chat-GGUF llama-2-7b.Q4_K_M.gguf --local-dir . --local-dir-use-symlinks False
-
+RUN huggingface-cli download TheBloke/Llama-2-7b-Chat-GGUF llama-2-7b-chat.Q4_K_M.gguf --local-dir . --local-dir-use-symlinks False
 
 RUN CMAKE_ARGS="-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS" pip install 'llama-cpp-python[server]' --upgrade --force-reinstall --no-cache-dir
 # Install requirements.txt
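
Note: the same download step can be reproduced from Python with huggingface_hub's hf_hub_download — a minimal sketch, assuming only that huggingface_hub is installed as the Dockerfile does; the repo id and filename come from the RUN line above, the print is illustrative:

    # Sketch: programmatic equivalent of the huggingface-cli download step above.
    from huggingface_hub import hf_hub_download

    model_path = hf_hub_download(
        repo_id="TheBloke/Llama-2-7b-Chat-GGUF",   # same repo as the RUN line
        filename="llama-2-7b-chat.Q4_K_M.gguf",    # corrected chat-model filename
        local_dir=".",                             # place the file next to the app
    )
    print(model_path)  # e.g. ./llama-2-7b-chat.Q4_K_M.gguf

The commit's actual fix is just the filename: the repo TheBloke/Llama-2-7b-Chat-GGUF contains the chat variant, so the file is llama-2-7b-chat.Q4_K_M.gguf, not llama-2-7b.Q4_K_M.gguf.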
question_paper.py CHANGED
@@ -14,7 +14,7 @@ app = FastAPI()
 @app.get("/")
 def llama():
     llm = Llama(
-        model_path="./llama-2-7b.Q4_K_M.gguf",
+        model_path="./llama-2-7b-chat.Q4_K_M.gguf",
         # n_gpu_layers=-1, # Uncomment to use GPU acceleration
         # seed=1337, # Uncomment to set a specific seed
         # n_ctx=2048, # Uncomment to increase the context window
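
For context, a minimal sketch of how the patched endpoint could serve a completion with the downloaded GGUF file, assuming llama-cpp-python's standard call interface — only model_path comes from this commit; the prompt, max_tokens, and stop values are illustrative:

    # Sketch: endpoint using the model file fetched in the Dockerfile.
    from fastapi import FastAPI
    from llama_cpp import Llama

    app = FastAPI()

    @app.get("/")
    def llama():
        llm = Llama(
            model_path="./llama-2-7b-chat.Q4_K_M.gguf",  # filename fixed by this commit
        )
        # llama-cpp-python returns an OpenAI-style completion dict
        output = llm(
            "Q: Name the planets in the solar system. A: ",  # illustrative prompt
            max_tokens=64,
            stop=["Q:", "\n"],
        )
        return output["choices"][0]["text"]

Since the model path is resolved relative to the working directory, this only works if the Dockerfile's --local-dir matches where the app runs.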