pabloce committed on
Commit
20f7e9c
·
verified ·
1 Parent(s): 9c5c4b3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -9,7 +9,7 @@ from llama_cpp_agent.providers import LlamaCppPythonProvider
9
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
10
  """
11
  # client = InferenceClient("cognitivecomputations/dolphin-2.8-mistral-7b-v02")
12
- llama_model = Llama(r"Meta-Llama-3-8B.Q5_K_M.gguf", n_batch=1024, n_threads=10, n_gpu_layers=33, n_ctx=8192, verbose=False)
13
 
14
  provider = LlamaCppPythonProvider(llama_model)
15
 
 
9
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
10
  """
11
  # client = InferenceClient("cognitivecomputations/dolphin-2.8-mistral-7b-v02")
12
+ llama_model = Llama(r"Meta-Llama-3-8B.Q5_K_M.gguf", n_batch=1024, n_threads=4, n_gpu_layers=33, n_ctx=8192, verbose=False)
13
 
14
  provider = LlamaCppPythonProvider(llama_model)
15