whoami02 committed on
Commit
4290234
·
1 Parent(s): 951f486

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -4,7 +4,7 @@ import gradio as gr
4
  # from llama_cpp import Llama
5
  from langchain.llms import llamacpp
6
  from huggingface_hub import login, hf_hub_download
7
- from dotenv import load_dotenv, find_dotenv
8
 
9
  MODEL_ID = "TheBloke/Llama-2-7b-Chat-GGUF"
10
  MODEL_BASENAME = "llama-2-7b-chat.Q4_K_M.gguf"
@@ -13,7 +13,8 @@ MODEL_BASENAME = "llama-2-7b-chat.Q4_K_M.gguf"
13
  CONTEXT_WINDOW_SIZE = 8000
14
  MAX_NEW_TOKENS = 2000
15
  N_BATCH = 128
16
- load_dotenv(find_dotenv(hf_token))
 
17
  def load_quantized_model(model_id, model_basename):
18
  try:
19
  model_path = hf_hub_download(
 
4
  # from llama_cpp import Llama
5
  from langchain.llms import llamacpp
6
  from huggingface_hub import login, hf_hub_download
7
+ # from dotenv import load_dotenv, find_dotenv
8
 
9
  MODEL_ID = "TheBloke/Llama-2-7b-Chat-GGUF"
10
  MODEL_BASENAME = "llama-2-7b-chat.Q4_K_M.gguf"
 
13
  CONTEXT_WINDOW_SIZE = 8000
14
  MAX_NEW_TOKENS = 2000
15
  N_BATCH = 128
16
+
17
+ os.getenv("hf_token")
18
  def load_quantized_model(model_id, model_basename):
19
  try:
20
  model_path = hf_hub_download(