Hackoor committed on
Commit
f23396e
·
1 Parent(s): 8e02412

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -70,7 +70,7 @@ def create_conversational_chain(vector_store):
70
  load_dotenv()
71
  # Create llm
72
  llm = CTransformers(streaming=True,
73
- model = AutoModelForCausalLM.from_pretrained("NousResearch/Nous-Hermes-llama-2-7b", device_map='auto',torch_dtype=torch.float16,load_in_4bit=True, token=True ),
74
  callbacks=[StreamingStdOutCallbackHandler()],
75
  model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
76
  # llm = Replicate(
 
70
  load_dotenv()
71
  # Create llm
72
  llm = CTransformers(streaming=True,
73
+ model = AutoModelForCausalLM.from_pretrained("NousResearch/Nous-Hermes-llama-2-7b", device_map='auto',torch_dtype=torch.float16,load_in_4bit=True),
74
  callbacks=[StreamingStdOutCallbackHandler()],
75
  model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
76
  # llm = Replicate(