Saif Rehman Nasir
committed on
Commit
•
f81204d
1
Parent(s):
8af0ee8
Revert to llama3 8b
Browse files
rag.py
CHANGED
@@ -22,7 +22,8 @@ NEO4J_PASSWORD = os.getenv("NEO4J_PASSWORD")
|
|
22 |
vector_index = os.getenv("VECTOR_INDEX")
|
23 |
|
24 |
chat_llm = HuggingFaceEndpoint(
|
25 |
-
repo_id="HuggingFaceH4/zephyr-7b-beta",
|
|
|
26 |
task="text-generation",
|
27 |
max_new_tokens=4096,
|
28 |
do_sample=False,
|
@@ -218,7 +219,7 @@ def global_retriever(query: str, level: int, response_type: str):
|
|
218 |
|
219 |
where 1, 2, 3, 7, 34, 46, and 64 represent the id (not the index) of the relevant data record.
|
220 |
|
221 |
-
Do not include information where the supporting evidence for it is not provided.
|
222 |
|
223 |
|
224 |
---Target response length and format---
|
|
|
22 |
vector_index = os.getenv("VECTOR_INDEX")
|
23 |
|
24 |
chat_llm = HuggingFaceEndpoint(
|
25 |
+
# repo_id="HuggingFaceH4/zephyr-7b-beta",
|
26 |
+
repo_id="meta-llama/Meta-Llama-3-8B-Instruct",
|
27 |
task="text-generation",
|
28 |
max_new_tokens=4096,
|
29 |
do_sample=False,
|
|
|
219 |
|
220 |
where 1, 2, 3, 7, 34, 46, and 64 represent the id (not the index) of the relevant data record.
|
221 |
|
222 |
+
Do not include information where the supporting evidence for it is not provided. Style the response in markdown.
|
223 |
|
224 |
|
225 |
---Target response length and format---
|