bstraehle committed on
Commit
6514d80
·
1 Parent(s): c8efcca

Update rag.py

Browse files
Files changed (1) hide show
  1. rag.py +4 -4
rag.py CHANGED
@@ -22,8 +22,8 @@ WEB_URL = "https://openai.com/research/gpt-4"
22
  YOUTUBE_URL_1 = "https://www.youtube.com/watch?v=--khbXchTeE"
23
  YOUTUBE_URL_2 = "https://www.youtube.com/watch?v=hdhZwyf24mE"
24
 
25
- YOUTUBE_DIR = "/data/youtube"
26
- CHROMA_DIR = "/data/chroma"
27
 
28
  MONGODB_ATLAS_CLUSTER_URI = os.environ["MONGODB_ATLAS_CLUSTER_URI"]
29
  MONGODB_DB_NAME = "langchain_db"
@@ -80,13 +80,13 @@ def rag_batch(config):
80
  document_storage_mongodb(chunks)
81
 
82
  def document_retrieval_chroma():
83
- return Chroma(embedding_function = OpenAIEmbeddings(),
84
  persist_directory = CHROMA_DIR)
85
 
86
  def document_retrieval_mongodb():
87
  return MongoDBAtlasVectorSearch.from_connection_string(MONGODB_ATLAS_CLUSTER_URI,
88
  MONGODB_DB_NAME + "." + MONGODB_COLLECTION_NAME,
89
- OpenAIEmbeddings(),
90
  index_name = MONGODB_INDEX_NAME)
91
 
92
  def get_llm(config, openai_api_key):
 
22
  YOUTUBE_URL_1 = "https://www.youtube.com/watch?v=--khbXchTeE"
23
  YOUTUBE_URL_2 = "https://www.youtube.com/watch?v=hdhZwyf24mE"
24
 
25
+ YOUTUBE_DIR = "/data/yt"
26
+ CHROMA_DIR = "/data/db"
27
 
28
  MONGODB_ATLAS_CLUSTER_URI = os.environ["MONGODB_ATLAS_CLUSTER_URI"]
29
  MONGODB_DB_NAME = "langchain_db"
 
80
  document_storage_mongodb(chunks)
81
 
82
  def document_retrieval_chroma():
83
+ return Chroma(embedding_function = OpenAIEmbeddings(disallowed_special = ()),
84
  persist_directory = CHROMA_DIR)
85
 
86
  def document_retrieval_mongodb():
87
  return MongoDBAtlasVectorSearch.from_connection_string(MONGODB_ATLAS_CLUSTER_URI,
88
  MONGODB_DB_NAME + "." + MONGODB_COLLECTION_NAME,
89
+ OpenAIEmbeddings(disallowed_special = ()),
90
  index_name = MONGODB_INDEX_NAME)
91
 
92
  def get_llm(config, openai_api_key):