gauravgulati619 committed on
Commit
cc751de
·
1 Parent(s): 95841bc

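Update: Change embeddings model from all-mpnet-base-v2 to all-MiniLM-L6-v2 for better performance; also change text splitter chunk_size from 1000 to 2000 and chunk_overlap from 200 to 100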

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -34,7 +34,7 @@ class SentenceTransformerEmbeddings(Embeddings):
34
  return embedding.tolist()
35
 
36
  embeddings = SentenceTransformerEmbeddings(
37
- model_name="sentence-transformers/all-mpnet-base-v2",
38
  device=device
39
  )
40
 
@@ -53,8 +53,8 @@ if not (vectorstore_path / "index.faiss").exists():
53
 
54
  # Split documents into chunks
55
  text_splitter = RecursiveCharacterTextSplitter(
56
- chunk_size=1000,
57
- chunk_overlap=200,
58
  length_function=len,
59
  )
60
  texts = text_splitter.split_documents(documents)
 
34
  return embedding.tolist()
35
 
36
  embeddings = SentenceTransformerEmbeddings(
37
+ model_name="sentence-transformers/all-MiniLM-L6-v2",
38
  device=device
39
  )
40
 
 
53
 
54
  # Split documents into chunks
55
  text_splitter = RecursiveCharacterTextSplitter(
56
+ chunk_size=2000,
57
+ chunk_overlap=100,
58
  length_function=len,
59
  )
60
  texts = text_splitter.split_documents(documents)