Spaces:
Sleeping
Sleeping
Commit
·
cc751de
1
Parent(s):
95841bc
Update: Change embeddings model to all-MiniLM-L6-v2 for better performance
Browse files
app.py
CHANGED
@@ -34,7 +34,7 @@ class SentenceTransformerEmbeddings(Embeddings):
34 |   return embedding.tolist()
35 |
36 |   embeddings = SentenceTransformerEmbeddings(
37 | -     model_name="sentence-transformers/all-…
38 |       device=device
39 |   )
40 |
@@ -53,8 +53,8 @@ if not (vectorstore_path / "index.faiss").exists():
53 |
54 |   # Split documents into chunks
55 |   text_splitter = RecursiveCharacterTextSplitter(
56 | -     chunk_size=…
57 | -     chunk_overlap=…
58 |       length_function=len,
59 |   )
60 |   texts = text_splitter.split_documents(documents)
34 |   return embedding.tolist()
35 |
36 |   embeddings = SentenceTransformerEmbeddings(
37 | +     model_name="sentence-transformers/all-MiniLM-L6-v2",
38 |       device=device
39 |   )
40 |
53 |
54 |   # Split documents into chunks
55 |   text_splitter = RecursiveCharacterTextSplitter(
56 | +     chunk_size=2000,
57 | +     chunk_overlap=100,
58 |       length_function=len,
59 |   )
60 |   texts = text_splitter.split_documents(documents)