Multi-OpenSource / config.py
Atreyu4EVR's picture
Update config.py
e747f55 verified
raw
history blame
312 Bytes
# --- Embedding model ---
# Identifier of the model used to embed text.
# NOTE(review): the model card for this checkpoint reportedly truncates input
# beyond 256 word pieces — confirm CHUNK_SIZE below is compatible with it.
EMBEDDING_MODEL_NAME: str = "sentence-transformers/all-MiniLM-L6-v2"

# --- Document processing ---
# Chunking and batching parameters. Units are not stated in this file
# (presumably characters or tokens for the chunk values) — TODO confirm
# against the code that consumes them.
CHUNK_SIZE: int = 8_192
CHUNK_OVERLAP: int = 200
BATCH_SIZE: int = 1_000

# --- Retrieval ---
# Presumably the number of results fetched per query — verify against caller.
RETRIEVER_K: int = 3

# --- File paths ---
# Relative paths; what they resolve against depends on the consuming code.
JSON_FILE_PATH: str = "index_training.json"
VECTORSTORE_PATH: str = "vectorstore"