# Python dependencies, one requirement specifier per line
# (the layout `pip install -r <this file>` expects).
# Only playwright (compatible-release ~=1.30) and googletrans (exact
# pre-release 3.1.0a0) carry version constraints; everything else is unpinned.
openai
llama-index
langchain
chromadb
torch
transformers
gradio
scikit-learn
scipy
matplotlib
openpyxl
mosestokenizer
indic-nlp-library
sentence_transformers
playwright~=1.30
faiss-cpu
tiktoken
googletrans==3.1.0a0
BeautifulSoup4
pypdf
PyPDF2
html2text