Spaces:

RJuro
/

rag-lex

Sleeping

App Files Files Community

RJuro commited on Apr 3, 2024

Commit

3026887

1 Parent(s): 5972ea6

-

Browse files

Files changed (33) hide show

.gitattributes +1 -1
Dockerfile +21 -0
_README.md +79 -0
app/.env +1 -0
app/__init__.py +0 -0
app/__pycache__/__init__.cpython-311.pyc +0 -0
app/__pycache__/server.cpython-311.pyc +0 -0
app/server.py +39 -0
app/streamlit_test.py +36 -0
app/test_server.ipynb +95 -0
packages/.DS_Store +0 -0
packages/README.md +0 -0
packages/rag-chroma/.DS_Store +0 -0
packages/rag-chroma/LICENSE +21 -0
packages/rag-chroma/README.md +68 -0
packages/rag-chroma/poetry.lock +0 -0
packages/rag-chroma/pyproject.toml +35 -0
packages/rag-chroma/rag_chroma.ipynb +51 -0
packages/rag-chroma/rag_chroma/.DS_Store +0 -0
packages/rag-chroma/rag_chroma/.env +1 -0
packages/rag-chroma/rag_chroma/__init__.py +3 -0
packages/rag-chroma/rag_chroma/__pycache__/__init__.cpython-311.pyc +0 -0
packages/rag-chroma/rag_chroma/__pycache__/chain.cpython-311.pyc +0 -0
packages/rag-chroma/rag_chroma/chain.py +92 -0
packages/rag-chroma/rag_chroma/load_files_chroma.ipynb +164 -0
packages/rag-chroma/rag_chroma/test.ipynb +122 -0
packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/data_level0.bin +3 -0
packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/header.bin +3 -0
packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/length.bin +3 -0
packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/link_lists.bin +0 -0
packages/rag-chroma/rag_chroma/vecdb/chroma.sqlite3 +3 -0
packages/rag-chroma/tests/__init__.py +0 -0
pyproject.toml +25 -0

.gitattributes CHANGED Viewed

@@ -33,4 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
-*.sqlite3 filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.sqlite3 filter=lfs diff=lfs merge=lfs -text

Dockerfile ADDED Viewed

	@@ -0,0 +1,21 @@

+# Image for the LangServe app; dependencies are installed with Poetry.
+FROM python:3.11-slim
+RUN pip install poetry==1.6.1
+# Install into the image's interpreter instead of a Poetry-managed virtualenv.
+RUN poetry config virtualenvs.create false
+WORKDIR /code
+COPY ./pyproject.toml ./README.md ./poetry.lock* ./
+COPY ./packages ./packages
+# First pass installs dependencies only (--no-root), before ./app is copied,
+# so this layer does not depend on the application sources.
+RUN poetry install  --no-interaction --no-ansi --no-root
+COPY ./app ./app
+RUN poetry install --no-interaction --no-ansi
+# EXPOSE is documentation only; keep it in sync with the port uvicorn binds below.
+EXPOSE 7860
+CMD ["uvicorn", "app.server:app", "--host", "0.0.0.0", "--port", "7860"]

_README.md ADDED Viewed

	@@ -0,0 +1,79 @@

+# my-app
+## Installation
+Install the LangChain CLI if you haven't yet
+```bash
+pip install -U langchain-cli
+```
+## Adding packages
+```bash
+# adding packages from
+# https://github.com/langchain-ai/langchain/tree/master/templates
+langchain app add $PROJECT_NAME
+# adding custom GitHub repo packages
+langchain app add --repo $OWNER/$REPO
+# or with whole git string (supports other git providers):
+# langchain app add git+https://github.com/hwchase17/chain-of-verification
+# with a custom api mount point (defaults to `/{package_name}`)
+langchain app add $PROJECT_NAME --api_path=/my/custom/path/rag
+```
+Note: you remove packages by their api path
+```bash
+langchain app remove my/custom/path/rag
+```
+## Setup LangSmith (Optional)
+LangSmith will help us trace, monitor and debug LangChain applications.
+LangSmith is currently in private beta, you can sign up [here](https://smith.langchain.com/).
+If you don't have access, you can skip this section
+```shell
+export LANGCHAIN_TRACING_V2=true
+export LANGCHAIN_API_KEY=<your-api-key>
+export LANGCHAIN_PROJECT=<your-project>  # if not specified, defaults to "default"
+```
+## Launch LangServe
+```bash
+langchain serve
+```
+## Running in Docker
+This project folder includes a Dockerfile that allows you to easily build and host your LangServe app.
+### Building the Image
+To build the image, simply run:
+```shell
+docker build . -t my-langserve-app
+```
+If you tag your image with something other than `my-langserve-app`,
+note it for use in the next step.
+### Running the Image Locally
+To run the image, you'll need to include any environment variables
+necessary for your application.
+In the below example, we inject the `OPENAI_API_KEY` environment
+variable with the value set in my local environment
+(`$OPENAI_API_KEY`)
+We also publish port 7860 (the port uvicorn listens on in the Dockerfile) with the `-p 7860:7860` option.
+```shell
+docker run -e OPENAI_API_KEY=$OPENAI_API_KEY -p 7860:7860 my-langserve-app
+```

app/.env ADDED Viewed

	@@ -0,0 +1 @@


1	+ BACK_API_KEY=a6ab9026-0ac8-4c26-9c30-6d9837fc9013

app/__init__.py ADDED Viewed

File without changes

app/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (214 Bytes). View file

app/__pycache__/server.cpython-311.pyc ADDED Viewed

Binary file (1.8 kB). View file

app/server.py ADDED Viewed

	@@ -0,0 +1,39 @@

+from fastapi import FastAPI, Depends, HTTPException, status, Request #added security
+from fastapi.responses import RedirectResponse
+from langserve import add_routes
+from rag_chroma import chain as rag_chroma_chain
+from dotenv import load_dotenv
+load_dotenv()
+# load api key from .env file
+import os
+app = FastAPI()
+API_KEY = os.getenv("BACK_API_KEY")
+async def get_api_key(request: Request):
+    """Authorize a request by its ``x-api-key`` header.
+
+    Intended for use as a FastAPI dependency. Returns ``None`` when the
+    header matches the module-level ``API_KEY``.
+
+    Raises:
+        HTTPException: 401 when the header is missing or wrong, or when no
+            ``API_KEY`` is configured on the server.
+    """
+    # Local import keeps this block self-contained.
+    import secrets
+
+    api_key = request.headers.get('x-api-key')
+    # Fail closed: if BACK_API_KEY is unset, API_KEY is None, and a plain
+    # `!=` check would accept every request that omits the header
+    # (None == None).
+    authorized = (
+        bool(API_KEY)
+        and api_key is not None
+        # Constant-time comparison avoids leaking the key through timing.
+        and secrets.compare_digest(api_key.encode(), API_KEY.encode())
+    )
+    if not authorized:
+        raise HTTPException(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            detail="Invalid API Key"
+        )
+# Redirect requests for the root path to `/docs`.
+@app.get("/")
+async def redirect_root_to_docs():
+    return RedirectResponse("/docs")
+# Edit this to add the chain you want to add
+# The API-key check is passed as a route dependency for the chain mounted at
+# /rag-chroma.
+add_routes(app, rag_chroma_chain,
+           path="/rag-chroma",
+           #playground_type='chat',
+           dependencies=[Depends(get_api_key)]
+           )
+# When this file is executed directly, serve the app with uvicorn on port 8000.
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000)

app/streamlit_test.py ADDED Viewed

	@@ -0,0 +1,36 @@

+import streamlit as st
+import os
+from langserve.client import RemoteRunnable
+from httpx import HTTPStatusError
+from dotenv import load_dotenv
+# Load the environment variable
+load_dotenv()
+# Get the API key from environment variables
+token = os.environ.get("BACK_API_KEY")
+# Initialize the RemoteRunnable with your API endpoint and headers
+rag_app = RemoteRunnable("http://127.0.0.1:8000/rag-chroma/", headers={"x-api-key": f"{token}"})
+# Streamlit app
+def main():
+    """Render a single-question form and display the remote chain's answer."""
+    st.title("Question Answering App")
+    user_question = st.text_input("Type your question here:")
+    # Nothing to do until the user presses the button.
+    if not st.button("Get Answer"):
+        return
+    try:
+        # Forward the question through the RemoteRunnable and show the reply.
+        reply = rag_app.invoke(user_question)
+        st.success(reply)
+    except HTTPStatusError as err:
+        # Surface HTTP failures from the API call in the UI.
+        st.error(f"Failed to get an answer. Error: {err}")
+if __name__ == "__main__":
+    main()

app/test_server.ipynb ADDED Viewed

	@@ -0,0 +1,95 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "True"
+      ]
+     },
+     "execution_count": 1,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import streamlit as st\n",
+    "import os\n",
+    "from langserve.client import RemoteRunnable\n",
+    "from httpx import HTTPStatusError\n",
+    "from dotenv import load_dotenv\n",
+    "load_dotenv()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "token = os.environ.get(\"BACK_API_KEY\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "rag_app = RemoteRunnable(\"http://127.0.0.1:8000/rag-chroma/\", headers={\"x-api-key\": f\"{token}\"})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'\\nAnswer: The speakers do not provide specific details about GPT-5. They mention that it is not yet developed and that there are challenges and bottlenecks to overcome before its creation. They also discuss that it will require a bigger computer and a new secret, and that it is a result of multiplying 200 medium-sized things together into one giant thing. They also mention that there is a lot of distributed constant innovation happening on the technical side.'"
+      ]
+     },
+     "execution_count": 5,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "rag_app.invoke(\"What do they say about GPT-5?\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "langcorn",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

packages/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

packages/README.md ADDED Viewed

File without changes

packages/rag-chroma/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

packages/rag-chroma/LICENSE ADDED Viewed

	@@ -0,0 +1,21 @@

+MIT License
+Copyright (c) 2023 LangChain, Inc.
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

packages/rag-chroma/README.md ADDED Viewed

	@@ -0,0 +1,68 @@

+# rag-chroma
+This template performs RAG using Chroma and OpenAI.
+The vectorstore is created in `chain.py` and by default indexes a [popular blog post on Agents](https://lilianweng.github.io/posts/2023-06-23-agent/) for question-answering.
+## Environment Setup
+Set the `OPENAI_API_KEY` environment variable to access the OpenAI models.
+## Usage
+To use this package, you should first have the LangChain CLI installed:
+```shell
+pip install -U langchain-cli
+```
+To create a new LangChain project and install this as the only package, you can do:
+```shell
+langchain app new my-app --package rag-chroma
+```
+If you want to add this to an existing project, you can just run:
+```shell
+langchain app add rag-chroma
+```
+And add the following code to your `server.py` file:
+```python
+from rag_chroma import chain as rag_chroma_chain
+add_routes(app, rag_chroma_chain, path="/rag-chroma")
+```
+(Optional) Let's now configure LangSmith.
+LangSmith will help us trace, monitor and debug LangChain applications.
+LangSmith is currently in private beta, you can sign up [here](https://smith.langchain.com/).
+If you don't have access, you can skip this section
+```shell
+export LANGCHAIN_TRACING_V2=true
+export LANGCHAIN_API_KEY=<your-api-key>
+export LANGCHAIN_PROJECT=<your-project>  # if not specified, defaults to "default"
+```
+If you are inside this directory, then you can spin up a LangServe instance directly by:
+```shell
+langchain serve
+```
+This will start the FastAPI app with a server running locally at
+[http://localhost:8000](http://localhost:8000)
+We can see all templates at [http://127.0.0.1:8000/docs](http://127.0.0.1:8000/docs)
+We can access the playground at [http://127.0.0.1:8000/rag-chroma/playground](http://127.0.0.1:8000/rag-chroma/playground)
+We can access the template from code with:
+```python
+from langserve.client import RemoteRunnable
+runnable = RemoteRunnable("http://localhost:8000/rag-chroma")
+```

packages/rag-chroma/poetry.lock ADDED Viewed

The diff for this file is too large to render. See raw diff

packages/rag-chroma/pyproject.toml ADDED Viewed

	@@ -0,0 +1,35 @@

+[tool.poetry]
+name = "rag-chroma"
+version = "0.1.0"
+description = "RAG using Chroma"
+authors = [
+    "Erick Friis <erick@langchain.dev>",
+]
+readme = "README.md"
+[tool.poetry.dependencies]
+python = ">=3.8.1,<4.0"
+langchain = "^0.1"
+openai = "<2"
+tiktoken = ">=0.5.1"
+chromadb = ">=0.4.14"
+langchain-text-splitters = ">=0.0.1,<0.1"
+[tool.poetry.group.dev.dependencies]
+langchain-cli = ">=0.0.21"
+[tool.langserve]
+export_module = "rag_chroma"
+export_attr = "chain"
+[tool.templates-hub]
+use-case = "rag"
+author = "LangChain"
+integrations = ["OpenAI", "Chroma"]
+tags = ["vectordbs"]
+[build-system]
+requires = [
+    "poetry-core",
+]
+build-backend = "poetry.core.masonry.api"

packages/rag-chroma/rag_chroma.ipynb ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "681a5d1e",
+   "metadata": {},
+   "source": [
+    "## Run Template\n",
+    "\n",
+    "In `server.py`, set -\n",
+    "```\n",
+    "add_routes(app, chain_rag_conv, path=\"/rag-chroma\")\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "d774be2a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from langserve.client import RemoteRunnable\n",
+    "\n",
+    "rag_app = RemoteRunnable(\"http://localhost:8001/rag-chroma\")\n",
+    "rag_app.invoke(\"Where id Harrison work\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

packages/rag-chroma/rag_chroma/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

packages/rag-chroma/rag_chroma/.env ADDED Viewed

	@@ -0,0 +1 @@


1	+ TOGETHER_API_KEY=7091f9fb4f9db7e39170ca113c4bc9ad2405b1c8fec3772098a9f06c8c82e103

packages/rag-chroma/rag_chroma/__init__.py ADDED Viewed

	@@ -0,0 +1,3 @@


1	+ from rag_chroma.chain import chain
2	+
3	+ __all__ = ["chain"]

packages/rag-chroma/rag_chroma/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (282 Bytes). View file

packages/rag-chroma/rag_chroma/__pycache__/chain.cpython-311.pyc ADDED Viewed

Binary file (2.38 kB). View file

packages/rag-chroma/rag_chroma/chain.py ADDED Viewed

	@@ -0,0 +1,92 @@

+#from langchain_community.chat_models import ChatOpenAI
+from langchain_together.embeddings import TogetherEmbeddings
+from langchain_together import Together
+from langchain_community.vectorstores import Chroma
+from langchain_core.output_parsers import StrOutputParser
+from langchain_core.prompts import ChatPromptTemplate
+from langchain_core.pydantic_v1 import BaseModel
+from langchain_core.runnables import RunnableParallel, RunnablePassthrough
+import os
+from dotenv import load_dotenv
+load_dotenv()
+together_api_key = os.getenv("TOGETHER_API_KEY")
+embeddings = TogetherEmbeddings(model="togethercomputer/m2-bert-80M-2k-retrieval")
+# Example for document loading (from url), splitting, and creating vectorstore
+"""
+# Load
+from langchain_community.document_loaders import WebBaseLoader
+loader = WebBaseLoader("https://lilianweng.github.io/posts/2023-06-23-agent/")
+data = loader.load()
+# Split
+from langchain_text_splitters import RecursiveCharacterTextSplitter
+text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
+all_splits = text_splitter.split_documents(data)
+# Add to vectorDB
+vectorstore = Chroma.from_documents(documents=all_splits,
+                                    collection_name="rag-chroma",
+                                    embedding=OpenAIEmbeddings(),
+                                    )
+retriever = vectorstore.as_retriever()
+"""
+""" # Embed a single document as a test
+vectorstore = Chroma.from_texts(
+    ["harrison worked at kensho"],
+    collection_name="rag-chroma",
+    embedding=OpenAIEmbeddings(),
+)
+retriever = vectorstore.as_retriever() """
+# Load up vector-store
+# NOTE(review): persist_directory is a relative path, so it resolves against
+# the process working directory — presumably the repository root; confirm.
+vectorstore = Chroma(persist_directory="packages/rag-chroma/rag_chroma/vecdb",
+                     collection_name="rag-chroma",
+                     embedding_function = embeddings)
+# Retriever uses search_type="mmr" with k=7 passed as a search kwarg.
+retriever = vectorstore.as_retriever(search_type="mmr", search_kwargs={'k': 7})
+# RAG prompt
+# The template has two placeholders, {context} and {question}, which the
+# chain below fills in.
+template = """Answer the question based only on the following context:
+{context}
+Question: {question}
+"""
+prompt = ChatPromptTemplate.from_template(template)
+# LLM
+model  = Together(
+    #model="mistralai/Mistral-7B-Instruct-v0.2",
+    model="mistralai/Mixtral-8x7B-Instruct-v0.1",
+    temperature=0.7,
+    top_k=50,
+    top_p=0.7,
+    repetition_penalty=1,
+    together_api_key=together_api_key
+)
+# RAG chain
+# The chain input is given to the retriever (its output becomes "context") and
+# is also passed through unchanged as "question"; the resulting mapping feeds
+# the prompt, then the model, then the string output parser.
+chain = (
+    RunnableParallel({"context": retriever, "question": RunnablePassthrough()})
+    | prompt
+    | model
+    | StrOutputParser()
+)
+# Add typing for input
+# Question declares a single `__root__: str` field and is registered as the
+# chain's input type.
+class Question(BaseModel):
+    __root__: str
+chain = chain.with_types(input_type=Question)

packages/rag-chroma/rag_chroma/load_files_chroma.ipynb ADDED Viewed

	@@ -0,0 +1,164 @@

+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Create vecdb - notebook"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from langchain_community.vectorstores import Chroma\n",
+    "from langchain_together.embeddings import TogetherEmbeddings\n",
+    "\n",
+    "\n",
+    "import os\n",
+    "from dotenv import load_dotenv\n",
+    "load_dotenv()\n",
+    "together_api_key = os.getenv(\"TOGETHER_API_KEY\")\n",
+    "\n",
+    "embeddings = TogetherEmbeddings(model=\"togethercomputer/m2-bert-80M-2k-retrieval\")\n",
+    "\n",
+    "# Load\n",
+    "from langchain_community.document_loaders import WebBaseLoader\n",
+    "loader = WebBaseLoader(\"https://lexfridman.com/sam-altman-2-transcript/\")\n",
+    "data = loader.load()\n",
+    "\n",
+    "# Split\n",
+    "from langchain_text_splitters import RecursiveCharacterTextSplitter\n",
+    "text_splitter = RecursiveCharacterTextSplitter(chunk_size=2000, chunk_overlap=250)\n",
+    "all_splits = text_splitter.split_documents(data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Add to vectorDB\n",
+    "vectorstore = Chroma.from_documents(persist_directory=\"vecdb_test\",\n",
+    "                                    documents=all_splits, \n",
+    "                                    collection_name=\"rag-chroma\",\n",
+    "                                    embedding=embeddings,\n",
+    "                                    )\n",
+    "retriever = vectorstore.as_retriever()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Huggingface transformers embeddings\n",
+    "\n",
+    "more complicated but \"free\" way of creating embeddings\n",
+    "you will need to install\n",
+    "```\n",
+    "sentence-transformers\n",
+    "einops\n",
+    "opt_einsum\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from langchain_community.embeddings import HuggingFaceEmbeddings"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/opt/miniconda3/envs/langcorn/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
+      "  from .autonotebook import tqdm as notebook_tqdm\n",
+      "No sentence-transformers model found with name togethercomputer/m2-bert-80M-2k-retrieval. Creating a new one with MEAN pooling.\n",
+      "You are using a model of type m2_bert to instantiate a model of type bert. This is not supported for all configurations of models and can yield errors.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "-- Bidirectional: True\n",
+      "-- Using Long Conv Residual: True\n",
+      "-- Hyena w: 10\n",
+      "-- Hyena w mod: 1\n",
+      "-- Hyena filter order: 128\n",
+      "-- Hyena filter dropout: 0.2\n",
+      "-- Hyena filter wd: 0.1\n",
+      "-- Hyena filter emb dim: 5\n",
+      "-- Hyena filter lr: 0.001\n",
+      "-- Hyena filter lr pos emb: 1e-05\n"
+     ]
+    }
+   ],
+   "source": [
+    "model_name = \"togethercomputer/m2-bert-80M-2k-retrieval\"\n",
+    "model_kwargs = {'device': 'cpu', 'trust_remote_code': True}\n",
+    "encode_kwargs = {'normalize_embeddings': False}\n",
+    "hf = HuggingFaceEmbeddings(\n",
+    "    model_name=model_name,\n",
+    "    model_kwargs=model_kwargs,\n",
+    "    encode_kwargs=encode_kwargs\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Add to vectorDB\n",
+    "vectorstore = Chroma.from_documents(persist_directory=\"vecdb_hf_test\",\n",
+    "                                    documents=all_splits, \n",
+    "                                    collection_name=\"rag-chroma\",\n",
+    "                                    embedding=hf,\n",
+    "                                    )\n",
+    "retriever = vectorstore.as_retriever()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "langcorn",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

packages/rag-chroma/rag_chroma/test.ipynb ADDED Viewed

	@@ -0,0 +1,122 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "#from langchain_community.chat_models import ChatOpenAI\n",
+    "from langchain_together.embeddings import TogetherEmbeddings\n",
+    "from langchain_together import Together\n",
+    "from langchain_community.vectorstores import Chroma\n",
+    "from langchain_core.output_parsers import StrOutputParser\n",
+    "from langchain_core.prompts import ChatPromptTemplate\n",
+    "from langchain_core.pydantic_v1 import BaseModel\n",
+    "from langchain_core.runnables import RunnableParallel, RunnablePassthrough\n",
+    "\n",
+    "import os\n",
+    "from dotenv import load_dotenv\n",
+    "load_dotenv()\n",
+    "together_api_key = os.getenv(\"TOGETHER_API_KEY\")\n",
+    "\n",
+    "\n",
+    "embeddings = TogetherEmbeddings(model=\"togethercomputer/m2-bert-80M-2k-retrieval\")\n",
+    "\n",
+    "\n",
+    "\n",
+    "# Example for document loading (from url), splitting, and creating vectorstore\n",
+    "\n",
+    "\"\"\" \n",
+    "# Load\n",
+    "from langchain_community.document_loaders import WebBaseLoader\n",
+    "loader = WebBaseLoader(\"https://lilianweng.github.io/posts/2023-06-23-agent/\")\n",
+    "data = loader.load()\n",
+    "\n",
+    "# Split\n",
+    "from langchain_text_splitters import RecursiveCharacterTextSplitter\n",
+    "text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)\n",
+    "all_splits = text_splitter.split_documents(data)\n",
+    "\n",
+    "# Add to vectorDB\n",
+    "vectorstore = Chroma.from_documents(documents=all_splits, \n",
+    "                                    collection_name=\"rag-chroma\",\n",
+    "                                    embedding=OpenAIEmbeddings(),\n",
+    "                                    )\n",
+    "retriever = vectorstore.as_retriever()\n",
+    "\"\"\"\n",
+    "\n",
+    "\"\"\" # Embed a single document as a test\n",
+    "vectorstore = Chroma.from_texts(\n",
+    "    [\"harrison worked at kensho\"],\n",
+    "    collection_name=\"rag-chroma\",\n",
+    "    embedding=OpenAIEmbeddings(),\n",
+    ")\n",
+    "retriever = vectorstore.as_retriever() \"\"\"\n",
+    "\n",
+    "\n",
+    "# Load up vector-store\n",
+    "vectorstore = Chroma(persist_directory=\"vecdb\",\n",
+    "                     collection_name=\"rag-chroma\",\n",
+    "                     embedding_function = embeddings)\n",
+    "\n",
+    "\n",
+    "retriever = vectorstore.as_retriever(search_type=\"mmr\", search_kwargs={'k': 7})\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[Document(page_content='(00:35:28) \\nI remember when I started first watching Sora videos and I would see a person walk in front of something for a few seconds and occlude it and then walk away and the same thing was still there. I was like, “Oh, this is pretty good.” Or there’s examples where the underlying physics looks so well represented over a lot of steps in a sequence, it’s like, “|Oh, this is quite impressive.” But fundamentally, these models are just getting better and that will keep happening. If you look at the trajectory from DALL·E 1 to 2 to 3 to Sora, there are a lot of people that were dunked on each version saying it can’t do this, it can’t do that and look at it now.\\n\\n\\nLex Fridman\\n(00:36:04) \\nWell, the thing you just mentioned is the occlusions is basically modeling the physics of the three-dimensional physics of the world sufficiently well to capture those kinds of things.\\n\\n\\nSam Altman\\n(00:36:17) \\nWell…\\n\\n\\nLex Fridman\\n(00:36:18) \\nOr yeah, maybe you can tell me, in order to deal with occlusions, what does the world model need to?\\n\\n\\nSam Altman\\n(00:36:24) \\nYeah. So what I would say is it’s doing something to deal with occlusions really well. What I represent that it has a great underlying 3D model of the world, it’s a little bit more of a stretch.\\n\\n\\nLex Fridman\\n(00:36:33) \\nBut can you get there through just these kinds of two-dimensional training data approaches?\\n\\n\\nSam Altman\\n(00:36:39) \\nIt looks like this approach is going to go surprisingly far. I don’t want to speculate too much about what limits it will surmount and which it won’t, but…\\n\\n\\nLex Fridman\\n(00:36:46) \\nWhat are some interesting limitations of the system that you’ve seen? I mean there’s been some fun ones you’ve posted.\\n\\n\\nSam Altman\\n(00:36:52) \\nThere’s all kinds of fun. I mean, cat’s sprouting an extra limit at random points in a video. 
Pick what you want, but there’s still a lot of problem, there’s a lot of weaknesses.', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Sam Altman\\n(01:37:22) \\nMaybe. Maybe we need to go invent more technology and measure more things first.\\n\\n\\nLex Fridman\\n(01:37:28) \\nOh, I see. It just doesn’t have enough data. It’s just if it keeps-\\n\\n\\nSam Altman\\n(01:37:31) \\nI mean, maybe it says, “You want to know the answer to this question about physics, I need you to build this machine and make these five measurements, and tell me that.”\\n\\n\\nLex Fridman\\n(01:37:39) \\nYeah, “What the hell do you want from me? I need the machine first, and I’ll help you deal with the data from that machine.” Maybe it’ll help you build a machine.\\n\\n\\nSam Altman\\n(01:37:47) \\nMaybe. Maybe.\\n\\n\\nLex Fridman\\n(01:37:49) \\nAnd on the mathematical side, maybe prove some things. Are you interested in that side of things, too? The formalized exploration of ideas?\\n\\n\\nSam Altman\\n(01:37:56) \\nMm-hmm.\\n\\n\\nLex Fridman\\n(01:37:59) \\nWhoever builds AGI first gets a lot of power. Do you trust yourself with that much power?\\n\\n\\nSam Altman\\n(01:38:14) \\nLook, I’ll just be very honest with this answer. I was going to say, and I still believe this, that it is important that I nor any other one person have total control over OpenAI or over AGI. And I think you want a robust governance system. I can point out a whole bunch of things about all of our board drama from last year about how I didn’t fight it initially, and was just like, “Yeah. That’s the will of the board, even though I think it’s a really bad decision.” And then later, I clearly did fight it, and I can explain the nuance and why I think it was okay for me to fight it later. But as many people have observed, although the board had the legal ability to fire me, in practice, it didn’t quite work. 
And that is its own kind of governance failure.', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Sam Altman\\n(00:38:44) \\nYeah.\\n\\n\\nLex Fridman\\n(00:38:45) \\nAnd then the question is, how much data is there on the internet that could be used in this that is conducive to this kind of self supervised way if only we knew the details of the self supervised. Have you considered opening it up a little more details?\\n\\n\\nSam Altman\\n(00:39:02) \\nWe have. You mean for source specifically?\\n\\n\\nLex Fridman\\n(00:39:04) \\nSource specifically. Because it’s so interesting that can the same magic of LLMs now start moving towards visual data and what does that take to do that?\\n\\n\\nSam Altman\\n(00:39:18) \\nI mean it looks to me like yes, but we have more work to do.\\n\\n\\nLex Fridman\\n(00:39:22) \\nSure. What are the dangers? Why are you concerned about releasing the system? What are some possible dangers of this?\\n\\n\\nSam Altman\\n(00:39:29) \\nI mean frankly speaking, one thing we have to do before releasing the system is just get it to work at a level of efficiency that will deliver the scale people are going to want from this so that I don’t want to downplay that. And there’s still a ton ton of work to do there. But you can imagine issues with deepfakes, misinformation. We try to be a thoughtful company about what we put out into the world and it doesn’t take much thought to think about the ways this can go badly.\\n\\n\\nLex Fridman\\n(00:40:05) \\nThere’s a lot of tough questions here, you’re dealing in a very tough space. Do you think training AI should be or is fair use under copyright law?', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Sam Altman\\n(01:01:34) \\nI suspect that’s a reasonable intuition.\\n\\n\\nLex Fridman\\n(01:01:37) \\nInteresting. So it’s not possible once the GPT gets like GPT-7, would just instantaneously be able to see, “Here’s the proof of Fermat’s Theorem”?\\n\\n\\nSam Altman\\n(01:01:49) \\nIt seems to me like you want to be able to allocate more compute to harder problems. It seems to me that if you ask a system like that, “Prove Fermat’s Last Theorem,” versus, “What’s today’s date?,” unless it already knew and and had memorized the answer to the proof, assuming it’s got to go figure that out, seems like that will take more compute.\\n\\n\\nLex Fridman\\n(01:02:20) \\nBut can it look like basically an LLM talking to itself, that kind of thing?\\n\\n\\nSam Altman\\n(01:02:25) \\nMaybe. I mean, there’s a lot of things that you could imagine working. What the right or the best way to do that will be, we don’t know.\\n\\nQ*\\n\\nLex Fridman\\n(01:02:37) \\nThis does make me think of the mysterious lore behind Q*. What’s this mysterious Q* project? Is it also in the same nuclear facility?\\n\\n\\nSam Altman\\n(01:02:50) \\nThere is no nuclear facility.\\n\\n\\nLex Fridman\\n(01:02:52) \\nMm-hmm. That’s what a person with a nuclear facility always says.\\n\\n\\nSam Altman\\n(01:02:54) \\nI would love to have a secret nuclear facility. There isn’t one.\\n\\n\\nLex Fridman\\n(01:02:59) \\nAll right.\\n\\n\\nSam Altman\\n(01:03:00) \\nMaybe someday.\\n\\n\\nLex Fridman\\n(01:03:01) \\nSomeday? All right. One can dream.\\n\\n\\nSam Altman\\n(01:03:05) \\nOpenAI is not a good company at keeping secrets. It would be nice. 
We’re like, been plagued by a lot of leaks, and it would be nice if we were able to have something like that.\\n\\n\\nLex Fridman\\n(01:03:14) \\nCan you speak to what Q* is?\\n\\n\\nSam Altman\\n(01:03:16) \\nWe are not ready to talk about that.\\n\\n\\nLex Fridman\\n(01:03:17) \\nSee, but an answer like that means there’s something to talk about. It’s very mysterious, Sam.', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Sam Altman\\n(01:30:55) \\nChanges the skillset. How much it changes the predisposition, I’m not sure.\\n\\n\\nLex Fridman\\n(01:30:59) \\nWell, the same kind of puzzle solving, all that kind of stuff.\\n\\n\\nSam Altman\\n(01:30:59) \\nMaybe.\\n\\n\\nLex Fridman\\n(01:31:02) \\nProgramming is hard. It’s like how get that last 1% to close the gap? How hard is that?\\n\\n\\nSam Altman\\n(01:31:09) \\nYeah, I think with most other cases, the best practitioners of the craft will use multiple tools. And they’ll do some work in natural language, and when they need to go write C for something, they’ll do that.\\n\\n\\nLex Fridman\\n(01:31:20) \\nWill we see humanoid robots or humanoid robot brains from OpenAI at some point?\\n\\n\\nSam Altman\\n(01:31:28) \\nAt some point.\\n\\n\\nLex Fridman\\n(01:31:29) \\nHow important is embodied AI to you?\\n\\n\\nSam Altman\\n(01:31:32) \\nI think it’s depressing if we have AGI and the only way to get things done in the physical world is to make a human go do it. So I really hope that as part of this transition, as this phase change, we also get humanoid robots or some sort of physical world robots.\\n\\n\\nLex Fridman\\n(01:31:51) \\nI mean, OpenAI has some history and quite a bit of history working in robotics, but it hasn’t quite done in terms of ethics-\\n\\n\\nSam Altman\\n(01:31:59) \\nWe’re a small company. We have to really focus. And also, robots were hard for the wrong reason at the time, but we will return to robots in some way at some point.\\n\\n\\nLex Fridman\\n(01:32:11) \\nThat sounds both inspiring and menacing.\\n\\n\\nSam Altman\\n(01:32:14) \\nWhy?\\n\\n\\nLex Fridman\\n(01:32:15) \\nBecause immediately, we will return to robots. It’s like in Terminator-\\n\\n\\nSam Altman\\n(01:32:20) \\nWe will return to work on developing robots. We will not turn ourselves into robots, of course.\\n\\nAGI\\n\\nLex Fridman\\n(01:32:24) \\nYeah. 
When do you think we, you and we as humanity will build AGI?', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Lex Fridman\\n(00:50:01) \\nHow does the context window of going from 8K to 128K tokens compare from GPT-4 to GPT-4 Turbo?\\n\\n\\nSam Altman\\n(00:50:13) \\nMost people don’t need all the way to 128 most of the time. Although if we dream into the distant future, we’ll have way distant future, we’ll have context length of several billion. You will feed in all of your information, all of your history over time and it’ll just get to know you better and better and that’ll be great. For now, the way people use these models, they’re not doing that. People sometimes post in a paper or a significant fraction of a code repository, whatever, but most usage of the models is not using the long context most of the time.\\n\\n\\nLex Fridman\\n(00:50:50) \\nI like that this is your “I have a dream” speech. One day you’ll be judged by the full context of your character or of your whole lifetime. That’s interesting. So that’s part of the expansion that you’re hoping for, is a greater and greater context.\\n\\n\\nSam Altman\\n(00:51:06) \\nI saw this internet clip once, I’m going to get the numbers wrong, but it was like Bill Gates talking about the amount of memory on some early computer, maybe it was 64K, maybe 640K, something like that. Most of it was used for the screen buffer. He just couldn’t seem genuine. He just couldn’t imagine that the world would eventually need gigabytes of memory in a computer or terabytes of memory in a computer. And you always do, or you always do just need to follow the exponential of technology and we will find out how to use better technology. So I can’t really imagine what it’s like right now for context links to go out to the billion someday. And they might not literally go there, but effectively it’ll feel like that. 
But I know we’ll use it and really not want to go back once we have it.\\n\\n\\nLex Fridman\\n(00:51:56) \\nYeah, even saying billions 10 years from now might seem dumb because it’ll be trillions upon trillions.\\n\\n\\nSam Altman\\n(00:52:04) \\nSure.', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'}),\n",
+       " Document(page_content='Lex Fridman\\n(01:12:57) \\nOh, like we want to stop this from-\\n\\n\\nSam Altman\\n(01:13:00) \\nMaybe.\\n\\n\\nLex Fridman\\n(01:13:03) \\nHow do you decrease the theatrical nature of it? I’m already starting to hear rumblings, because I do talk to people on both sides of the political spectrum, hear rumblings where it’s going to be politicized. AI is going to be politicized, which really worries me, because then it’s like maybe the right is against AI and the left is for AI because it’s going to help the people, or whatever the narrative and the formulation is, that really worries me. And then the theatrical nature of it can be leveraged fully. How do you fight that?\\n\\n\\nSam Altman\\n(01:13:38) \\nI think it will get caught up in left versus right wars. I don’t know exactly what that’s going to look like, but I think that’s just what happens with anything of consequence, unfortunately. What I meant more about theatrical risks is AI’s going to have, I believe, tremendously more good consequences than bad ones, but it is going to have bad ones, and there’ll be some bad ones that are bad but not theatrical. A lot more people have died of air pollution than nuclear reactors, for example. But most people worry more about living next to a nuclear reactor than a coal plant. But something about the way we’re wired is that although there’s many different kinds of risks we have to confront, the ones that make a good climax scene of a movie carry much more weight with us than the ones that are very bad over a long period of time but on a slow burn.\\n\\n\\nLex Fridman\\n(01:14:36) \\nWell, that’s why truth matters, and hopefully AI can help us see the truth of things, to have balance, to understand what are the actual risks, what are the actual dangers of things in the world. 
What are the pros and cons of the competition in the space and competing with Google, Meta, xAI, and others?', metadata={'language': 'en-US', 'source': 'https://lexfridman.com/sam-altman-2-transcript/', 'title': 'Transcript for Sam Altman: OpenAI, GPT-5, Sora, Board Saga, Elon Musk, Ilya, Power & AGI | Lex Fridman Podcast #419 - Lex Fridman'})]"
+      ]
+     },
+     "execution_count": 2,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "retriever.invoke('GPT-5')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "langcorn",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/data_level0.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a13e72541800c513c73dccea69f79e39cf4baef4fa23f7e117c0d6b0f5f99670
+size 3212000

packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/header.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ec6df10978b056a10062ed99efeef2702fa4a1301fad702b53dd2517103c746
+size 100

packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/length.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc19b1997119425765295aeab72d76faa6927d4f83985d328c26f20468d6cc76
+size 4000

packages/rag-chroma/rag_chroma/vecdb/12bce733-e94f-4342-829a-6786a9f92a50/link_lists.bin ADDED Viewed

File without changes

packages/rag-chroma/rag_chroma/vecdb/chroma.sqlite3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:058452996d2a4d5e9b7024ef66bd7f398e9a50fc943b671258681034fb911624
+size 1376256

packages/rag-chroma/tests/__init__.py ADDED Viewed

File without changes

pyproject.toml ADDED Viewed

	@@ -0,0 +1,25 @@

+[tool.poetry]
+name = "my-app"
+version = "0.1.0"
+description = ""
+authors = ["Your Name <you@example.com>"]
+readme = "README.md"
+packages = [
+    { include = "app" },
+]
+[tool.poetry.dependencies]
+python = "^3.11"
+uvicorn = "^0.23.2"
+langserve = {extras = ["server"], version = ">=0.0.30"}
+pydantic = "2.6.0"
+rag-chroma = {path = "packages/rag-chroma", develop = true}
+python-dotenv = "1"
+langchain-together = "0.0.2.post1"
+[tool.poetry.group.dev.dependencies]
+langchain-cli = ">=0.0.15"
+[build-system]
+requires = ["poetry-core"]
+build-backend = "poetry.core.masonry.api"