chat-llm-streaming

Running

App Files Files Community

star_nox committed on Mar 30, 2023

Commit

c1d7a66

•

1 Parent(s): e5f680f

added context retrieval

Browse files

Files changed (3) hide show

__pycache__/retrieval.cpython-310.pyc +0 -0
app.py +11 -3
retrieval.py +66 -0

__pycache__/retrieval.cpython-310.pyc ADDED Viewed

Binary file (2.91 kB). View file

app.py CHANGED Viewed

@@ -1,9 +1,11 @@
 import os
 import gradio as gr
 from text_generation import Client, InferenceAPIClient
 openchat_preprompt = (
     "\n<human>: Hi!\n<bot>: My name is Bot, model version is 0.15, part of an open-source kit for "
     "fine-tuning new bots! I was created by Together, LAION, and Ontocord.ai and the open-source "
@@ -110,7 +112,13 @@ def predict(
             for i in range(0, len(history) - 1, 2)
         ]
         yield chat, history
 def reset_textbox():
     """Return a Gradio update whose value is the empty string."""
     cleared = gr.update(value="")
     return cleared

 import os
 import gradio as gr
 from text_generation import Client, InferenceAPIClient
+import retrieval
+NUM_ANSWERS_GENERATED = 3
 openchat_preprompt = (
     "\n<human>: Hi!\n<bot>: My name is Bot, model version is 0.15, part of an open-source kit for "
     "fine-tuning new bots! I was created by Together, LAION, and Ontocord.ai and the open-source "
             for i in range(0, len(history) - 1, 2)
         ]
         yield chat, history
+    # add context retrieval part here
+    ta = retrieval.Retrieval()
+    ta._load_pinecone_vectorstore()
+    question = inputs
+    top_context_list = ta.retrieve_contexts_from_pinecone(user_question=question, topk=NUM_ANSWERS_GENERATED)
+    print(top_context_list)
 def reset_textbox():
     """Return a Gradio update whose value is the empty string."""
     cleared = gr.update(value="")
     return cleared

retrieval.py ADDED Viewed

	@@ -0,0 +1,66 @@

+import json
+import os
+import pathlib
+import sys
+import time
+from typing import Any, Dict, List
+import pinecone  # cloud-hosted vector database for context retrieval
+# for vector search
+from langchain.embeddings import HuggingFaceEmbeddings
+from langchain.vectorstores import Pinecone
+from dotenv import load_dotenv
+from PIL import Image
+from transformers import (AutoModelForSequenceClassification, AutoTokenizer, GPT2Tokenizer, OPTForCausalLM, T5ForConditionalGeneration)
+PINECONE_API_KEY="insert your pinecone api key here"
+class Retrieval:
+    def __init__(self,
+               device='cuda',
+               use_clip=True):
+        self.user_question = ''
+        self.max_text_length = None
+        self.pinecone_index_name = 'uiuc-chatbot'  # uiuc-chatbot-v2
+        self.use_clip = use_clip
+        # init parameters
+        self.device = device
+        self.num_answers_generated = 3
+        self.vectorstore = None
+    def _load_pinecone_vectorstore(self,):
+        model_name = "intfloat/e5-large"  # best text embedding model. 1024 dims.
+        pincecone_index = pinecone.Index("uiuc-chatbot")
+        embeddings = HuggingFaceEmbeddings(model_name=model_name)
+        #pinecone.init(api_key=os.environ['PINECONE_API_KEY'], environment="us-west1-gcp")
+        pinecone.init(api_key=PINECONE_API_KEY, environment="us-west1-gcp")
+        print(pinecone.list_indexes())
+        self.vectorstore = Pinecone(index=pincecone_index, embedding_function=embeddings.embed_query, text_key="text")
+    def retrieve_contexts_from_pinecone(self, user_question: str, topk: int = None) -> List[Any]:
+        '''
+        Invoke Pinecone for vector search. These vector databases are created in the notebook `data_formatting_patel.ipynb` and `data_formatting_student_notes.ipynb`.
+        Returns a list of LangChain Documents. They have properties: `doc.page_content`: str, doc.metadata['page_number']: int, doc.metadata['textbook_name']: str.
+        '''
+        print("USER QUESTION: ", user_question)
+        print("TOPK: ", topk)
+        if topk is None:
+            topk = self.num_answers_generated
+        # similarity search
+        top_context_list = self.vectorstore.similarity_search(user_question, k=topk)
+        # add the source info to the bottom of the context.
+        top_context_metadata = [f"Source: page {doc.metadata['page_number']} in {doc.metadata['textbook_name']}" for doc in top_context_list]
+        relevant_context_list = [f"{text.page_content}. {meta}" for text, meta in zip(top_context_list, top_context_metadata)]
+        return relevant_context_list