Spaces:

Njomo
/

PotterChat

Sleeping

App Files Files Community

Njomo committed on Mar 18, 2023

Commit

f1a168b

•

1 Parent(s): 2631075

added app files

Browse files

Files changed (5) hide show

app.py +92 -0
chain.py +49 -0
combined.txt +0 -0
data.py +25 -0
docs.pkl +3 -0

app.py ADDED Viewed

	@@ -0,0 +1,92 @@

+import os
+import datetime
+import pickle
+import gradio as gr
+import langchain
+from langchain.llms import HuggingFaceHub
+from chain import get_new_chain
+# Hugging Face API token read from the HF_TOKEN environment variable.
+# Indexing os.environ raises KeyError at import time when the variable is unset.
+api_token = os.environ["HF_TOKEN"]
+def get_faiss_store():
+    with open("docs.pkl", "rb") as f:
+        faiss_store = pickle.load(f)
+        return faiss_store
+def load_model():
+    print(langchain.__file__)
+    vectorstore = get_faiss_store()
+    flan_ul = HuggingFaceHub(repo_id="google/flan-ul2",
+                                model_kwargs={"temperature":0.1, "max_new_tokens":200},
+                                huggingfacehub_api_token=api_token)
+    qa_chain = get_new_chain(vectorstore, flan_ul)
+    return qa_chain
+def chat(inp, agent):
+    result = []
+    if agent is None:
+        result.append((inp, "Please wait for model to load (3-5 seconds)"))
+        return result
+    print("\n==== date/time: " + str(datetime.datetime.now()) + " ====")
+    print("inp: " + inp)
+    result = []
+    output = agent({"question": inp})
+    answer = output["answer"]
+    result.append((inp, answer))
+    print(result)
+    return result
+block = gr.Blocks(css=".gradio-container {background-color: lightgray}")
+with block:
+    with gr.Row():
+        gr.Markdown("<h3><center>PotterChat</center></h3><p>Ask questions about the Harry Potter Books, Powered by Flan-UL2</p>")
+    chatbot = gr.Chatbot()
+    with gr.Row():
+        message = gr.Textbox(
+            label="What's your question?",
+            placeholder="Who was Harry's godfather?",
+            lines=1,
+        )
+        submit = gr.Button(value="Send", variant="secondary").style(full_width=False)
+    gr.Examples(
+        examples=[
+            "Which house in Hogwarts was Harry in?",
+            "Who were Harry's best friends?",
+            "Who taught Potions at Hogwarts?",
+        ],
+        inputs=message,
+    )
+    gr.HTML(
+        """
+    This simple application uses Langchain, an open-source LLM, and FAISS to do Q&A over the Harry Potter books."""
+    )
+    gr.HTML(
+        "<center>Powered by <a href='huggingface.co'>Hugging Face 🤗</a> and <a href='https://github.com/hwchase17/langchain'>LangChain 🦜️🔗</a></center>"
+    )
+    # state = gr.State()
+    agent_state = gr.State()
+    block.load(load_model, inputs=None, outputs=[agent_state])
+    # submit.click(chat, inputs=[message, state, agent_state], outputs=[chatbot, state])
+    # message.submit(chat, inputs=[message, state, agent_state], outputs=[chatbot, state])
+    submit.click(chat, inputs=[message, agent_state], outputs=[chatbot])
+    message.submit(chat, inputs=[message, agent_state], outputs=[chatbot])
+block.launch(debug=True)

chain.py ADDED Viewed

	@@ -0,0 +1,49 @@

+from typing import Dict, List
+from langchain import PromptTemplate
+from langchain.chains.base import Chain
+from langchain.chains.combine_documents.base import BaseCombineDocumentsChain
+from langchain.chains.question_answering import load_qa_chain
+from langchain.prompts import PromptTemplate
+from langchain.vectorstores import FAISS
+from pydantic import BaseModel
+class CustomChain(Chain, BaseModel):
+    vstore: FAISS
+    chain: BaseCombineDocumentsChain
+    @property
+    def input_keys(self) -> List[str]:
+        return ["question"]
+    @property
+    def output_keys(self) -> List[str]:
+        return ["answer"]
+    def _call(self, inputs: Dict[str, str]) -> Dict[str, str]:
+    # def _call(self, inputs: str) -> Dict[str, str]:
+        question = inputs["question"]
+        # question = inputs
+        docs = self.vstore.similarity_search(question, k=5)
+        answer, _ = self.chain.combine_docs(docs, **inputs)
+        return {"answer": answer}
+def get_new_chain(vectorstore, llm):
+    flan_template = """Use only the following pieces of context to answer the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer.
+    {context}
+    Question: {question}
+    """
+    PROMPT = PromptTemplate(template=flan_template, input_variables=["question", "context"])
+    doc_chain = load_qa_chain(
+        llm,
+        chain_type="stuff",
+        prompt=PROMPT,
+        verbose=True
+        )
+    return CustomChain(chain=doc_chain, vstore=vectorstore)

combined.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

data.py ADDED Viewed

	@@ -0,0 +1,25 @@

+import pickle
+from langchain.vectorstores import FAISS
+from langchain.embeddings import HuggingFaceEmbeddings
+file = open("combined.txt", "r")
+contents = file.read()
+embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-mpnet-base-v2")
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+text_splitter = RecursiveCharacterTextSplitter(
+    chunk_size = 500,
+    chunk_overlap  = 20,
+    length_function = len,
+)
+texts = text_splitter.create_documents([contents])
+print("Beginning construction of FAISS DB")
+docs = FAISS.from_documents(texts, embeddings)
+print("Beginning pickle")
+with open("docs.pkl", "wb") as f:
+    pickle.dump(docs, f)
+print("pickle over")

docs.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:382cb8f95c5e1aa71364e67eb6383368c231b002173aaf5db073ed793f32b5d6
+size 502076344