bstraehle committed on
Commit
caeaee0
1 Parent(s): fbf1f2e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +53 -48
app.py CHANGED
@@ -1,5 +1,5 @@
1
  import gradio as gr
2
- import logging, os, sys, time
3
 
4
  from dotenv import load_dotenv, find_dotenv
5
 
@@ -7,6 +7,8 @@ from rag_langchain import LangChainRAG
7
  from rag_llamaindex import LlamaIndexRAG
8
  from trace import trace_wandb
9
 
 
 
10
  _ = load_dotenv(find_dotenv())
11
 
12
  RAG_INGESTION = False # load, split, embed, and store documents
@@ -34,55 +36,58 @@ def invoke(openai_api_key, prompt, rag_option):
34
  if (rag_option is None):
35
  raise gr.Error("Retrieval-Augmented Generation is required.")
36
 
37
- os.environ["OPENAI_API_KEY"] = openai_api_key
38
-
39
- if (RAG_INGESTION):
40
- if (rag_option == RAG_LANGCHAIN):
41
- rag = LangChainRAG()
42
- rag.ingestion(config)
43
- elif (rag_option == RAG_LLAMAINDEX):
44
- rag = LlamaIndexRAG()
45
- rag.ingestion(config)
46
-
47
- completion = ""
48
- result = ""
49
- callback = ""
50
- err_msg = ""
51
 
52
- try:
53
- start_time_ms = round(time.time() * 1000)
54
-
55
- if (rag_option == RAG_LANGCHAIN):
56
- rag = LangChainRAG()
57
- completion, callback = rag.rag_chain(config, prompt)
58
- result = completion["result"]
59
- elif (rag_option == RAG_LLAMAINDEX):
60
- rag = LlamaIndexRAG()
61
- result, callback = rag.retrieval(config, prompt)
62
- else:
63
- rag = LangChainRAG()
64
- completion, callback = rag.llm_chain(config, prompt)
65
- result = completion.generations[0][0].text
66
- except Exception as e:
67
- err_msg = e
68
-
69
- raise gr.Error(e)
70
- finally:
71
- end_time_ms = round(time.time() * 1000)
72
 
73
- trace_wandb(
74
- config,
75
- rag_option,
76
- prompt,
77
- completion,
78
- result,
79
- callback,
80
- err_msg,
81
- start_time_ms,
82
- end_time_ms
83
- )
84
-
85
- return result
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
86
 
87
  gr.close_all()
88
 
 
1
  import gradio as gr
2
+ import logging, os, sys, threading, time
3
 
4
  from dotenv import load_dotenv, find_dotenv
5
 
 
7
  from rag_llamaindex import LlamaIndexRAG
8
  from trace import trace_wandb
9
 
10
+ lock = threading.Lock()
11
+
12
  _ = load_dotenv(find_dotenv())
13
 
14
  RAG_INGESTION = False # load, split, embed, and store documents
 
36
  if (rag_option is None):
37
  raise gr.Error("Retrieval-Augmented Generation is required.")
38
 
39
+ with lock:
40
+ os.environ["OPENAI_API_KEY"] = openai_api_key
41
+
42
+ if (RAG_INGESTION):
43
+ if (rag_option == RAG_LANGCHAIN):
44
+ rag = LangChainRAG()
45
+ rag.ingestion(config)
46
+ elif (rag_option == RAG_LLAMAINDEX):
47
+ rag = LlamaIndexRAG()
48
+ rag.ingestion(config)
 
 
 
 
49
 
50
+ completion = ""
51
+ result = ""
52
+ callback = ""
53
+ err_msg = ""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
 
55
+ try:
56
+ start_time_ms = round(time.time() * 1000)
57
+
58
+ if (rag_option == RAG_LANGCHAIN):
59
+ rag = LangChainRAG()
60
+ completion, callback = rag.rag_chain(config, prompt)
61
+ result = completion["result"]
62
+ elif (rag_option == RAG_LLAMAINDEX):
63
+ rag = LlamaIndexRAG()
64
+ result, callback = rag.retrieval(config, prompt)
65
+ else:
66
+ rag = LangChainRAG()
67
+ completion, callback = rag.llm_chain(config, prompt)
68
+ result = completion.generations[0][0].text
69
+ except Exception as e:
70
+ err_msg = e
71
+
72
+ raise gr.Error(e)
73
+ finally:
74
+ end_time_ms = round(time.time() * 1000)
75
+
76
+ trace_wandb(
77
+ config,
78
+ rag_option,
79
+ prompt,
80
+ completion,
81
+ result,
82
+ callback,
83
+ err_msg,
84
+ start_time_ms,
85
+ end_time_ms
86
+ )
87
+
88
+ del os.environ["OPENAI_API_KEY"]
89
+
90
+ return result
91
 
92
  gr.close_all()
93