suwonpabby committed on
Commit
c861cde
1 Parent(s): 49b0675
Files changed (1)
  1. app.py +10 -10
app.py CHANGED
@@ -59,11 +59,11 @@ embedding_model = BGEM3FlagModel(embedding_model_name, use_fp16=True)
 # Util Functions
 
 # Processes a single item, not a batch
-def qa_2_str(qa: List) -> str:
+def qa_2_str(QA: List) -> str:
     result = ""
 
-    if len(qa) > 1:
-        for idx, message in enumerate(qa[:-1]):
+    if len(QA) > 1:
+        for idx, message in enumerate(QA[:-1]):
             if idx % 2 == 0:  # Q
                 result += f"User: {message}\n"
             else:  # A
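The hunk cuts off inside `qa_2_str`. For reference, a minimal sketch of the whole helper, assuming the `else` branch mirrors the `User` branch with the `Assistant:` prefix that appears in the prompt-template context of the next hunk, and that the newest message is deliberately excluded:

```python
from typing import List

# Hypothetical completion of qa_2_str; only the lines above the "else"
# branch appear in the diff, the rest is an assumed mirror of the User case.
def qa_2_str(QA: List) -> str:
    result = ""
    if len(QA) > 1:
        for idx, message in enumerate(QA[:-1]):  # skip the latest turn
            if idx % 2 == 0:  # Q
                result += f"User: {message}\n"
            else:  # A
                result += f"Assistant: {message}\n"
    return result

print(qa_2_str(["Hi", "Hello!", "How are you?"]))
# User: Hi
# Assistant: Hello!
```

On this reading, the latest user turn is left out of the retrieval prompt and presumably handled by the prompt template instead.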
@@ -174,11 +174,11 @@ Assistant: {context_example}
 
 
 @spaces.GPU(duration=35)
-def make_gen(qa, candidates, top_k, character_type):
+def make_gen(QA, candidates, top_k, character_type):
     start_time = time.time()
 
     # Build the RAG prompt
-    rag_prompt = qa_2_str(qa)
+    rag_prompt = qa_2_str(QA)
 
     # Do RAG
     query_embeddings = embedding_model.encode([rag_prompt],
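The retrieval call is truncated mid-expression here. A hedged sketch of what a dense-retrieval step over `candidates` with BGE-M3 could look like; the helper name `retrieve`, the model name, and the dot-product scoring are illustrative assumptions, not taken from app.py:

```python
# Sketch of the truncated "Do RAG" step: score each candidate against the
# query with BGE-M3 dense embeddings and keep the top_k matches.
import numpy as np
from FlagEmbedding import BGEM3FlagModel

embedding_model = BGEM3FlagModel("BAAI/bge-m3", use_fp16=True)  # assumed model name

def retrieve(rag_prompt: str, candidates: list, top_k: int) -> list:
    query_vec = embedding_model.encode([rag_prompt])["dense_vecs"][0]
    cand_vecs = embedding_model.encode(candidates)["dense_vecs"]
    # Dot product as similarity, assuming L2-normalized dense vectors.
    scores = cand_vecs @ query_vec
    top_idx = np.argsort(scores)[::-1][:top_k]
    return [candidates[i] for i in top_idx]
```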
@@ -199,7 +199,7 @@ def make_gen(qa, candidates, top_k, character_type):
 
     # Build the LLM prompt
 
-    final_prompt = make_prompt(qa, rag_result, character_type)
+    final_prompt = make_prompt(QA, rag_result, character_type)
 
     # Use LLM
     streamer = TextIteratorStreamer(llm_tokenizer, skip_special_tokens=True)
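The `# Use LLM` block ends at the streamer in this hunk, but `TextIteratorStreamer` implies the standard transformers pattern: run `generate()` in a worker thread and iterate over decoded text chunks as they arrive. A minimal sketch with a placeholder model and generation settings:

```python
# Standard TextIteratorStreamer usage; gpt2 and max_new_tokens=64 are
# placeholders, only the streamer construction itself appears in the diff.
from threading import Thread
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer

llm_tokenizer = AutoTokenizer.from_pretrained("gpt2")
llm_model = AutoModelForCausalLM.from_pretrained("gpt2")

def stream_tokens(final_prompt: str):
    streamer = TextIteratorStreamer(llm_tokenizer, skip_special_tokens=True)
    inputs = llm_tokenizer(final_prompt, return_tensors="pt")
    # generate() blocks, so it runs in a worker thread while the caller
    # consumes decoded chunks from the streamer.
    thread = Thread(target=llm_model.generate,
                    kwargs=dict(**inputs, streamer=streamer, max_new_tokens=64))
    thread.start()
    for chunk in streamer:
        yield chunk
```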
@@ -239,12 +239,12 @@ def make_gen(qa, candidates, top_k, character_type):
 
 
 @app.get("/")
-async def root_endpoint(qa: List[str], candidates: List[str] = Query(...), top_k: int = Query(...), character_type: int = Query(...)):
-    return StreamingResponse(gen_stream(qa, candidates, top_k, character_type), media_type="text/event-stream")
+async def root_endpoint(QA: List[str] = Query(...), candidates: List[str] = Query(...), top_k: int = Query(...), character_type: int = Query(...)):
+    return StreamingResponse(gen_stream(QA, candidates, top_k, character_type), media_type="text/event-stream")
 
 
-async def gen_stream(qa, candidates, top_k, character_type):
-    for value in make_gen(qa, candidates, top_k, character_type):
+async def gen_stream(QA, candidates, top_k, character_type):
+    for value in make_gen(QA, candidates, top_k, character_type):
         yield value
 