updated prompt
- app.py +22 -18
- chroma/28c81268-af8d-4e89-9744-aee894bcbde6/data_level0.bin +0 -3
- chroma/28c81268-af8d-4e89-9744-aee894bcbde6/header.bin +0 -3
- chroma/28c81268-af8d-4e89-9744-aee894bcbde6/index_metadata.pickle +0 -3
- chroma/28c81268-af8d-4e89-9744-aee894bcbde6/length.bin +0 -3
- chroma/28c81268-af8d-4e89-9744-aee894bcbde6/link_lists.bin +0 -3
- chroma/8b53584a-0ad0-4736-8a94-cfa8d70be50f/header.bin +0 -3
- chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/data_level0.bin +0 -3
- chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/index_metadata.pickle +0 -3
- chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/length.bin +0 -3
- chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/link_lists.bin +0 -3
- chroma/chroma.sqlite3 +2 -2
- chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/data_level0.bin +1 -1
- chroma/{c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/header.bin +0 -0
- chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/index_metadata.pickle +1 -1
- chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/length.bin +1 -1
- chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/link_lists.bin +1 -1
app.py
CHANGED
@@ -2,7 +2,6 @@
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 from langchain.vectorstores import Chroma
 from langchain.embeddings import HuggingFaceEmbeddings
-from peft import AutoPeftModelForCausalLM
 
 import gradio as gr
 import hanzidentifier
@@ -18,14 +17,15 @@ current_path=str(pathlib.Path(__file__).parent.resolve())
 llm_model_name="Qwen/Qwen1.5-0.5B-Chat"
 
 #pipe = pipeline("text2text-generation", model=model)
-#model = AutoModelForCausalLM.from_pretrained(
-#    llm_model_name
-#)
-
 model = AutoModelForCausalLM.from_pretrained(
     "ytyeung/Qwen1.5-0.5B-Chat-SFT-riddles",
 )
 
+#model = AutoPeftModelForCausalLM.from_pretrained(
+#    "Qwen1.5_0.5B_Chat_sft_full/checkpoint-300",
+#    low_cpu_mem_usage=True,
+#)
+
 tokenizer = AutoTokenizer.from_pretrained(llm_model_name)
 
 # %%
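This hunk drops the unused PEFT import, loads the merged fine-tuned checkpoint ytyeung/Qwen1.5-0.5B-Chat-SFT-riddles, and keeps the base Qwen/Qwen1.5-0.5B-Chat tokenizer. The generation call itself is outside this diff; the following is a minimal sketch of how that model/tokenizer pair could be exercised on its own (the chat-template usage and generation settings are assumptions, not code from app.py):

# Hedged sketch: illustrative standalone usage, not the app's actual generation code.
from transformers import AutoTokenizer, AutoModelForCausalLM

base_name = "Qwen/Qwen1.5-0.5B-Chat"                # tokenizer comes from the base chat model
sft_name = "ytyeung/Qwen1.5-0.5B-Chat-SFT-riddles"  # fine-tuned riddle weights

tokenizer = AutoTokenizer.from_pretrained(base_name)
model = AutoModelForCausalLM.from_pretrained(sft_name)

messages = [{"role": "user", "content": "猜谜语:\n谜面:千条线,万条线,掉到水里看不见。(猜一自然现象)\n谜底是什么?"}]
# Qwen1.5 chat models ship a chat template, so this builds the expected prompt format.
inputs = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt")
outputs = model.generate(inputs, max_new_tokens=64)
print(tokenizer.decode(outputs[0][inputs.shape[-1]:], skip_special_tokens=True))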
@@ -72,16 +72,20 @@ threshold = 0.6
 def answer(input_text,context=None):
     if context:
         tips = "提示:\n"
-
-
-
-
-
-
+        for i, tip in enumerate(context):
+            #if i==0:
+            #    tips +="最佳答案\n"
+            #else:
+            #    tips +="較差答案\n"
+            tips += f"谜面:{tip[0]} 谜底是:{tip[1]} "
+            tips +="\n"
+        print (f"====\n{input_text}\n{context[0][0]} 谜底是:{context[0][1]} {context[0][2]}")
+        if context[0][2] >=0.9:
+            return f"谜底是:{context[0][1]}"
     else:
         tips=""
 
-    prompt = f"{input_text}\n{tips}\n谜底是什么?"
+    prompt = f"{input_text}\n\n{tips}\n\n谜底是什么?"
    prompt = prompt.strip()
 
     print(f"===\n{prompt}")
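After this change, answer() expects context to be a list of (riddle text, answer, relevance score) tuples with the best match first: a top score of 0.9 or above short-circuits to the stored answer without calling the model, otherwise every retrieved pair is folded into the 提示 block of the prompt. A standalone sketch of that control flow, with made-up sample values:

# Hedged sketch: dummy retrieved context mirroring the tuple layout built by helper_rag.
input_text = "猜谜语:\n谜面:小家伙穿黄袍,花丛中把房造。(猜一动物)"
context = [
    ("千条线,万条线,掉到水里看不见。", "雨", 0.93),
    ("小家伙穿黄袍,花丛中把房造。", "蜜蜂", 0.71),
]

if context and context[0][2] >= 0.9:
    # High-confidence retrieval hit: return the stored answer directly.
    result = f"谜底是:{context[0][1]}"
else:
    # Otherwise fold the retrieved riddle/answer pairs into the prompt as hints.
    tips = "提示:\n" + "".join(f"谜面:{q} 谜底是:{a} \n" for q, a, _ in context)
    result = f"{input_text}\n\n{tips}\n\n谜底是什么?".strip()
print(result)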
@@ -120,7 +124,7 @@ def helper_rag(text):
     context = []
     for doc in docs_out:
         if doc[1] > threshold:
-            context.append((
+            context.append((doc[0].page_content, doc[0].metadata['answer'], doc[1]))
 
     return context
 
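helper_rag() now keeps the riddle text, the stored answer from the document metadata, and the relevance score for every hit above the 0.6 threshold. The retrieval call that produces docs_out sits outside this hunk; the sketch below assumes a LangChain Chroma store queried with similarity_search_with_relevance_scores, and the store setup here is illustrative rather than the app's exact configuration (presumably it loads the persisted ./chroma collection committed in this repo):

# Hedged sketch: assumed retrieval backing docs_out; store setup is illustrative.
from langchain.vectorstores import Chroma
from langchain.embeddings import HuggingFaceEmbeddings

threshold = 0.6
embeddings = HuggingFaceEmbeddings()
db = Chroma(persist_directory="chroma", embedding_function=embeddings)

def helper_rag(text):
    # Returns (Document, relevance score in [0, 1]) pairs, best match first.
    docs_out = db.similarity_search_with_relevance_scores(text, k=3)
    context = []
    for doc in docs_out:
        if doc[1] > threshold:
            context.append((doc[0].page_content, doc[0].metadata['answer'], doc[1]))
    return context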
@@ -132,7 +136,7 @@ def helper_text(text_input,radio=None):
         text_input = chinese_converter.to_simplified(text_input)
         chinese_type = "traditional"
 
-    text_input = re.sub(r'hint',"猜",text_input,flags=re.I)
+    text_input = re.sub(r'hint:',"猜",text_input,flags=re.I)
 
     #if not any(c in text_input for c in ["猜", "打"]):
     #    warning = "请给一个提示,提示格式,例子:猜一水果,打一字。"
@@ -140,10 +144,9 @@ def helper_text(text_input,radio=None):
     #    warning = chinese_converter.to_traditional(warning)
     #    return warning
 
-    text=f"""猜谜语:\n谜面:{text_input}
-    """
+    text=f"""猜谜语:\n谜面:{text_input}"""
 
-    context = helper_rag(
+    context = helper_rag(text_input)
 
     output = answer(text,context=context)
 
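These two hunks tighten the preprocessing in helper_text(): the "hint" rewrite now only matches an explicit "hint:" marker (case-insensitively), the 猜谜语 prompt collapses to a single-line f-string, and retrieval runs on the raw riddle text rather than the wrapped prompt. A small usage sketch of the normalization step, with a made-up input and the traditional/simplified branch hedged as an assumption about how the app uses hanzidentifier:

# Hedged sketch: sample input is invented; the is_traditional check is an assumed branch.
import re
import hanzidentifier
import chinese_converter

text_input = "一物生來身穿三百多件衣,每天脫一件,年底剩張皮。(hint: one object)"

if hanzidentifier.is_traditional(text_input):
    # Traditional input is converted to simplified before retrieval and prompting.
    text_input = chinese_converter.to_simplified(text_input)

# An English "hint:" marker becomes 猜, matched case-insensitively.
text_input = re.sub(r'hint:', "猜", text_input, flags=re.I)

text = f"""猜谜语:\n谜面:{text_input}"""
print(text)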
@@ -248,6 +251,7 @@ def translate_text(text_input,text_output):
 
     text_input = translate(f"{text_input}")
     text_output = translate(f"{text_output}")
+
     return text_input,text_output
 
 
@@ -266,7 +270,7 @@ with gr.Blocks() as demo:
         ["小家伙穿黄袍,花丛中把房造。飞到西来飞到东,人人夸他爱劳动。(猜一动物)"],
         ["一物生来身穿三百多件衣,每天脱一件,年底剩张皮。(猜一物品)"],
         ["A thousand threads, a million strands. Reaching the water, vanishing all at once. (Hint: natural phenomenon)"],
-        ["
+        ["无底洞(猜一成语)"],
     ]
     radio = gr.Radio(
         ["简体中文","繁體中文", "English"],show_label=False,value="简体中文"
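The example list gains the idiom riddle 无底洞(猜一成语). Reduced to just the UI pieces touched here, a minimal Gradio sketch of how such an examples list and the language radio might plug into a Blocks demo (component names, labels, and wiring are assumptions, not the full app):

# Hedged sketch: a minimal Blocks layout, not the app's actual UI.
import gradio as gr

examples = [
    ["一物生来身穿三百多件衣,每天脱一件,年底剩张皮。(猜一物品)"],
    ["无底洞(猜一成语)"],
]

def helper_text(text_input, radio=None):
    # Placeholder for the real solver; simply echoes the riddle here.
    return f"谜面:{text_input}"

with gr.Blocks() as demo:
    radio = gr.Radio(["简体中文", "繁體中文", "English"], show_label=False, value="简体中文")
    text_input = gr.Textbox(label="谜面")
    text_output = gr.Textbox(label="谜底")
    gr.Examples(examples=examples, inputs=[text_input])
    gr.Button("猜").click(helper_text, inputs=[text_input, radio], outputs=text_output)

demo.launch()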
chroma/28c81268-af8d-4e89-9744-aee894bcbde6/data_level0.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0067068c3258f065668e2ad17382df3424f1c001807139881c2dc1691772ac7b
-size 28908000
chroma/28c81268-af8d-4e89-9744-aee894bcbde6/header.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4b630aa796b842f9cb3af4a5f7cbc9fd3fc793047cec78a183ac3eaa83d68497
-size 100
chroma/28c81268-af8d-4e89-9744-aee894bcbde6/index_metadata.pickle
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e1f937c780ce5ab483dc40c3bf8d8408b3fa3d1bf03b5d20488b0d5b8a906fde
-size 520085
chroma/28c81268-af8d-4e89-9744-aee894bcbde6/length.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3a76c43e6fc007afd7f87d90b5a60a482449450491f8b307c5617b83471cf7a7
-size 36000
chroma/28c81268-af8d-4e89-9744-aee894bcbde6/link_lists.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:dcde28a793504ace57c738a180d964a0c8ed59bf30194cdde6f16484f267ba06
-size 80540
chroma/8b53584a-0ad0-4736-8a94-cfa8d70be50f/header.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2ffd87324d19f8f6366a4be4dccc22a83a50ca6837d1327fb660dc4b4e25d140
-size 100
chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/data_level0.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0fab3b1442c2e9319c9406cb2db197e9b806a2d4122f8c3575c62d4a0fff1dc5
-size 3212000
chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/index_metadata.pickle
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ca24af71d714f0248ef6b2057c614abc943d509f5289bfdaf8d41d3f4d38d22c
-size 55974
chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/length.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:9814e6d812bbb532273fec5061e2a38f55f8cab0dbe292ff0ba8d230076943ce
-size 4000
chroma/c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a/link_lists.bin
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2f5dc8c4171f8df8a126112a3ebe4e91ccb0895344eff083d43ad767f6effc54
-size 8148
chroma/chroma.sqlite3
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:5b44b6dd7c8ba23f9faa645c2562ec8b601e93f915588d07876518ac0a686614
+size 7327744
chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/data_level0.bin
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:b6b26a194dc2620543256c04ccea396ecd8de5787096f7d87d9a9474e9480754
 size 3212000
chroma/{c2db2536-5ceb-4ce6-b43c-7b5a8994dc6a → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/header.bin
RENAMED
File without changes
chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/index_metadata.pickle
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:84ebb46c8fd7958ede9a01c261de4f9f85f1020cf32b8ef2afeca67e0b0c62d0
 size 55974
chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/length.bin
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:45569e91b592cc6a9fce4ee6a878eb041638b21d09934f0b7158eda3aa83ad89
 size 4000
chroma/{8b53584a-0ad0-4736-8a94-cfa8d70be50f → db67d0e6-bc9f-4536-a3d5-3b23e19e0212}/link_lists.bin
RENAMED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:421b1cc5ed6bbb1c3f7433d3afd18fcc96e7b0b4d670b4f374b599eec28bd8f2
 size 8148