Spaces:

Chan-Y
/

Mistral-7B-Summarizer

Sleeping

Chan-Y committed on Jul 4, 2024

Commit

bf3ac4c

verified ·

1 Parent(s): 9be919d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,6 +7,7 @@ from langchain.prompts import PromptTemplate
 from pathlib import Path
 from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint
 from langchain_core.output_parsers import JsonOutputParser
 llm = HuggingFaceEndpoint(
     repo_id="mistralai/Mistral-7B-Instruct-v0.3",
@@ -34,26 +35,7 @@ def summarize(file, n_words):
         with open(file_path, 'r', encoding='utf-8') as f:
             text = f.read()
-    template_detect = '''
-Please carefully read the following document:
-<document>
-{TEXT}
-</document>
-identify the MOST used language in the document, return detected language in json format with key "language" and value is the detected language
-'''
-    prompt_detect = PromptTemplate(
-        template=template_detect,
-        input_variables=['TEXT']
-    )
-    language_detect = prompt_detect | llm | JsonOutputParser()
-    formatted_prompt = prompt_detect.format(TEXT=text)
-    language = language_detect.invoke(formatted_prompt)
-    lang = language["language"]
     template_translate = '''
 Please carefully read the following document:
 <document>

 from pathlib import Path
 from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint
 from langchain_core.output_parsers import JsonOutputParser
+from langdetect import detect
 llm = HuggingFaceEndpoint(
     repo_id="mistralai/Mistral-7B-Instruct-v0.3",
         with open(file_path, 'r', encoding='utf-8') as f:
             text = f.read()
+    lang = detect(text)
     template_translate = '''
 Please carefully read the following document:
 <document>