Spaces:

VGG11
/

armenian_chatbot_bert_multilingual

Runtime error

Mary12 committed on Aug 1, 2023

Commit

163cb0f

•

1 Parent(s): d5c2598

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,7 +3,18 @@ from transformers import AutoTokenizer, AutoModelForQuestionAnswering
 import torch
 import transformers
 from transformers import pipeline
 def model(model_name):
   tokenizer = AutoTokenizer.from_pretrained(model_name)
   model = AutoModelForQuestionAnswering.from_pretrained(model_name,return_dict = False)
@@ -20,10 +31,8 @@ def qa_result(context, question):
   pipe = model(model_name)
   result = pipe(question = question, context=context)
   answered = result['answer']
-  if answered[0].islower():
-    answered[0] = answered[0].upper()
-  # answered = answered.replace(answered[len(answered)-1], ":")
-  return answered
 theme = gr.themes.Soft().set(
     body_background_fill='*background_fill_secondary',

 import torch
 import transformers
 from transformers import pipeline
+import re
+import html
def remove_references(text):
    """Return *text* with citation markers and bracketed links removed.

    The cleanup runs in this order:

    1. HTML entities are decoded (``&amp;`` -> ``&``).
    2. Numeric reference markers such as ``[12]`` are dropped.
    3. Bracketed hyperlinks are dropped, both the labelled form
       ``[http://host label]`` and the bare form ``[http://host]``.
    4. Every run of whitespace is collapsed to a single space and the
       result is stripped at both ends.

    Args:
        text: The string to clean. Empty or ``None`` input yields ``""``.

    Returns:
        The cleaned string.
    """
    if not text:
        return ""
    # Decode entities first: otherwise entity-encoded brackets
    # (e.g. "&#91;1&#93;") only turn into "[1]" after the patterns below
    # have already run, and the marker leaks into the output.
    text = html.unescape(text)
    text = re.sub(r'\[\d+\]', '', text)  # numeric reference, e.g. [3]
    text = re.sub(r'\[https?://[^\[\]]+\s[^\[\]]+\]', '', text)  # hyperlink with label text
    text = re.sub(r'\[https?://[^\[\]]+\]', '', text)  # bare hyperlink
    # Removing spans can leave doubled spaces behind; normalise them last.
    return re.sub(r'\s+', ' ', text).strip()
 def model(model_name):
   tokenizer = AutoTokenizer.from_pretrained(model_name)
   model = AutoModelForQuestionAnswering.from_pretrained(model_name,return_dict = False)
   pipe = model(model_name)
   result = pipe(question = question, context=context)
   answered = result['answer']
+  text = remove_references(answered)
+  return text.capitalize()
 theme = gr.themes.Soft().set(
     body_background_fill='*background_fill_secondary',