docquery

Paused

App Files Community

mqcm2 committed on Sep 6, 2024

Commit

ec21dfa

verified ·

1 Parent(s): 733725d

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -42

app.py CHANGED Viewed

@@ -21,9 +21,8 @@ def ensure_list(x):
 CHECKPOINTS = {
-    "LayoutLMv1 🦉": "impira/layoutlm-document-qa",
-    "LayoutLMv1 for Invoices 💸": "impira/layoutlm-invoices",
-    "Donut 🍩": "naver-clova-ix/donut-base-finetuned-docvqa",
 }
 PIPELINES = {}
@@ -71,34 +70,6 @@ def normalize_bbox(box, width, height, padding=0.005):
     return [min_x * width, min_y * height, max_x * width, max_y * height]
-examples = [
-    [
-        "invoice.png",
-        "What is the invoice number?",
-    ],
-    [
-        "contract.jpeg",
-        "What is the purchase amount?",
-    ],
-    [
-        "statement.png",
-        "What are net sales for 2020?",
-    ],
-    #    [
-    #        "docquery.png",
-    #        "How many likes does the space have?",
-    #    ],
-    #    [
-    #        "hacker_news.png",
-    #        "What is the title of post number 5?",
-    #    ],
-]
-question_files = {
-    "What are net sales for 2020?": "statement.pdf",
-    "How many likes does the space have?": "https://huggingface.co/spaces/impira/docquery",
-    "What is the title of post number 5?": "https://news.ycombinator.com",
-}
 def process_path(path):
@@ -288,14 +259,11 @@ gradio-app h2, .gradio-app h2 {
 """
 with gr.Blocks(css=CSS) as demo:
-    gr.Markdown("# DocQuery: Document Query Engine")
     gr.Markdown(
-        "DocQuery (created by [Impira](https://impira.com?utm_source=huggingface&utm_medium=referral&utm_campaign=docquery_space))"
-        " uses LayoutLMv1 fine-tuned on DocVQA, a document visual question"
         " answering dataset, as well as SQuAD, which boosts its English-language comprehension."
-        " To use it, simply upload an image or PDF, type a question, and click 'submit', or "
-        " click one of the examples to load them."
-        " DocQuery is MIT-licensed and available on [Github](https://github.com/impira/docquery)."
     )
     document = gr.Variable()
@@ -330,16 +298,12 @@ with gr.Blocks(css=CSS) as demo:
                     )
             gr.Markdown("— or —")
             upload = gr.File(label=None, interactive=True, elem_id="short-upload-box")
-            gr.Examples(
-                examples=examples,
-                inputs=[example_image, example_question],
-            )
         with gr.Column() as col:
             gr.Markdown("## 2. Ask a question")
             question = gr.Textbox(
                 label="Question",
-                placeholder="e.g. What is the invoice number?",
                 lines=1,
                 max_lines=1,
             )

 CHECKPOINTS = {
+    "LayoutLMv1": "impira/layoutlm-document-qa",
+    "distilbert": "distilbert/distilbert-base-cased-distilled-squad",
 }
 PIPELINES = {}
     return [min_x * width, min_y * height, max_x * width, max_y * height]
 def process_path(path):
 """
 with gr.Blocks(css=CSS) as demo:
+    gr.Markdown("# Document Chatbot")
     gr.Markdown(
+        "Document Chatbot uses LayoutLMv1 fine-tuned on DocVQA, a document visual question"
         " answering dataset, as well as SQuAD, which boosts its English-language comprehension."
+        " To use it, simply upload an image or PDF, type a question, and click 'submit'."
     )
     document = gr.Variable()
                     )
             gr.Markdown("— or —")
             upload = gr.File(label=None, interactive=True, elem_id="short-upload-box")
         with gr.Column() as col:
             gr.Markdown("## 2. Ask a question")
             question = gr.Textbox(
                 label="Question",
+                placeholder="e.g. What is the document about?",
                 lines=1,
                 max_lines=1,
             )