Spaces: Sleeping
Commit: "engineering the code" — Browse files
Files changed:
- app.py (+13, −11)
- inference.py (+11, −0)
- utils.py (+0, −0)
app.py
CHANGED
@@ -1,16 +1,8 @@
|
|
1 |
import gradio as gr
|
2 |
import os
|
3 |
-
from transformers import ViltProcessor, ViltForQuestionAnswering
|
4 |
|
5 |
-
|
6 |
-
|
7 |
-
model = ViltForQuestionAnswering.from_pretrained("dandelin/vilt-b32-finetuned-vqa")
|
8 |
-
encoding = processor(image, text, return_tensors="pt")
|
9 |
-
|
10 |
-
outputs = model(**encoding)
|
11 |
-
logits = outputs.logits
|
12 |
-
idx = logits.argmax(-1).item()
|
13 |
-
return f"{model.config.id2label[idx]}"
|
14 |
|
15 |
|
16 |
with gr.Blocks() as block:
|
@@ -22,7 +14,17 @@ with gr.Blocks() as block:
|
|
22 |
|
23 |
dogs = os.path.join(os.path.dirname(__file__), "617.jpg")
|
24 |
image = gr.Image(type="pil", value=dogs)
|
25 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
|
27 |
btn = gr.Button(value="Submit")
|
28 |
|
|
|
1 |
import gradio as gr
|
2 |
import os
|
|
|
3 |
|
4 |
+
from inference import *
|
5 |
+
from utils import *
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
|
7 |
|
8 |
with gr.Blocks() as block:
|
|
|
14 |
|
15 |
dogs = os.path.join(os.path.dirname(__file__), "617.jpg")
|
16 |
image = gr.Image(type="pil", value=dogs)
|
17 |
+
|
18 |
+
selected_option = block.get_element("dropdown").value
|
19 |
+
# here we can insert two or more models to inference the data
|
20 |
+
if selected_option == "Model 1":
|
21 |
+
btn.click(inference, inputs=[image, txt], outputs=[txt_3 + " Model 1"])
|
22 |
+
|
23 |
+
elif selected_option == "Model 2":
|
24 |
+
btn.click(inference, inputs=[image, txt], outputs=[txt_3 + " Model 2"])
|
25 |
+
|
26 |
+
elif selected_option == "Model 3":
|
27 |
+
btn.click(inference, inputs=[image, txt], outputs=[txt_3 + " Model 3"])
|
28 |
|
29 |
btn = gr.Button(value="Submit")
|
30 |
|
inference.py
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from functools import lru_cache

from transformers import ViltProcessor, ViltForQuestionAnswering

# Pretrained ViLT checkpoint fine-tuned for visual question answering.
_MODEL_NAME = "dandelin/vilt-b32-finetuned-vqa"


@lru_cache(maxsize=1)
def _load_vqa():
    """Load and cache the ViLT VQA processor and model.

    The checkpoint is hundreds of MB; downloading/initialising it on every
    request made the original implementation pay that cost per call.  The
    cache is lazy, so importing this module stays side-effect free.
    """
    processor = ViltProcessor.from_pretrained(_MODEL_NAME)
    model = ViltForQuestionAnswering.from_pretrained(_MODEL_NAME)
    return processor, model


def inference(image, text):
    """Answer a natural-language question about an image with ViLT VQA.

    Parameters
    ----------
    image :
        Input image; presumably a ``PIL.Image.Image`` (gradio's
        ``gr.Image(type="pil")`` supplies one) — TODO confirm against caller.
    text : str
        The question to ask about the image.

    Returns
    -------
    str
        The highest-scoring answer label from the model's vocabulary.
    """
    processor, model = _load_vqa()
    # Encode the (image, question) pair into PyTorch model inputs.
    encoding = processor(image, text, return_tensors="pt")
    outputs = model(**encoding)
    logits = outputs.logits
    # argmax over the answer vocabulary, mapped back to its label string.
    idx = logits.argmax(-1).item()
    return f"{model.config.id2label[idx]}"
utils.py
ADDED
File without changes
|