Spaces:

xdecoder
/

Demo

Runtime error

App Files Community

jw2yang committed on Dec 21, 2022

Commit

d1def87

•

1 Parent(s): d575688

change the task order

Browse files

Files changed (1) hide show

app.py +4 -4

app.py CHANGED Viewed

@@ -78,7 +78,7 @@ def inference(image, task, *args, **kwargs):
             return referring_captioning([model_last, model_cap], image, *args, **kwargs)
         elif task == 'Text Retrieval':
             return text_retrieval(model_cap, image, *args, **kwargs)
-        elif task == 'Image/Region Retrieval (Only Support Exampled 80 images)':
             return region_retrieval([model_cap, model_last], image, *args, **kwargs)
 '''
@@ -88,7 +88,7 @@ title = "X-Decoder All-in-One Demo"
 description = "<p style='text-align: center'> <a href='' target='_blank'>Project Page</a> | <a href='' target='_blank'>Paper</a> | <a href='https://github.com/microsoft/X-Decoder' target='_blank'>Github Repo</a> | <a href='' target='_blank'>Video</a> </p>"
 article = "The Demo is Run on X-Decoder (Focal-T)."
-inputs = [gr.inputs.Image(type='pil'), gr.inputs.Radio(choices=["Referring Segmentation", 'Open Vocabulary Semantic Segmentation','Open Vocabulary Instance Segmentation', "Open Vocabulary Panoptic Segmentation", "Image Captioning", "Text Retrieval", "Referring Editing", "Referring Captioning (Beta)", "Image/Region Retrieval (Only Support Exampled 80 images)"], type="value", default="OpenVocab Semantic Segmentation", label="Task"), gr.Textbox(label="xdecoder_text"), gr.Textbox(label="inpainting_text"), gr.Textbox(label="task_description")]
 gr.Interface(
     fn=inference,
     inputs=inputs,
@@ -99,7 +99,7 @@ gr.Interface(
         gr.Textbox(label="text restuls"),
         gr.outputs.Image(
         type="pil",
-        label="inpainting results"),
     ],
     examples=[
     ["./images/fruit.jpg", "Referring Segmentation", "The larger watermelon.,The front white flower.,White tea pot.,Flower bunch.,white vase.,The peach on the left.,The brown knife.", '', 'Format: s,s,s'],
@@ -108,7 +108,7 @@ gr.Interface(
     ["./images/owls.jpeg", "Open Vocabulary Instance Segmentation", "owl", '', 'Format: y,y,y'],
     ["./images/mountain.jpeg", "Image Captioning", "", '', ''],
     ["./images/rose.webp", "Text Retrieval", "lily,rose,peoney,tulip", '', 'Format: s,s,s'],
-    ["./images/region_retrieval.png", "Image/Region Retrieval (Only Support Exampled 80 images)", "The tangerine on the plate.", '', 'Please describe the object in a detailed way.'],
     ["./images/landscape.jpg", "Referring Captioning (Beta)", "cloud", '', 'Please fill in a noun/noun phrase. (may start with a/the)'],
     ["./images/apples.jpg", "Referring Editing", "a green apple", 'a pear', 'x-decoder + ldm (inference takes ~20s),  use inpainting_text "clean and empty scene" for image inpainting'],
     ],

             return referring_captioning([model_last, model_cap], image, *args, **kwargs)
         elif task == 'Text Retrieval':
             return text_retrieval(model_cap, image, *args, **kwargs)
+        elif task == 'Image/Region Retrieval':
             return region_retrieval([model_cap, model_last], image, *args, **kwargs)
 '''
 description = "<p style='text-align: center'> <a href='' target='_blank'>Project Page</a> | <a href='' target='_blank'>Paper</a> | <a href='https://github.com/microsoft/X-Decoder' target='_blank'>Github Repo</a> | <a href='' target='_blank'>Video</a> </p>"
 article = "The Demo is Run on X-Decoder (Focal-T)."
+inputs = [gr.inputs.Image(type='pil'), gr.inputs.Radio(choices=["Referring Segmentation", 'Open Vocabulary Semantic Segmentation','Open Vocabulary Instance Segmentation', "Open Vocabulary Panoptic Segmentation", "Image Captioning", "Text Retrieval", "Image/Region Retrieval", "Referring Captioning (Beta)", "Referring Editing"], type="value", default="OpenVocab Semantic Segmentation", label="Task"), gr.Textbox(label="xdecoder_text"), gr.Textbox(label="inpainting_text"), gr.Textbox(label="task_description")]
 gr.Interface(
     fn=inference,
     inputs=inputs,
         gr.Textbox(label="text restuls"),
         gr.outputs.Image(
         type="pil",
+        label="editing results"),
     ],
     examples=[
     ["./images/fruit.jpg", "Referring Segmentation", "The larger watermelon.,The front white flower.,White tea pot.,Flower bunch.,white vase.,The peach on the left.,The brown knife.", '', 'Format: s,s,s'],
     ["./images/owls.jpeg", "Open Vocabulary Instance Segmentation", "owl", '', 'Format: y,y,y'],
     ["./images/mountain.jpeg", "Image Captioning", "", '', ''],
     ["./images/rose.webp", "Text Retrieval", "lily,rose,peoney,tulip", '', 'Format: s,s,s'],
+    ["./images/region_retrieval.png", "Image/Region Retrieval", "The tangerine on the plate.", '', 'Please describe the object in a detailed way (80 images in the pool).'],
     ["./images/landscape.jpg", "Referring Captioning (Beta)", "cloud", '', 'Please fill in a noun/noun phrase. (may start with a/the)'],
     ["./images/apples.jpg", "Referring Editing", "a green apple", 'a pear', 'x-decoder + ldm (inference takes ~20s),  use inpainting_text "clean and empty scene" for image inpainting'],
     ],