File size: 1,125 Bytes
accbb3c
127eb07
accbb3c
127eb07
accbb3c
 
783650c
3daa867
 
 
9730cbb
 
accbb3c
 
 
c199bab
6b44c63
3daa867
accbb3c
 
c199bab
 
 
 
accbb3c
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29

import gradio as gr

from demo import query_image

# HTML/Markdown blurb passed to gr.Interface(description=...) below.
# The "\n\n" escape is intentional: it inserts a blank line in the rendered
# text ahead of the usage sentence.
description = """
Github link: <a href="https://github.com/ngthanhtin/owlvit_segment_anything">Link</a>
Gradio demo for combining <a href="https://github.com/facebookresearch/segment-anything">Segment-Anything (SAM)</a> with
<a href="https://huggingface.co/docs/transformers/main/en/model_doc/owlvit">OWL-ViT</a>.
\n\nYou can use OWL-ViT to query boxes with text descriptions of any object, then SAM will segment anything in the boxes.

Note: In this demo, I only get the one box per class to demonstrate, you can modify the code to get multiple boxes beyond a threshold.
"""
# Pre-filled example rows shown in the UI; each row supplies one value per
# input component: [image path, text prompt]. The prompts here are
# comma-separated object names.
_example_rows = [
    ["./demo_images/cats.png", "cats,ears"],
    ["./demo_images/demo1.jpg", "bear,soil,sea"],
    ["./demo_images/demo2.jpg", "dog,ear,leg,eyes,tail"],
    ["./demo_images/tanager.jpg", "wing,eyes,back,legs,tail"],
]

# Wrap query_image in a Gradio Interface: one image input plus one text
# input, and two image outputs.
demo = gr.Interface(
    fn=query_image,
    inputs=[gr.Image(), "text"],
    outputs=["image", "image"],
    title="Segment Anything (SAM) with OWL-ViT",
    description=description,
    examples=_example_rows,
)

# Start the web server only when this file is executed as a script, so that
# importing the module (e.g. to reuse `demo`) does not launch a server.
if __name__ == "__main__":
    # server_name="0.0.0.0" binds to all network interfaces so the app is
    # reachable from outside the local host/container; debug=True keeps the
    # main thread blocked while the server runs.
    demo.launch(server_name="0.0.0.0", debug=True)