Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -31,6 +31,8 @@ from llava.mm_utils import (
|
|
31 |
KeywordsStoppingCriteria,
|
32 |
)
|
33 |
|
|
|
|
|
34 |
from PIL import Image
|
35 |
|
36 |
import requests
|
@@ -82,6 +84,8 @@ class InferenceDemo(object):
|
|
82 |
conv_mode = "mpt"
|
83 |
elif "qwen" in model_name.lower():
|
84 |
conv_mode = "qwen_1_5"
|
|
|
|
|
85 |
else:
|
86 |
conv_mode = "llava_v0"
|
87 |
|
@@ -289,6 +293,8 @@ with gr.Blocks(
|
|
289 |
[[Blog]](https://llava-vl.github.io/blog/2024-06-16-llava-next-interleave/) [[Code]](https://github.com/LLaVA-VL/LLaVA-NeXT) [[Model]](https://huggingface.co/lmms-lab/llava-next-interleave-7b)
|
290 |
Note: The interleave checkpoint was updated (Date: Jul. 24, 2024); the wrong checkpoint was used before.
|
291 |
"""
|
|
|
|
|
292 |
tos_markdown = """
|
293 |
### TODO!. Terms of use
|
294 |
By using this service, users are required to agree to the following terms:
|
@@ -304,7 +310,9 @@ with gr.Blocks(
|
|
304 |
"LLaVA-Interleave-7B",
|
305 |
]
|
306 |
cur_dir = os.path.dirname(os.path.abspath(__file__))
|
307 |
-
gr.Markdown(title_markdown)
|
|
|
|
|
308 |
with gr.Column():
|
309 |
with gr.Row():
|
310 |
chatbot = gr.Chatbot([], elem_id="chatbot", bubble_full_width=False)
|
@@ -327,79 +335,14 @@ with gr.Blocks(
|
|
327 |
print(cur_dir)
|
328 |
gr.Examples(
|
329 |
examples=[
|
330 |
-
# [
|
331 |
-
# {
|
332 |
-
# "text": "<image> <image> <image> Which image shows a different mood of character from the others?",
|
333 |
-
# "files": [f"{cur_dir}/examples/examples_image12.jpg", f"{cur_dir}/examples/examples_image13.jpg", f"{cur_dir}/examples/examples_image14.jpg"]
|
334 |
-
# },
|
335 |
-
# {
|
336 |
-
# "text": "Please pay attention to the movement of the object from the first image to the second image, then write a HTML code to show this movement.",
|
337 |
-
# "files": [
|
338 |
-
# f"{cur_dir}/examples/code1.jpeg",
|
339 |
-
# f"{cur_dir}/examples/code2.jpeg",
|
340 |
-
# ],
|
341 |
-
# }
|
342 |
-
# ],
|
343 |
[
|
344 |
{
|
345 |
"files": [
|
346 |
f"{cur_dir}/examples/shub.jpg",
|
347 |
-
f"{cur_dir}/examples/shuc.jpg",
|
348 |
-
f"{cur_dir}/examples/shud.jpg",
|
349 |
-
],
|
350 |
-
"text": "what is fun about the images?",
|
351 |
-
}
|
352 |
-
],
|
353 |
-
[
|
354 |
-
{
|
355 |
-
"files": [
|
356 |
-
f"{cur_dir}/examples/iphone-15-price-1024x576.jpg",
|
357 |
-
f"{cur_dir}/examples/dynamic-island-1024x576.jpg",
|
358 |
-
f"{cur_dir}/examples/iphone-15-colors-1024x576.jpg",
|
359 |
-
f"{cur_dir}/examples/Iphone-15-Usb-c-charger-1024x576.jpg",
|
360 |
-
f"{cur_dir}/examples/A-17-processors-1024x576.jpg",
|
361 |
-
],
|
362 |
-
"text": "The images are the PPT of iPhone 15 review. can you summarize the main information?",
|
363 |
-
}
|
364 |
-
],
|
365 |
-
[
|
366 |
-
{
|
367 |
-
"files": [
|
368 |
-
f"{cur_dir}/examples/fangao3.jpeg",
|
369 |
-
f"{cur_dir}/examples/fangao2.jpeg",
|
370 |
-
f"{cur_dir}/examples/fangao1.jpeg",
|
371 |
],
|
372 |
-
"text": "
|
373 |
}
|
374 |
],
|
375 |
-
[
|
376 |
-
{
|
377 |
-
"files": [
|
378 |
-
f"{cur_dir}/examples/oprah-winfrey-resume.png",
|
379 |
-
f"{cur_dir}/examples/steve-jobs-resume.jpg",
|
380 |
-
],
|
381 |
-
"text": "Hi, there are two candidates, can you provide a brief description for each of them for me?",
|
382 |
-
}
|
383 |
-
],
|
384 |
-
[
|
385 |
-
{
|
386 |
-
"files": [
|
387 |
-
f"{cur_dir}/examples/original_bench.jpeg",
|
388 |
-
f"{cur_dir}/examples/changed_bench.jpeg",
|
389 |
-
],
|
390 |
-
"text": "How to edit image1 to make it look like image2?",
|
391 |
-
}
|
392 |
-
],
|
393 |
-
[
|
394 |
-
{
|
395 |
-
"files": [
|
396 |
-
f"{cur_dir}/examples/twitter2.jpeg",
|
397 |
-
f"{cur_dir}/examples/twitter3.jpeg",
|
398 |
-
f"{cur_dir}/examples/twitter4.jpeg",
|
399 |
-
],
|
400 |
-
"text": "Please write a twitter blog post with the images.",
|
401 |
-
}
|
402 |
-
]
|
403 |
|
404 |
],
|
405 |
inputs=[chat_input],
|
@@ -427,7 +370,7 @@ if __name__ == "__main__":
|
|
427 |
argparser.add_argument("--server_name", default="0.0.0.0", type=str)
|
428 |
argparser.add_argument("--port", default="6123", type=str)
|
429 |
argparser.add_argument(
|
430 |
-
"--model_path", default="
|
431 |
)
|
432 |
# argparser.add_argument("--model-path", type=str, default="facebook/opt-350m")
|
433 |
argparser.add_argument("--model-base", type=str, default=None)
|
@@ -448,4 +391,4 @@ if __name__ == "__main__":
|
|
448 |
tokenizer, model, image_processor, context_len = load_pretrained_model(args.model_path, args.model_base, model_name, args.load_8bit, args.load_4bit)
|
449 |
model=model.to(torch.device('cuda'))
|
450 |
our_chatbot = None
|
451 |
-
demo.launch()
|
|
|
31 |
KeywordsStoppingCriteria,
|
32 |
)
|
33 |
|
34 |
+
from serve_constants_mm_llm import html_header
|
35 |
+
|
36 |
from PIL import Image
|
37 |
|
38 |
import requests
|
|
|
84 |
conv_mode = "mpt"
|
85 |
elif "qwen" in model_name.lower():
|
86 |
conv_mode = "qwen_1_5"
|
87 |
+
elif "pangea" in model_name.lower():
|
88 |
+
conv_mode = "qwen_1_5"
|
89 |
else:
|
90 |
conv_mode = "llava_v0"
|
91 |
|
|
|
293 |
[[Blog]](https://llava-vl.github.io/blog/2024-06-16-llava-next-interleave/) [[Code]](https://github.com/LLaVA-VL/LLaVA-NeXT) [[Model]](https://huggingface.co/lmms-lab/llava-next-interleave-7b)
|
294 |
Note: The interleave checkpoint was updated (Date: Jul. 24, 2024); the wrong checkpoint was used before.
|
295 |
"""
|
296 |
+
|
297 |
+
|
298 |
tos_markdown = """
|
299 |
### TODO!. Terms of use
|
300 |
By using this service, users are required to agree to the following terms:
|
|
|
310 |
"LLaVA-Interleave-7B",
|
311 |
]
|
312 |
cur_dir = os.path.dirname(os.path.abspath(__file__))
|
313 |
+
# gr.Markdown(title_markdown)
|
314 |
+
gr.HTML(html_header)
|
315 |
+
|
316 |
with gr.Column():
|
317 |
with gr.Row():
|
318 |
chatbot = gr.Chatbot([], elem_id="chatbot", bubble_full_width=False)
|
|
|
335 |
print(cur_dir)
|
336 |
gr.Examples(
|
337 |
examples=[
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
338 |
[
|
339 |
{
|
340 |
"files": [
|
341 |
f"{cur_dir}/examples/shub.jpg",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
342 |
],
|
343 |
+
"text": "what is fun about the image?",
|
344 |
}
|
345 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
346 |
|
347 |
],
|
348 |
inputs=[chat_input],
|
|
|
370 |
argparser.add_argument("--server_name", default="0.0.0.0", type=str)
|
371 |
argparser.add_argument("--port", default="6123", type=str)
|
372 |
argparser.add_argument(
|
373 |
+
"--model_path", default="neulab/Pangea-7B", type=str
|
374 |
)
|
375 |
# argparser.add_argument("--model-path", type=str, default="facebook/opt-350m")
|
376 |
argparser.add_argument("--model-base", type=str, default=None)
|
|
|
391 |
tokenizer, model, image_processor, context_len = load_pretrained_model(args.model_path, args.model_base, model_name, args.load_8bit, args.load_4bit)
|
392 |
model=model.to(torch.device('cuda'))
|
393 |
our_chatbot = None
|
394 |
+
demo.launch()
|