Update app.py
app.py CHANGED
@@ -13,11 +13,7 @@ processor = AutoProcessor.from_pretrained("HuggingFaceTB/SmolVLM_converted_4")
 
 model = Idefics3ForConditionalGeneration.from_pretrained("HuggingFaceTB/SmolVLM_converted_4",
         torch_dtype=torch.bfloat16,
-
-        ).to("cuda")
-
-BAD_WORDS_IDS = processor.tokenizer(["<image>", "<fake_token_around_image>", "<row_", "apiro", "\u2500lrow_", "row_1"], add_special_tokens=False).input_ids
-EOS_WORDS_IDS = [processor.tokenizer.eos_token_id]
+        _attn_implementation="flash_attention_2").to("cuda")
 
 @spaces.GPU
 def model_inference(
@@ -78,9 +74,9 @@ def model_inference(
 
 
 with gr.Blocks(fill_height=True) as demo:
-    gr.Markdown("##
-    gr.Markdown("Play with [
-    gr.Markdown("**Disclaimer:**
+    gr.Markdown("## SmolVLM 🐶")
+    gr.Markdown("Play with [HuggingFaceTB/SmolVLM](https://huggingface.co/HuggingFaceTB/SmolVLM) in this demo. To get started, upload an image and text or try one of the examples.")
+    gr.Markdown("**Disclaimer:** SmolVLM does not include an RLHF alignment stage, so it may not consistently follow prompts or handle complex tasks. However, this doesn't mean it is incapable of doing so. Adding a prefix to the assistant's response, such as `Let's think step by step` for a reasoning question or `<html>` for HTML code generation, can significantly improve the output in practice. You can also play with parameters such as the temperature in non-greedy mode.")
     with gr.Column():
         image_input = gr.Image(label="Upload your Image", type="pil", scale=1)
         query_input = gr.Textbox(label="Prompt")
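For reference, here is a minimal sketch of the model-loading section as it stands after the first hunk. It assumes the imports already present in app.py (torch, transformers with Idefics3 support) plus the flash-attn package and a CUDA GPU; without flash-attn installed, this attention implementation will fail to load.

import torch
from transformers import AutoProcessor, Idefics3ForConditionalGeneration

# Processor and model as loaded in the updated app.py.
processor = AutoProcessor.from_pretrained("HuggingFaceTB/SmolVLM_converted_4")
model = Idefics3ForConditionalGeneration.from_pretrained(
    "HuggingFaceTB/SmolVLM_converted_4",
    torch_dtype=torch.bfloat16,
    _attn_implementation="flash_attention_2",  # requires the flash-attn package
).to("cuda")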
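The new disclaimer suggests prefixing the assistant's response and tuning the temperature in non-greedy mode. Below is a rough sketch of how that could look, reusing the processor and model loaded in the sketch above; the image URL, the question, the prefix, and the temperature value are all illustrative and not part of the app.

from PIL import Image
import requests

# Build a chat-formatted prompt and seed the assistant's turn with a prefix.
messages = [
    {
        "role": "user",
        "content": [
            {"type": "image"},
            {"type": "text", "text": "How many animals are in the picture?"},
        ],
    }
]
prompt = processor.apply_chat_template(messages, add_generation_prompt=True)
prompt += "Let's think step by step."  # illustrative prefix for a reasoning question

# Illustrative image; any PIL image works here.
image = Image.open(requests.get("https://example.com/sample.jpg", stream=True).raw)
inputs = processor(text=prompt, images=[image], return_tensors="pt").to("cuda")

# Non-greedy decoding: enable sampling and adjust the temperature.
generated_ids = model.generate(**inputs, max_new_tokens=256, do_sample=True, temperature=0.7)
print(processor.batch_decode(generated_ids, skip_special_tokens=True)[0])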