Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -7,9 +7,9 @@ from PIL import Image
|
|
7 |
import subprocess
|
8 |
subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
|
9 |
|
10 |
-
model = AutoModelForCausalLM.from_pretrained('
|
11 |
|
12 |
-
processor = AutoProcessor.from_pretrained('
|
13 |
|
14 |
|
15 |
TITLE = "# [Florence-2 SD3 Long Captioner](https://huggingface.co/gokaygokay/Florence-2-SD3-Captioner/)"
|
@@ -47,7 +47,7 @@ def modify_caption(caption: str) -> str:
|
|
47 |
def run_example(image):
|
48 |
image = Image.fromarray(image)
|
49 |
task_prompt = "<DESCRIPTION>"
|
50 |
-
prompt = task_prompt + "As an AI image annotation expert, please provide accurate annotations for the image to enhance the T5 model understanding of the content. Accurately describe images and images in the form of natural language. Your description should include key elements such as the actions, clothing, hairstyle, facial expressions, environment, dressing style, etc. of the characters in the image, as well as background content and any other important information. If the image has a distinct special style or filter, it needs to be described, otherwise it is not necessary. Your description should be accurate and accurate, only describing the actual content of the image, without describing abstract feelings such as atmosphere or quality, and should not exceed
|
51 |
|
52 |
# Ensure the image is in RGB mode
|
53 |
if image.mode != "RGB":
|
|
|
7 |
import subprocess
|
8 |
subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
|
9 |
|
10 |
+
model = AutoModelForCausalLM.from_pretrained('microsoft/Florence-2-large', trust_remote_code=True).to("cuda").eval()
|
11 |
|
12 |
+
processor = AutoProcessor.from_pretrained('microsoft/Florence-2-large', trust_remote_code=True)
|
13 |
|
14 |
|
15 |
TITLE = "# [Florence-2 SD3 Long Captioner](https://huggingface.co/gokaygokay/Florence-2-SD3-Captioner/)"
|
|
|
47 |
def run_example(image):
|
48 |
image = Image.fromarray(image)
|
49 |
task_prompt = "<DESCRIPTION>"
|
50 |
+
prompt = task_prompt + "As an AI image annotation expert, please provide accurate annotations for the image to enhance the T5 model understanding of the content. Accurately describe images and images in the form of natural language. Your description should include key elements such as the actions, clothing, hairstyle, facial expressions, environment, dressing style, etc. of the characters in the image, as well as background content and any other important information. If the image has a distinct special style or filter, it needs to be described, otherwise it is not necessary. Your description should be accurate and accurate, only describing the actual content of the image, without describing abstract feelings such as atmosphere or quality, and should not exceed five sentences. These descriptions will be used for image reconstruction, so the closer the similarity to the original image, the better the label quality. Special tags will receive a reward of $10 per image."
|
51 |
|
52 |
# Ensure the image is in RGB mode
|
53 |
if image.mode != "RGB":
|