BleachNick
committed on
Commit
•
8862295
1
Parent(s):
078d257
Update README.md
Browse files
README.md
CHANGED
@@ -8,7 +8,7 @@ library_name: transformers
|
|
8 |
# Model Card for MMICL
|
9 |
|
10 |
## Temporary Demo for MMICL
|
11 |
-
[Playground for MMICL-FLANT5XXL](https://
|
12 |
It supports multi-image input as well as video input.
|
13 |
<!-- Provide a quick summary of what the model is/does. -->
|
14 |
|
@@ -53,16 +53,12 @@ import json
|
|
53 |
import transformers
|
54 |
from PIL import Image
|
55 |
import torch
|
56 |
-
from model.blip2 import Blip2Processor,Blip2ForConditionalGeneration
|
57 |
-
from model.blip2 import Blip2Config
|
58 |
model_type="instructblip"
|
59 |
model_ckpt="BleachNick/MMICL-Instructblip-T5-xxl"
|
|
|
|
|
60 |
|
61 |
-
if '
|
62 |
-
model = Blip2ForConditionalGeneration.from_pretrained(
|
63 |
-
model_ckpt,
|
64 |
-
config=config).to('cuda:0',dtype=torch.bfloat16)
|
65 |
-
elif 'instructblip' in model_type:
|
66 |
model = InstructBlipForConditionalGeneration.from_pretrained(
|
67 |
model_ckpt,
|
68 |
config=config).to('cuda:0',dtype=torch.bfloat16)
|
@@ -73,16 +69,14 @@ sp = ["图"]+[f"<image{i}>" for i in range(20)]
|
|
73 |
processor = InstructBlipProcessor.from_pretrained(
|
74 |
model_ckpt
|
75 |
)
|
76 |
-
|
77 |
-
# model_ckpt
|
78 |
-
# )
|
79 |
|
80 |
sp = sp+processor.tokenizer.additional_special_tokens[len(sp):]
|
81 |
processor.tokenizer.add_special_tokens({'additional_special_tokens':sp})
|
82 |
|
83 |
|
84 |
prompt = ['Use the image 0: <image0>图,image 1: <image1>图 and image 2: <image2>图 as a visual aid to help you calculate the equation accurately. image 0 is 2+1=3.\nimage 1 is 5+6=11.\nimage 2 is"']
|
85 |
-
|
86 |
prompt = " ".join(prompt)
|
87 |
|
88 |
inputs = processor(images=images, text=prompt, return_tensors="pt")
|
|
|
8 |
# Model Card for MMICL
|
9 |
|
10 |
## Temporary Demo for MMICL
|
11 |
+
[Playground for MMICL-FLANT5XXL](https://bcd7bc41d42486e7c8.gradio.live/)
|
12 |
It supports multi-image input as well as video input.
|
13 |
<!-- Provide a quick summary of what the model is/does. -->
|
14 |
|
|
|
53 |
import transformers
|
54 |
from PIL import Image
|
55 |
import torch
|
|
|
|
|
56 |
model_type="instructblip"
|
57 |
model_ckpt="BleachNick/MMICL-Instructblip-T5-xxl"
|
58 |
+
config_ckpt = "Salesforce/instructblip-flan-t5-xxl"
|
59 |
+
config = InstructBlipConfig.from_pretrained(config_ckpt )
|
60 |
|
61 |
+
if 'instructblip' in model_type:
|
|
|
|
|
|
|
|
|
62 |
model = InstructBlipForConditionalGeneration.from_pretrained(
|
63 |
model_ckpt,
|
64 |
config=config).to('cuda:0',dtype=torch.bfloat16)
|
|
|
69 |
processor = InstructBlipProcessor.from_pretrained(
|
70 |
model_ckpt
|
71 |
)
|
72 |
+
|
|
|
|
|
73 |
|
74 |
sp = sp+processor.tokenizer.additional_special_tokens[len(sp):]
|
75 |
processor.tokenizer.add_special_tokens({'additional_special_tokens':sp})
|
76 |
|
77 |
|
78 |
prompt = ['Use the image 0: <image0>图,image 1: <image1>图 and image 2: <image2>图 as a visual aid to help you calculate the equation accurately. image 0 is 2+1=3.\nimage 1 is 5+6=11.\nimage 2 is"']
|
79 |
+
# `images`: load your input images as a list of PIL.Image objects.
|
80 |
prompt = " ".join(prompt)
|
81 |
|
82 |
inputs = processor(images=images, text=prompt, return_tensors="pt")
|