weizhiwang
committed on
Commit
•
a930042
1
Parent(s):
d3464c5
Update README.md
Browse files
README.md
CHANGED
@@ -31,6 +31,7 @@ from llava.model.builder import load_pretrained_model
|
|
31 |
from llava.mm_utils import tokenizer_image_token, process_images, get_model_name_from_path
|
32 |
from PIL import Image
|
33 |
import requests
|
|
|
34 |
|
35 |
# load model and processor
|
36 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
@@ -41,7 +42,9 @@ tokenizer, model, image_processor, context_len = load_pretrained_model(weizhiwan
|
|
41 |
text = '<image>' + '\n' + "Describe the image."
|
42 |
conv.append_message(conv.roles[0], text)
|
43 |
conv.append_message(conv.roles[1], None)
|
44 |
-
url =
|
|
|
|
|
45 |
image_tensor = image_processor.preprocess(image, return_tensors='pt')['pixel_values'].half().cuda()
|
46 |
|
47 |
# autoregressively generate text
|
|
|
31 |
from llava.mm_utils import tokenizer_image_token, process_images, get_model_name_from_path
|
32 |
from PIL import Image
|
33 |
import requests
|
34 |
+
from io import BytesIO
|
35 |
|
36 |
# load model and processor
|
37 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
|
|
42 |
text = '<image>' + '\n' + "Describe the image."
|
43 |
conv.append_message(conv.roles[0], text)
|
44 |
conv.append_message(conv.roles[1], None)
|
45 |
+
url = "https://upload.wikimedia.org/wikipedia/en/thumb/7/7d/Lenna_%28test_image%29.png/330px-Lenna_%28test_image%29.png" # Lena
|
46 |
+
response = requests.get(url)
|
47 |
+
image = Image.open(BytesIO(response.content)).convert('RGB')
|
48 |
image_tensor = image_processor.preprocess(image, return_tensors='pt')['pixel_values'].half().cuda()
|
49 |
|
50 |
# autoregressively generate text
|