liudongqing committed
Commit 76209e3 · 1 Parent(s): d398fa0

reduce the tokens

Files changed (1): app.py +2 -2
app.py CHANGED
@@ -16,7 +16,7 @@ model_id = "unsloth/Llama-3.2-11B-Vision"
 model = AutoModelForImageTextToText.from_pretrained(
     model_id,
     torch_dtype=torch.bfloat16,
-    # device_map="auto",
+    device_map="auto",
 )
 processor = AutoProcessor.from_pretrained(model_id)

@@ -32,7 +32,7 @@ def score_it(input_img):
     prompt = "<|image|><|begin_of_text|>extract the text in this picture"
     inputs = processor(image, prompt, return_tensors="pt").to(model.device)

-    output = model.generate(**inputs, max_new_tokens=300)
+    output = model.generate(**inputs, max_new_tokens=200)
     return processor.decode(output[0])
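For context, a minimal sketch of how the changed lines read after this commit. Only the model loading call and the body of score_it come from the diff above; the imports, the image handling inside score_it, and the Gradio wiring are assumptions added for illustration, not part of the commit.

# Sketch only: model loading and score_it follow the diff; everything else is assumed.
import torch
import gradio as gr
from transformers import AutoModelForImageTextToText, AutoProcessor

model_id = "unsloth/Llama-3.2-11B-Vision"

model = AutoModelForImageTextToText.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,
    device_map="auto",  # enabled by this commit: place weights across available devices
)
processor = AutoProcessor.from_pretrained(model_id)


def score_it(input_img):
    # Assumption: input_img arrives as a PIL image from the Gradio Image component.
    image = input_img
    prompt = "<|image|><|begin_of_text|>extract the text in this picture"
    inputs = processor(image, prompt, return_tensors="pt").to(model.device)

    # This commit lowers the generation cap from 300 to 200 new tokens.
    output = model.generate(**inputs, max_new_tokens=200)
    return processor.decode(output[0])


# Hypothetical Gradio interface wiring (not shown in the diff).
demo = gr.Interface(fn=score_it, inputs=gr.Image(type="pil"), outputs="text")
demo.launch()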