File size: 623 Bytes
ca7e9c6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 |
import numpy as np
import matplotlib.pyplot as plt
from transformers import T5Tokenizer, T5ForConditionalGeneration
# Machine-specific directory containing the checkpoint (named flan-t5-xl).
model_path = "/Users/pmui/models/flan-t5-xl"

# The tokenizer and the model are loaded from the same checkpoint directory.
tokenizer = T5Tokenizer.from_pretrained(model_path)

# device_map="auto" leaves weight placement across available devices to the
# library instead of pinning the model to a specific device here.
model = T5ForConditionalGeneration.from_pretrained(
    model_path,
    device_map="auto",
)
def inference(input_text: str) -> str:
    """Generate text for ``input_text`` with the module-level model.

    The prompt is tokenized, passed to ``model.generate``, and the first
    generated sequence is decoded, printed, and returned.

    Args:
        input_text: Prompt string handed to the tokenizer.

    Returns:
        The decoded first generated sequence, with special tokens skipped.
    """
    # The model is loaded with device_map="auto", so it may not live on the
    # CPU; put the input ids on the model's device before generating.
    input_ids = tokenizer(input_text, return_tensors="pt").input_ids
    input_ids = input_ids.to(model.device)

    outputs = model.generate(input_ids, max_length=200, bos_token_id=0)

    # Only the first sequence of the generated batch is decoded.
    result = tokenizer.decode(outputs[0], skip_special_tokens=True)
    print(result)
    # Return the text as well so callers can use it programmatically.
    return result
# Example prompt: run a single question through inference(), which prints
# the generated answer.
input_text = "What is the tallest building in the world?"
inference(input_text)