File size: 2,392 Bytes
feee0c8 e3463bc feee0c8 eee75cd feee0c8 e06d0f8 41efb19 e06d0f8 feee0c8 771fad4 feee0c8 771fad4 feee0c8 e06d0f8 feee0c8 e06d0f8 feee0c8 771fad4 41efb19 feee0c8 8362905 feee0c8 e3463bc 8362905 feee0c8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 |
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
from gradio import Interface
# Define the model name (change if desired)
model_name = "facebook/bart-base"
# Load tokenizer and model
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
def generate_questions(email):
"""Generates questions based on the input email."""
# ... (existing code for encoding the email)
# Check length instead of shape
if len(inputs["input_ids"]) > 512: # Adjust maximum sequence length as needed
print("WARNING: Input sequence exceeds maximum length. Truncating.")
inputs["input_ids"] = inputs["input_ids"][:512]
# Generate questions using model
generation = model.generate(
**inputs, # Unpack the entire inputs dictionary
max_length=256, # Adjust max length as needed
# ... (other generation parameters)
)
# ... (existing code for decoding the generation)
# Decode the generated text
return tokenizer.decode(generation[0], skip_special_tokens=True)
def generate_answers(questions):
"""Generates possible answers to the input questions."""
# Encode each question with tokenizer, separated by newline
inputs = tokenizer("\n".join(questions), return_tensors="pt")
# Generate answers using model with specific prompt
generation = model.generate(
input_ids=inputs["input_ids"],
max_length=512, # Adjust max length as needed
num_beams=3, # Adjust beam search for better quality (slower)
early_stopping=True,
prompt="Here are some possible answers to the questions:\n",
)
# Decode the generated text
answers = tokenizer.decode(generation[0], skip_special_tokens=True).split("\n")
return zip(questions, answers[1:]) # Skip the first answer (prompt repetition)
def gradio_app(email):
"""Gradio interface function"""
questions = generate_questions(email)
answers = generate_answers(questions.split("\n"))
return questions, [answer for _, answer in answers]
# Gradio interface definition
# Gradio interface definition (without label)
interface = Interface(
fn=gradio_app,
inputs="textbox",
outputs=["text", "text"],
title="AI Email Assistant",
description="Enter a long email and get questions and possible answers generated by an AI model.",
elem_id="email-input"
)
# Launch the Gradio interface
interface.launch()
|