import torch
import streamlit as st
from transformers import pipeline, AutoTokenizer, AutoModelForQuestionAnswering
st.set_page_config(page_title="Common NLP Tasks")
st.title("Common NLP Tasks")
st.subheader("Use the menu on the left to select a NLP task to do (click on > if closed).")
expander = st.sidebar.expander('About')
expander.write("This web app allows you to perform common Natural Language Processing tasks, select a task below to get started.")
st.sidebar.header('What will you like to do?')
option = st.sidebar.radio('', ['Extractive question answering', 'Text summarization', 'Text generation', 'Sentiment analysis'])
@st.cache(show_spinner=False, allow_output_mutation=True)
def question_answerer(context, question):
tokenizer = AutoTokenizer.from_pretrained("deepset/roberta-base-squad2")
model = AutoModelForQuestionAnswering.from_pretrained("deepset/roberta-base-squad2")
inputs = tokenizer(question, context, add_special_tokens=True, return_tensors="pt")
input_ids = inputs["input_ids"].tolist()[0]
outputs = model(**inputs)
answer_start_scores = outputs.start_logits
answer_end_scores = outputs.end_logits
# Get the most likely beginning of answer with the argmax of the score
answer_start = torch.argmax(answer_start_scores)
# Get the most likely end of answer with the argmax of the score
answer_end = torch.argmax(answer_end_scores) + 1
answer = tokenizer.convert_tokens_to_string(tokenizer.convert_ids_to_tokens(input_ids[answer_start:answer_end]))
return answer
@st.cache(show_spinner=False, allow_output_mutation=True)
def summarization_model():
summarizer = pipeline("summarization")
return summarizer
@st.cache(show_spinner=False, allow_output_mutation=True)
def generation_model():
generator = pipeline("text-generation")
return generator
@st.cache(show_spinner=False, allow_output_mutation=True)
def sentiment_model():
sentiment_analysis = pipeline("sentiment-analysis")
return sentiment_analysis
if option == 'Extractive question answering':
st.markdown("
Extract answer from text
", unsafe_allow_html=True)
sample_text = "sample text"
source = st.radio("How would you like to start? Choose an option below", ["I want to input some text", "I want to upload a file"])
if source == "I want to input some text":
context = st.text_area('Use the example below or input your own text in English (between 1,000 and 10,000 characters)', value=sample_text, max_chars=10000, height=330)
question = st.text_input(label='Enter your question')
button = st.button('Get answer')
if button:
with st.spinner(text="Getting answer..."):
answer = question_answerer(context, question)
st.write(answer)
elif source == "I want to upload a file":
uploaded_file = st.file_uploader("Choose a .txt file to upload", type=["txt"])
question = st.text_input(label='Enter your question')
button = st.button('Get answer')
if button:
question_answerer = question_model()
with st.spinner(text="Getting answer..."):
answer = question_answerer(context=context, question=question)
st.write(answer["answer"])
elif option == 'Text summarization':
st.markdown("Summarize text
", unsafe_allow_html=True)
sample_text = "sample text"
source = st.radio("How would you like to start? Choose an option below", ["I want to input some text", "I want to upload a file"])
if source == "I want to input some text":
text = st.text_area('Input a text in English (between 1,000 and 10,000 characters)', value=sample_text, max_chars=10000, height=330)
button = st.button('Get summary')
if button:
summarizer = summarization_model()
with st.spinner(text="Summarizing text..."):
summary = summarizer(text, max_length=130, min_length=30)
st.write(summary)
elif source == "I want to upload a file":
uploaded_file = st.file_uploader("Choose a .txt file to upload", type=["txt"])
button = st.button('Get summary')
if button:
summarizer = summarization_model()
with st.spinner(text="Summarizing text..."):
summary = summarizer(text, max_length=130, min_length=30)
st.write(summary)
elif option == 'Text generation':
st.markdown("Generate text
", unsafe_allow_html=True)
text = st.text_input(label='Enter one line of text and let the NLP model generate the rest for you')
button = st.button('Generate text')
if button:
generator = generation_model()
with st.spinner(text="Generating text..."):
generated_text = generator(text, max_length=50)
st.write(generated_text[0]["generated_text"])
elif option == 'Sentiment analysis':
st.markdown("Classify review
", unsafe_allow_html=True)
text = st.text_input(label='Enter a sentence to get its sentiment analysis')
button = st.button('Get sentiment analysis')
if button:
sentiment_analysis = sentiment_model()
with st.spinner(text="Getting sentiment analysis..."):
sentiment = sentiment_analysis(text)
st.write(sentiment[0]["label"])