import gradio as gr
from df.PaperCentral import PaperCentral
from gradio_calendar import Calendar
from datetime import datetime, timedelta
from typing import Union, List, Optional, Tuple
from author_leaderboard_tab import author_leaderboard_tab
from pr_paper_central_tab import pr_paper_central_tab
from huggingface_hub import whoami
import json
import requests
from bs4 import BeautifulSoup
from author_leaderboard_contrib_tab import author_resource_leaderboard_tab
from paper_chat_tab import paper_chat_tab
from zoneinfo import ZoneInfo # Available in Python 3.9 and later
# Initialize the PaperCentral class instance
paper_central_df = PaperCentral()
def logging_flow(oauth_token: Optional[gr.OAuthToken]):
if oauth_token is None:
# User is not logged in
visibility_update = gr.update(visible=True)
user_info_update = gr.update(value="", label="User")
return visibility_update, user_info_update
try:
# Attempt to get user information
user_info = whoami(oauth_token.token)
visibility_update = gr.update(visible=False)
except requests.exceptions.HTTPError as e:
# If there's an error (e.g., token is invalid), treat as not logged in
visibility_update = gr.update(visible=True)
user_info_update = gr.update(value="", label="User")
return visibility_update, user_info_update
# Prepare user information for display
avatar_url = user_info.get("avatarUrl", "")
name = user_info.get("name", "")
avatar_html = f'''
{name}
Head to "Edit papers" tab to modify your paper!
'''
user_info_update = gr.update(value=avatar_html, label="User")
return visibility_update, user_info_update
# Create the Gradio Blocks app with custom CSS
with gr.Blocks(css_paths="style.css") as demo:
gr.Markdown("# Paper Central")
with gr.Row():
with gr.Column(scale=1):
login_button = gr.LoginButton(value="Add or edit your papers")
user_info_md = gr.HTML()
with gr.Column(scale=1):
with gr.Accordion(label="⭐Release notes", open=False):
gr.Markdown("""
- **November 21, 2024** – Neurips D&B 2024 proceedings added.
- **November 20, 2024** – Neurips 2024 proceedings added.
- **November 15, 2024** – EMNLP 2024 proceedings added.
- **October 24, 2024** – CoRL 2024 proceedings added.
- **October 20, 2024** – You can now add or edit papers.
- **October 19, 2024** – Papers with github now have github stars.
- **October 16, 2024** – Added functionality to filter papers by date ranges.
- **October 11, 2024** – Introduced leaderboards feature.
- **October 8, 2024** – MICCAI 2024 proceedings added.
- **October 7, 2024** – COLM 2024 proceedings added.
- **October 4, 2024** – Added functionality to filter papers by title.
""")
gr.Button(value="Use paper-central in datasets",
icon="https://huggingface.co/front/assets/huggingface_logo-noborder.svg",
size="sm",
link="https://huggingface.co/datasets/huggingface/paper-central-data")
with gr.Tabs() as tabs:
with gr.Tab("Paper-central", id="tab-paper-central"):
# Create a row for navigation buttons and calendar
with gr.Row():
with gr.Column(scale=1):
# Define the 'Next Day' and 'Previous Day' buttons
next_day_btn = gr.Button("Next Day")
prev_day_btn = gr.Button("Previous Day")
with gr.Column(scale=4):
# Define the calendar component for date selection
calendar = Calendar(
type="datetime",
label="Select a date",
info="Click the calendar icon to bring up the calendar.",
value=datetime.now(ZoneInfo('America/Los_Angeles')).strftime('%Y-%m-%d')
# Default to today's date in PST
)
# Add Radio buttons for date ranges
date_range_radio = gr.Radio(
label="Date Range",
choices=["This week", "This month", "This year", "All time"],
value=None,
)
# Create a row for Hugging Face options and Conference options
with gr.Row():
with gr.Column():
# Define the checkbox group for Hugging Face options
cat_options = gr.CheckboxGroup(
label="Category",
choices=[
'(ALL)',
'cs.*',
'eess.*',
'econ.*',
'math.*',
'astro-ph.*',
'cond-mat.*',
'gr-qc',
'hep-ex',
'hep-lat',
'hep-ph',
'hep-th',
'math-ph',
'nlin.*',
'nucl-ex',
'nucl-th',
'physics.*',
'quant-ph',
'q-bio.*',
'q-fin.*',
'stat.*',
],
value=["(ALL)"]
)
hf_options = gr.CheckboxGroup(
label="Hugging Face options",
choices=["🤗 artifacts", "datasets", "models", "spaces", "github", "project page"],
value=[],
elem_id="hf_options"
)
with gr.Column():
# Define the checkbox group for Conference options
conference_options = gr.CheckboxGroup(
label="Conference options",
choices=["ALL"] + PaperCentral.CONFERENCES
)
with gr.Row():
# Define a Textbox for author search
author_search = gr.Textbox(
label="Search Authors",
placeholder="Enter author name",
)
title_search = gr.Textbox(
label="Search Title",
placeholder="Enter keywords",
)
# Define the Dataframe component to display paper data
# List of columns in your DataFrame
columns = paper_central_df.COLUMNS_START_PAPER_PAGE
paper_central_component = gr.Dataframe(
label="Paper Data",
value=paper_central_df.df_prettified[columns],
datatype=[
paper_central_df.DATATYPES[column]
for column in columns
],
row_count=(0, "dynamic"),
interactive=False,
max_height=1000,
elem_id="table",
wrap=True,
)
with gr.Tab("Edit papers", id="tab-pr"):
pr_paper_central_tab(paper_central_df.df_raw)
with gr.Tab("Leaderboards", id="tab-leaderboards"):
with gr.Tab("Authors"):
author_leaderboard_tab()
with gr.Tab("Contributors"):
author_resource_leaderboard_tab()
with gr.Tab("Chat With Paper", id="tab-chat-with-paper", visible=False) as tab_chat_paper:
gr.Markdown("## Chat with Paper")
arxiv_id = gr.State(value=None)
paper_from = gr.State(value=None)
paper_chat_tab(arxiv_id, paper_from)
# chat with paper
def get_selected(evt: gr.SelectData, dataframe_origin):
paper_id = gr.update(value=None)
paper_from = gr.update(value=None)
tab_chat_paper = gr.update(visible=False)
selected_tab = gr.Tabs()
try:
# Parse the HTML content
soup = BeautifulSoup(evt.value, "html.parser")
# Find all tags
a_tags = soup.find_all('a')
for a_tag in a_tags:
# Check if 'action_id' attribute exists and equals 'chat-with-paper'
if a_tag.get('action_id') == 'chat-with-paper':
paper_id = a_tag.get("paper_id")
paper_from = a_tag.get("paper_from")
tab_chat_paper = gr.update(visible=True)
selected_tab = gr.Tabs(selected="tab-chat-with-paper")
except Exception as e:
print("The content is not valid HTML or another error occurred:", str(e))
pass
return paper_id, paper_from, tab_chat_paper, selected_tab
paper_central_component.select(get_selected, inputs=[paper_central_component],
outputs=[arxiv_id, paper_from, tab_chat_paper, tabs])
# Define function to move to the next day
def go_to_next_day(
date: Union[str, datetime],
cat_options_list: List[str],
hf_options_list: List[str],
conference_options_list: List[str],
author_search_input: str,
title_search_input: str,
date_range_option: Optional[str],
) -> tuple:
"""
Moves the selected date to the next day and updates the data.
Returns:
tuple: The new date as a string and the updated Dataframe component.
"""
date_range_update = gr.update(value=None)
# Ensure the date is in string format
if isinstance(date, datetime):
date_str = date.strftime('%Y-%m-%d')
else:
date_str = date
# Parse the date string and add one day
new_date = datetime.strptime(date_str, '%Y-%m-%d') + timedelta(days=1)
new_date_str = new_date.strftime('%Y-%m-%d')
# Update the Dataframe
updated_data = paper_central_df.filter(
selected_date=new_date_str,
cat_options=cat_options_list,
hf_options=hf_options_list,
conference_options=conference_options_list,
author_search_input=author_search_input,
title_search_input=title_search_input,
date_range_option=date_range_option,
)
# Return the new date and updated Dataframe
return new_date_str, updated_data, date_range_update
# Define function to move to the previous day
def go_to_previous_day(
date: Union[str, datetime],
cat_options_list: List[str],
hf_options_list: List[str],
conference_options_list: List[str],
author_search_input: str,
title_search_input: str,
date_range_option: Optional[str],
) -> tuple:
"""
Moves the selected date to the previous day and updates the data.
Returns:
tuple: The new date as a string and the updated Dataframe component.
"""
# If date_range_option is selected, do nothing
date_range_update = gr.update(value=None)
# Ensure the date is in string format
if isinstance(date, datetime):
date_str = date.strftime('%Y-%m-%d')
else:
date_str = date
# Parse the date string and subtract one day
new_date = datetime.strptime(date_str, '%Y-%m-%d') - timedelta(days=1)
new_date_str = new_date.strftime('%Y-%m-%d')
# Update the Dataframe
updated_data = paper_central_df.filter(
selected_date=new_date_str,
cat_options=cat_options_list,
hf_options=hf_options_list,
conference_options=conference_options_list,
author_search_input=author_search_input,
title_search_input=title_search_input,
date_range_option=date_range_option,
)
# Return the new date and updated Dataframe
return new_date_str, updated_data, date_range_update
# Define function to update data when date or options change
def update_data(
date: Union[str, datetime],
cat_options_list: List[str],
hf_options_list: List[str],
conference_options_list: List[str],
author_search_input: str,
title_search_input: str,
date_range_option: Optional[str],
):
"""
Updates the data displayed in the Dataframe based on the selected date and options.
"""
return paper_central_df.filter(
selected_date=date,
cat_options=cat_options_list,
hf_options=hf_options_list,
conference_options=conference_options_list,
author_search_input=author_search_input,
title_search_input=title_search_input,
date_range_option=date_range_option,
)
# Function to handle conference options change
def on_conference_options_change(
date: Union[str, datetime],
cat_options_list: List[str],
hf_options_list: List[str],
conference_options_list: List[str],
author_search_input: str,
title_search_input: str,
date_range_option: Optional[str],
):
cat_options_update = gr.update()
paper_central_component_update = gr.update()
visible = True
# Some conference options are selected
# Update cat_options to empty list
if conference_options_list:
cat_options_update = gr.update(value=[])
paper_central_component_update = update_data(
date,
[],
hf_options_list,
conference_options_list,
author_search_input,
title_search_input,
None,
)
visible = False
calendar_update = gr.update(visible=visible)
next_day_btn_update = gr.update(visible=visible)
prev_day_btn_update = gr.update(visible=visible)
date_range_option_update = gr.update(visible=visible, value=None)
return paper_central_component_update, cat_options_update, calendar_update, next_day_btn_update, prev_day_btn_update, date_range_option_update
# Function to handle category options change
def on_cat_options_change(
date: Union[str, datetime],
cat_options_list: List[str],
hf_options_list: List[str],
conference_options_list: List[str],
author_search_input: str,
title_search_input: str,
date_range_option: Optional[str],
):
conference_options_update = gr.update()
paper_central_component_update = gr.update()
visible = False
# Some category options are selected
# Update conference_options to empty list
if cat_options_list:
conference_options_update = gr.update(value=[])
paper_central_component_update = update_data(
date,
cat_options_list,
hf_options_list,
[],
author_search_input,
title_search_input,
date_range_option,
)
visible = True
calendar_update = gr.update(visible=visible)
next_day_btn_update = gr.update(visible=visible)
prev_day_btn_update = gr.update(visible=visible)
date_range_option_update = gr.update(visible=visible)
return paper_central_component_update, conference_options_update, calendar_update, next_day_btn_update, prev_day_btn_update, date_range_option_update
# Include date_range_radio in the inputs
inputs = [
calendar,
cat_options,
hf_options,
conference_options,
author_search,
title_search,
date_range_radio,
]
# Set up the event listener for the author search
author_search.submit(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name=False
)
title_search.submit(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name=False
)
# Set up the event listener for the 'Next Day' button
next_day_btn.click(
fn=go_to_next_day,
inputs=inputs,
outputs=[calendar, paper_central_component, date_range_radio],
api_name=False
)
# Set up the event listener for the 'Previous Day' button
prev_day_btn.click(
fn=go_to_previous_day,
inputs=inputs,
outputs=[calendar, paper_central_component, date_range_radio],
api_name=False
)
# Set up the event listener for the calendar date change
calendar.change(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name=False
)
# Set up the event listener for the Hugging Face options change
hf_options.change(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name=False
)
# Event chaining for conference options change
conference_options.change(
fn=on_conference_options_change,
inputs=inputs,
outputs=[paper_central_component, cat_options, calendar, next_day_btn, prev_day_btn, date_range_radio],
api_name=False
)
# Event chaining for category options change
cat_options.change(
fn=on_cat_options_change,
inputs=inputs,
outputs=[paper_central_component, conference_options, calendar, next_day_btn, prev_day_btn, date_range_radio],
api_name=False
)
# Set up the event listener for the date range radio button change
date_range_radio.change(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name=False
)
# Load the initial data when the app starts
request = gr.Request()
def echo(request: gr.Request):
"""
Echoes the input text and prints request details.
Args:
text (str): The input text from the user.
request (gr.Request): The HTTP request object.
Returns:
str: The echoed text.
"""
calendar = gr.update(datetime.today().strftime('%Y-%m-%d'))
date_range = gr.update(value=None)
conferences = gr.update(value=[])
hf_options = gr.update(value=[])
selected_tab = gr.Tabs()
paper_id = gr.update(value=None)
tab_chat_paper = gr.update(visible=False)
if request:
# print("Request headers dictionary:", dict(request.headers))
# print("IP address:", request.client.host)
# print("Query parameters:", dict(request.query_params))
# print("Session hash:", request.session_hash)
if 'date' in request.query_params:
calendar = gr.update(value=request.query_params['date'])
if 'date_range' in request.query_params:
date_range = gr.update(value=request.query_params['date_range'])
if 'conferences' in request.query_params:
conferences = request.query_params['conferences']
try:
conferences = [value for value in conferences.split(',')]
except ValueError:
conferences = []
conferences = gr.update(value=conferences)
if "hf_options" in request.query_params:
hf_options = request.query_params['hf_options']
try:
hf_options = [value for value in hf_options.split(',')]
except ValueError:
hf_options = []
hf_options = gr.update(value=hf_options)
if "tab" in request.query_params:
tab = request.query_params['tab']
if tab == "tab-leaderboards":
selected_tab = gr.Tabs(selected="tab-leaderboards")
elif tab == "tab-chat-with-paper":
selected_tab = gr.Tabs(selected="tab-chat-with-paper")
if "paper_id" in request.query_params:
paper_id = request.query_params['paper_id']
tab_chat_paper = gr.update(visible=True)
return calendar, date_range, conferences, hf_options, selected_tab, paper_id, tab_chat_paper
demo.load(
fn=update_data,
inputs=inputs,
outputs=paper_central_component,
api_name="update_data",
).then(
fn=echo,
outputs=[calendar, date_range_radio, conference_options, hf_options, tabs, arxiv_id, tab_chat_paper],
api_name=False,
).then(
# New then to handle LoginButton and HTML components
fn=logging_flow,
outputs=[login_button, user_info_md],
api_name=False,
)
# Define the main function to launch the app
def main():
"""
Launches the Gradio app.
"""
demo.launch(ssr_mode=False, share=True)
# Run the main function when the script is executed
if __name__ == "__main__":
main()