import gradio as gr from gradio_leaderboard import Leaderboard, ColumnFilter, SelectColumns import pandas as pd from apscheduler.schedulers.background import BackgroundScheduler from huggingface_hub import snapshot_download from src.about import ( CITATION_BUTTON_LABEL, CITATION_BUTTON_TEXT, EVALUATION_QUEUE_TEXT, INTRODUCTION_TEXT, LLM_BENCHMARKS_TEXT, TITLE, ) from src.display.css_html_js import custom_css, get_window_url_params from src.display.utils import ( COLUMNS, COLS, BENCHMARK_COLS, EVAL_COLS, EVAL_TYPES, ModelType, WeightType, Precision ) from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO, TOKEN from src.populate import get_evaluation_queue_df, get_leaderboard_df from src.submission.submit import add_new_eval def restart_space(): API.restart_space(repo_id=REPO_ID) ### Space initialization try: print(EVAL_REQUESTS_PATH) snapshot_download( repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30, token=TOKEN ) except Exception: restart_space() try: print(EVAL_RESULTS_PATH) snapshot_download( repo_id=RESULTS_REPO, local_dir=EVAL_RESULTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30, token=TOKEN ) except Exception: restart_space() # Load the leaderboard DataFrame LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, BENCHMARK_COLS) print("LEADERBOARD_DF Shape:", LEADERBOARD_DF.shape) # Debug print("LEADERBOARD_DF Columns:", LEADERBOARD_DF.columns.tolist()) # Debug # Load the evaluation queue DataFrames finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df = get_evaluation_queue_df(EVAL_REQUESTS_PATH, EVAL_COLS) demo = gr.Blocks(css=custom_css + """ /* Column selection improvements */ .select-columns-container label { display: inline-block; width: 24%; font-size: 0.9em; padding: 2px 5px; margin: 2px 0; vertical-align: top; } /* Make column section more compact */ .select-columns-section { max-height: 300px; overflow-y: auto; padding: 0 !important; } /* Add category headers */ .column-category { font-weight: bold; margin-top: 10px; margin-bottom: 5px; border-bottom: 1px solid #eee; padding-bottom: 3px; } """) with demo: gr.HTML(TITLE) gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text") with gr.Tabs(elem_classes="tab-buttons") as tabs: with gr.TabItem("🏅 LLM Benchmark", elem_id="llm-benchmark-tab-table", id=0): if LEADERBOARD_DF.empty: gr.Markdown("No evaluations have been performed yet. The leaderboard is currently empty.") else: default_selection = [col.name for col in COLUMNS if col.displayed_by_default] print("Default Selection before ensuring 'model_name':", default_selection) # Debug # Ensure "model_name" is included if "model_name" not in default_selection: default_selection.insert(0, "model_name") print("Default Selection after ensuring 'model_name':", default_selection) # Debug # Add a custom accordion for better organization of column options with gr.Accordion("📊 Select Columns to Display", open=False): # Will be visually hidden and replaced with our custom layout gr.HTML("