Spaces:
Running
Running
import gradio as gr | |
import src.dependency # noqa | |
from src.assets import custom_css | |
# from src.attention import create_attn_plots | |
from src.content import ABOUT, CITATION_BUTTON, CITATION_BUTTON_LABEL, LOGO, LOGO2, TITLE | |
from src.hardware import load_hardware_configs | |
from src.leaderboard import create_leaderboard_table | |
from src.llm_perf import get_llm_perf_df | |
from src.panel import ( | |
create_control_callback, | |
create_control_panel, | |
create_select_callback, | |
) | |
configs = load_hardware_configs("hardware.yaml") | |
demo = gr.Blocks( | |
css=custom_css, | |
theme=gr.themes.Default(primary_hue="indigo", secondary_hue="indigo"), | |
) | |
with demo: | |
with gr.Row(): | |
gr.HTML(LOGO, elem_classes="logo") | |
gr.HTML(LOGO2, elem_classes="logo2") | |
gr.HTML(TITLE, elem_classes="title") | |
####################### HARDWARE TABS ####################### | |
with gr.Tabs(elem_classes="tabs"): | |
for id, config in enumerate(configs): | |
with gr.TabItem("Leaderboard", id=id): | |
####################### HARDWARE DETAILS ####################### | |
if config.detail: | |
gr.Markdown(config.detail, elem_classes="descriptive-text") | |
######################## CONTROL PANEL ####################### | |
# ( | |
# filter_button, | |
# machine_value, | |
# backends_value, | |
# hardware_type_value, | |
# memory_slider, | |
# quantization_checkboxes, | |
# ) = create_control_panel( | |
# machine=config.machine, | |
# backends=config.backends, | |
# hardware_provider=config.hardware_provider, | |
# hardware_type=config.hardware_type, | |
# ) | |
machine_value = gr.State(value=config.machine) | |
backends_value = gr.State(value=config.backends) | |
hardware_type_value = gr.State(value=config.hardware_type) | |
####################### HARDWARE SUBTABS ####################### | |
with gr.Tabs(elem_classes="subtabs"): | |
open_llm_perf_df = get_llm_perf_df( | |
machine=config.machine, | |
backends=config.backends, | |
hardware_type=config.hardware_type, | |
) | |
####################### LEADERBOARD TAB ####################### | |
with gr.TabItem("Raspberry Pi 5 - Cortex A76", id=0): | |
search_bar, columns_checkboxes, leaderboard_table = ( | |
create_leaderboard_table(open_llm_perf_df) | |
) | |
###################### ATTENTIONS SPEEDUP TAB ####################### | |
# with gr.TabItem("Attention π", id=2): | |
# attn_prefill_plot, attn_decode_plot = create_attn_plots( | |
# open_llm_perf_df | |
# ) | |
# ####################### KERNELS SPEEDUP TAB ####################### | |
# with gr.TabItem("Kernels π", id=4): | |
# quant_krnl_prefill_plot, quant_krnl_decode_plot = ( | |
# create_quant_krnl_plots(llm_perf_df) | |
# ) | |
####################### CONTROL CALLBACK ####################### | |
# create_control_callback( | |
# filter_button, | |
# # inputs | |
# machine_value, | |
# backends_value, | |
# hardware_type_value, | |
# memory_slider, | |
# quantization_checkboxes, | |
# # interactive | |
# columns_checkboxes, | |
# search_bar, | |
# # outputs | |
# leaderboard_table, | |
# # attn_prefill_plot, | |
# # attn_decode_plot, | |
# # quant_krnl_prefill_plot, | |
# # quant_krnl_decode_plot, | |
# ) | |
create_select_callback( | |
# inputs | |
machine_value, | |
backends_value, | |
hardware_type_value, | |
# interactive | |
columns_checkboxes, | |
search_bar, | |
# outputs | |
leaderboard_table, | |
) | |
####################### ABOUT TAB ####################### | |
with gr.TabItem("About π", id=len(configs)): | |
gr.Markdown(ABOUT, elem_classes="descriptive-text") | |
####################### CITATION | |
with gr.Row(): | |
with gr.Accordion("π Citation", open=False): | |
citation_button = gr.Textbox( | |
value=CITATION_BUTTON, | |
label=CITATION_BUTTON_LABEL, | |
elem_id="citation-button", | |
show_copy_button=True, | |
lines=7 | |
) | |
if __name__ == "__main__": | |
# Launch demo | |
demo.queue().launch() | |