Spaces:
Running
Running
File size: 5,026 Bytes
2fcb72a aa8b4d6 2fcb72a aa8b4d6 2fcb72a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 |
import gradio as gr
import src.dependency # noqa
from src.assets import custom_css
# from src.attention import create_attn_plots
from src.content import ABOUT, CITATION_BUTTON, CITATION_BUTTON_LABEL, LOGO, TITLE
from src.hardware import load_hardware_configs
from src.leaderboard import create_leaderboard_table
from src.llm_perf import get_llm_perf_df
from src.panel import (
create_control_callback,
create_control_panel,
create_select_callback,
)
configs = load_hardware_configs("hardware.yaml")
demo = gr.Blocks(
css=custom_css,
theme=gr.themes.Default(primary_hue="indigo", secondary_hue="indigo"),
)
with demo:
gr.HTML(LOGO, elem_classes="logo")
gr.HTML(TITLE, elem_classes="title")
####################### HARDWARE TABS #######################
with gr.Tabs(elem_classes="tabs"):
for id, config in enumerate(configs):
with gr.TabItem(config.description, id=id):
####################### HARDWARE DETAILS #######################
if config.detail:
gr.Markdown(config.detail, elem_classes="descriptive-text")
######################## CONTROL PANEL #######################
# (
# filter_button,
# machine_value,
# backends_value,
# hardware_type_value,
# memory_slider,
# quantization_checkboxes,
# ) = create_control_panel(
# machine=config.machine,
# backends=config.backends,
# hardware_provider=config.hardware_provider,
# hardware_type=config.hardware_type,
# )
machine_value = gr.State(value=config.machine)
backends_value = gr.State(value=config.backends)
hardware_type_value = gr.State(value=config.hardware_type)
####################### HARDWARE SUBTABS #######################
with gr.Tabs(elem_classes="subtabs"):
open_llm_perf_df = get_llm_perf_df(
machine=config.machine,
backends=config.backends,
hardware_type=config.hardware_type,
)
####################### LEADERBOARD TAB #######################
with gr.TabItem("Leaderboard π
", id=0):
search_bar, columns_checkboxes, leaderboard_table = (
create_leaderboard_table(open_llm_perf_df)
)
###################### ATTENTIONS SPEEDUP TAB #######################
# with gr.TabItem("Attention π", id=2):
# attn_prefill_plot, attn_decode_plot = create_attn_plots(
# open_llm_perf_df
# )
# ####################### KERNELS SPEEDUP TAB #######################
# with gr.TabItem("Kernels π", id=4):
# quant_krnl_prefill_plot, quant_krnl_decode_plot = (
# create_quant_krnl_plots(llm_perf_df)
# )
####################### CONTROL CALLBACK #######################
# create_control_callback(
# filter_button,
# # inputs
# machine_value,
# backends_value,
# hardware_type_value,
# memory_slider,
# quantization_checkboxes,
# # interactive
# columns_checkboxes,
# search_bar,
# # outputs
# leaderboard_table,
# # attn_prefill_plot,
# # attn_decode_plot,
# # quant_krnl_prefill_plot,
# # quant_krnl_decode_plot,
# )
create_select_callback(
# inputs
machine_value,
backends_value,
hardware_type_value,
# interactive
columns_checkboxes,
search_bar,
# outputs
leaderboard_table,
)
####################### ABOUT TAB #######################
with gr.TabItem("About π", id=len(configs)):
gr.Markdown(ABOUT, elem_classes="descriptive-text")
####################### CITATION
with gr.Row():
with gr.Accordion("π Citation", open=False):
citation_button = gr.Textbox(
value=CITATION_BUTTON,
label=CITATION_BUTTON_LABEL,
elem_id="citation-button",
show_copy_button=True,
)
if __name__ == "__main__":
# Launch demo
demo.queue().launch()
|