Spaces:
Sleeping
Sleeping
lordspline
committed on
Upload 2 files
Browse files
- arena_ui.py +35 -0
- ratings.json +1 -0
arena_ui.py
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import gradio as gr
|
2 |
+
import os
|
3 |
+
import pandas as pd
|
4 |
+
import json
|
5 |
+
|
6 |
+
# Load the precomputed ratings. The context manager closes the file handle as
# soon as parsing finishes instead of leaving it open for the process lifetime.
with open("ratings.json", encoding="utf-8") as ratings_file:
    ratings = json.load(ratings_file)

# Each entry is a [name, elo] pair, so the frame is built in a single call.
# (This replaces an earlier row-by-row ``df.append`` loop; ``DataFrame.append``
# is no longer available in pandas >= 2.0.)
df = pd.DataFrame(ratings, columns=["Name", "Arena Elo"])

# Rank is the 1-based row position, i.e. it follows the order of the file.
# NOTE(review): assumes ratings.json is already sorted by Elo, descending --
# confirm against whatever produces the file.
df["Rank"] = df.index + 1

# Show the rank as the first column.
df = df[["Rank", "Name", "Arena Elo"]]
|
16 |
+
|
17 |
+
|
18 |
+
# Assemble the leaderboard page; the custom CSS hides the page's footer element.
with gr.Blocks(css="footer {visibility: hidden}") as demo:
    # Page heading.
    md = gr.Markdown("## Internal Leaderboard\n")

    # Caveats displayed above the table.
    md2 = gr.Markdown(
        "Notes:\n"
        "- This is very unreliable as of now.\n"
        "- The agents have been implemented haphazardly and only evaluated on 10 tasks.\n"
    )

    # The ratings table sits in a row of its own.
    with gr.Row():
        table = gr.Dataframe(df)

# Queue and launch the app only when run as a script, not on import.
if __name__ == "__main__":
    demo.queue()
    demo.launch(debug=True)
|
ratings.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
[["vision_agent_reranking", 1013.6523617512925], ["standard_agent", 1003.3564093107665], ["standard_agent_reranking", 997.2581907453138], ["vision_agent", 985.7330381926273]]
|