lordspline committed on
Commit
12edcf1
·
verified ·
1 Parent(s): d80c1c8

Upload 2 files

Browse files
Files changed (2) hide show
  1. arena_ui.py +35 -0
  2. ratings.json +1 -0
arena_ui.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os
3
+ import pandas as pd
4
+ import json
5
+
6
# Load the (name, Elo) pairs that back the leaderboard. A context manager is
# used so the file handle is closed deterministically instead of being left
# to the garbage collector.
with open("ratings.json", encoding="utf-8") as ratings_file:
    ratings = json.load(ratings_file)

# One row per agent. "Rank" is simply the 1-based row position, so the table
# reflects the order of entries in ratings.json.
# NOTE(review): this assumes ratings.json is already sorted by Elo, highest
# first (the checked-in file is) -- confirm with whatever writes that file.
df = pd.DataFrame(ratings, columns=["Name", "Arena Elo"])
df.insert(0, "Rank", df.index + 1)


# Page layout: a title, a short disclaimer, and the leaderboard table.
# The custom CSS hides the footer element of the rendered page.
with gr.Blocks(css="footer {visibility: hidden}") as demo:
    md = gr.Markdown("## Internal Leaderboard\n")

    md2 = gr.Markdown(
        "Notes:\n"
        "- This is very unreliable as of now.\n"
        "- The agents have been implemented haphazardly and only evaluated on 10 tasks.\n"
    )
    with gr.Row():
        table = gr.Dataframe(df)

if __name__ == "__main__":
    demo.queue()
    demo.launch(debug=True)
ratings.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [["vision_agent_reranking", 1013.6523617512925], ["standard_agent", 1003.3564093107665], ["standard_agent_reranking", 997.2581907453138], ["vision_agent", 985.7330381926273]]