Spaces:
Runtime error
Runtime error
liorgreenb
committed on
Commit
·
ba1ec42
1
Parent(s):
cbca473
Use dataset config as tasks
Browse files
- app.py +11 -8
- paper_models.csv +5 -5
app.py
CHANGED
@@ -12,11 +12,14 @@ hf_api = HfApi()
|
|
12 |
|
13 |
models = list(hf_api.list_models(filter=benchmark_tag))
|
14 |
|
15 |
-
|
|
|
|
|
|
|
|
|
|
|
16 |
|
17 |
-
|
18 |
-
fashion_dataset: "ROC_AUC"
|
19 |
-
}
|
20 |
|
21 |
def create_model_link(model_id, link=None, type='repos'):
|
22 |
|
@@ -38,9 +41,9 @@ def get_model_results(model_meta):
|
|
38 |
metrics_meta = []
|
39 |
for index in model_meta['model-index']:
|
40 |
for result in index['results']:
|
41 |
-
if result['dataset']['type'].split('/')[0] == benchmark_user:
|
42 |
metrics_dict = {metric['name']: metric['value'] for metric in result['metrics']}
|
43 |
-
metrics_meta += [dict(dataset=result['dataset']['type'], **metrics_dict)]
|
44 |
|
45 |
return metrics_meta
|
46 |
|
@@ -67,10 +70,10 @@ print(df)
|
|
67 |
block = gr.Blocks()
|
68 |
|
69 |
with block:
|
70 |
-
for group_name, group in df.groupby('
|
71 |
gr.Markdown(f"## Task - {group_name}")
|
72 |
|
73 |
-
group = group.sort_values(
|
74 |
group['dataset'] = group['dataset'].apply(lambda x: create_model_link(x, type="datasets"))
|
75 |
gr.DataFrame(
|
76 |
group.reset_index(drop=True),
|
|
|
12 |
|
13 |
models = list(hf_api.list_models(filter=benchmark_tag))
|
14 |
|
15 |
+
supported_tasks = [
|
16 |
+
'in_catalog_retrieval_zero_shot',
|
17 |
+
'in_catalog_open_catalog',
|
18 |
+
'in_catalog_closed_catalog',
|
19 |
+
'consumer-catalog_wild_zero_shot',
|
20 |
+
]
|
21 |
|
22 |
+
print("Tagged models", models)
|
|
|
|
|
23 |
|
24 |
def create_model_link(model_id, link=None, type='repos'):
|
25 |
|
|
|
41 |
metrics_meta = []
|
42 |
for index in model_meta['model-index']:
|
43 |
for result in index['results']:
|
44 |
+
if result['dataset']['type'].split('/')[0] == benchmark_user and result['dataset']['config'] in supported_tasks:
|
45 |
metrics_dict = {metric['name']: metric['value'] for metric in result['metrics']}
|
46 |
+
metrics_meta += [dict(dataset=result['dataset']['type'], task=result['dataset']['config'], **metrics_dict)]
|
47 |
|
48 |
return metrics_meta
|
49 |
|
|
|
70 |
block = gr.Blocks()
|
71 |
|
72 |
with block:
|
73 |
+
for group_name, group in df.groupby('task'):
|
74 |
gr.Markdown(f"## Task - {group_name}")
|
75 |
|
76 |
+
group = group.sort_values('ROC_AUC', ascending=False)
|
77 |
group['dataset'] = group['dataset'].apply(lambda x: create_model_link(x, type="datasets"))
|
78 |
gr.DataFrame(
|
79 |
group.reset_index(drop=True),
|
paper_models.csv
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
-
,dataset,model,ROC_AUC,MRR@5
|
2 |
-
0,vsd-benchmark/vsd-fashion,Beit,75.5,93.5
|
3 |
-
1,vsd-benchmark/vsd-fashion,DINO,70.4,93.3
|
4 |
-
2,vsd-benchmark/vsd-fashion,ResNext,62.7,84.5
|
5 |
-
3,vsd-benchmark/vsd-fashion,CLIP,67.8,84.8
|
|
|
1 |
+
,dataset,task,model,ROC_AUC,MRR@5
|
2 |
+
0,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,Beit,75.5,93.5
|
3 |
+
1,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,DINO,70.4,93.3
|
4 |
+
2,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,ResNext,62.7,84.5
|
5 |
+
3,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,CLIP,67.8,84.8
|