liorgreenb committed on
Commit
ba1ec42
·
1 Parent(s): cbca473

Use dataset config as tasks

Browse files
Files changed (2) hide show
  1. app.py +11 -8
  2. paper_models.csv +5 -5
app.py CHANGED
@@ -12,11 +12,14 @@ hf_api = HfApi()
12
 
13
  models = list(hf_api.list_models(filter=benchmark_tag))
14
 
15
- print("Tagged models", models)
 
 
 
 
 
16
 
17
- MAIN_METRIC_PER_TASK = {
18
- fashion_dataset: "ROC_AUC"
19
- }
20
 
21
  def create_model_link(model_id, link=None, type='repos'):
22
 
@@ -38,9 +41,9 @@ def get_model_results(model_meta):
38
  metrics_meta = []
39
  for index in model_meta['model-index']:
40
  for result in index['results']:
41
- if result['dataset']['type'].split('/')[0] == benchmark_user:
42
  metrics_dict = {metric['name']: metric['value'] for metric in result['metrics']}
43
- metrics_meta += [dict(dataset=result['dataset']['type'], **metrics_dict)]
44
 
45
  return metrics_meta
46
 
@@ -67,10 +70,10 @@ print(df)
67
  block = gr.Blocks()
68
 
69
  with block:
70
- for group_name, group in df.groupby('dataset'):
71
  gr.Markdown(f"## Task - {group_name}")
72
 
73
- group = group.sort_values(MAIN_METRIC_PER_TASK[group_name], ascending=False)
74
  group['dataset'] = group['dataset'].apply(lambda x: create_model_link(x, type="datasets"))
75
  gr.DataFrame(
76
  group.reset_index(drop=True),
 
12
 
13
  models = list(hf_api.list_models(filter=benchmark_tag))
14
 
15
+ supported_tasks = [
16
+ 'in_catalog_retrieval_zero_shot',
17
+ 'in_catalog_open_catalog',
18
+ 'in_catalog_closed_catalog',
19
+ 'consumer-catalog_wild_zero_shot',
20
+ ]
21
 
22
+ print("Tagged models", models)
 
 
23
 
24
  def create_model_link(model_id, link=None, type='repos'):
25
 
 
41
  metrics_meta = []
42
  for index in model_meta['model-index']:
43
  for result in index['results']:
44
+ if result['dataset']['type'].split('/')[0] == benchmark_user and result['dataset']['config'] in supported_tasks:
45
  metrics_dict = {metric['name']: metric['value'] for metric in result['metrics']}
46
+ metrics_meta += [dict(dataset=result['dataset']['type'], task=result['dataset']['config'], **metrics_dict)]
47
 
48
  return metrics_meta
49
 
 
70
  block = gr.Blocks()
71
 
72
  with block:
73
+ for group_name, group in df.groupby('task'):
74
  gr.Markdown(f"## Task - {group_name}")
75
 
76
+ group = group.sort_values('ROC_AUC', ascending=False)
77
  group['dataset'] = group['dataset'].apply(lambda x: create_model_link(x, type="datasets"))
78
  gr.DataFrame(
79
  group.reset_index(drop=True),
paper_models.csv CHANGED
@@ -1,5 +1,5 @@
1
- ,dataset,model,ROC_AUC,MRR@5
2
- 0,vsd-benchmark/vsd-fashion,Beit,75.5,93.5
3
- 1,vsd-benchmark/vsd-fashion,DINO,70.4,93.3
4
- 2,vsd-benchmark/vsd-fashion,ResNext,62.7,84.5
5
- 3,vsd-benchmark/vsd-fashion,CLIP,67.8,84.8
 
1
+ ,dataset,task,model,ROC_AUC,MRR@5
2
+ 0,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,Beit,75.5,93.5
3
+ 1,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,DINO,70.4,93.3
4
+ 2,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,ResNext,62.7,84.5
5
+ 3,vsd-benchmark/vsd-fashion,in_catalog_retrieval_zero_shot,CLIP,67.8,84.8