ToluClassics committed on
Commit
4a7f4b8
·
1 Parent(s): c25e6bb

fix prod bugs

Browse files
Files changed (1) hide show
  1. app.py +9 -3
app.py CHANGED
@@ -16,7 +16,7 @@ AFRIXNLI_TRANSLATE = "afrixnli_translate"
16
 
17
  BENCHMARKS = [AFRIMMLU_DIRECT, AFRIMMLU_TRANSLATE, AFRIXNLI_DIRECT, AFRIXNLI_TRANSLATE]
18
 
19
- METRICS = ["acc_norm", "acc_norm", "acc_norm", "mc2"]
20
 
21
  LANGS = ['amh', 'eng', 'ewe', 'fra', 'hau', 'ibo', 'kin', 'lin', 'lug', 'orm', 'sna', 'sot', 'swa', 'twi', 'wol', 'xho', 'yor', 'zul']
22
 
@@ -66,11 +66,17 @@ def collect_results():
66
  pretrained_models.add(pretrained)
67
 
68
  for lang_task, perfs in results.items():
69
- task, lang = lang_task.split('_')
 
 
 
 
 
70
  assert task in BENCHMARKS
71
 
72
  if lang and task:
73
- metric = METRICS[BENCHMARKS.index(task)]
 
74
  p = round(perfs[metric] * 100, 1)
75
  performance_dict[(pretrained, lang)][task] = p
76
  return performance_dict, pretrained_models
 
16
 
17
  BENCHMARKS = [AFRIMMLU_DIRECT, AFRIMMLU_TRANSLATE, AFRIXNLI_DIRECT, AFRIXNLI_TRANSLATE]
18
 
19
+ METRICS = ["acc_norm", "acc_norm", "acc_norm"]
20
 
21
  LANGS = ['amh', 'eng', 'ewe', 'fra', 'hau', 'ibo', 'kin', 'lin', 'lug', 'orm', 'sna', 'sot', 'swa', 'twi', 'wol', 'xho', 'yor', 'zul']
22
 
 
66
  pretrained_models.add(pretrained)
67
 
68
  for lang_task, perfs in results.items():
69
+ print(lang_task)
70
+ print(perfs)
71
+ lang_task = lang_task.split('_')
72
+ lang = lang_task[-1]
73
+ task = '_'.join(lang_task[:-1])
74
+
75
  assert task in BENCHMARKS
76
 
77
  if lang and task:
78
+ print(BENCHMARKS.index(task))
79
+ metric = METRICS[BENCHMARKS.index(task)-1]
80
  p = round(perfs[metric] * 100, 1)
81
  performance_dict[(pretrained, lang)][task] = p
82
  return performance_dict, pretrained_models