Commit
·
4a7f4b8
1
Parent(s):
c25e6bb
fix prod bugs
Browse files
app.py
CHANGED
@@ -16,7 +16,7 @@ AFRIXNLI_TRANSLATE = "afrixnli_translate"
|
|
16 |
|
17 |
BENCHMARKS = [AFRIMMLU_DIRECT, AFRIMMLU_TRANSLATE, AFRIXNLI_DIRECT, AFRIXNLI_TRANSLATE]
|
18 |
|
19 |
-
METRICS = ["acc_norm", "acc_norm", "acc_norm"
|
20 |
|
21 |
LANGS = ['amh', 'eng', 'ewe', 'fra', 'hau', 'ibo', 'kin', 'lin', 'lug', 'orm', 'sna', 'sot', 'swa', 'twi', 'wol', 'xho', 'yor', 'zul']
|
22 |
|
@@ -66,11 +66,17 @@ def collect_results():
|
|
66 |
pretrained_models.add(pretrained)
|
67 |
|
68 |
for lang_task, perfs in results.items():
|
69 |
-
|
|
|
|
|
|
|
|
|
|
|
70 |
assert task in BENCHMARKS
|
71 |
|
72 |
if lang and task:
|
73 |
-
|
|
|
74 |
p = round(perfs[metric] * 100, 1)
|
75 |
performance_dict[(pretrained, lang)][task] = p
|
76 |
return performance_dict, pretrained_models
|
|
|
16 |
|
17 |
BENCHMARKS = [AFRIMMLU_DIRECT, AFRIMMLU_TRANSLATE, AFRIXNLI_DIRECT, AFRIXNLI_TRANSLATE]
|
18 |
|
19 |
+
METRICS = ["acc_norm", "acc_norm", "acc_norm"]
|
20 |
|
21 |
LANGS = ['amh', 'eng', 'ewe', 'fra', 'hau', 'ibo', 'kin', 'lin', 'lug', 'orm', 'sna', 'sot', 'swa', 'twi', 'wol', 'xho', 'yor', 'zul']
|
22 |
|
|
|
66 |
pretrained_models.add(pretrained)
|
67 |
|
68 |
for lang_task, perfs in results.items():
|
69 |
+
print(lang_task)
|
70 |
+
print(perfs)
|
71 |
+
lang_task = lang_task.split('_')
|
72 |
+
lang = lang_task[-1]
|
73 |
+
task = '_'.join(lang_task[:-1])
|
74 |
+
|
75 |
assert task in BENCHMARKS
|
76 |
|
77 |
if lang and task:
|
78 |
+
print(BENCHMARKS.index(task))
|
79 |
+
metric = METRICS[BENCHMARKS.index(task)-1]
|
80 |
p = round(perfs[metric] * 100, 1)
|
81 |
performance_dict[(pretrained, lang)][task] = p
|
82 |
return performance_dict, pretrained_models
|