nicholasKluge commited on
Commit
c204c8e
1 Parent(s): 535a088

Upload results-multilingual.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. results-multilingual.json +37 -0
results-multilingual.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "arc_pt": {
4
+ "acc": 0.24444444444444444,
5
+ "acc_stderr": 0.012569442967524474,
6
+ "acc_norm": 0.28888888888888886,
7
+ "acc_norm_stderr": 0.013256439556126792
8
+ },
9
+ "hellaswag_pt": {
10
+ "acc": 0.3326470906923827,
11
+ "acc_stderr": 0.004904738424240269,
12
+ "acc_norm": 0.39408386607433094,
13
+ "acc_norm_stderr": 0.00508682495262388
14
+ },
15
+ "truthfulqa_pt": {
16
+ "mc1": 0.23604060913705585,
17
+ "mc1_stderr": 0.015137046117152837,
18
+ "mc2": 0.42762827969970946,
19
+ "mc2_stderr": 0.014911010832660198
20
+ }
21
+ },
22
+ "versions": {
23
+ "arc_pt": 0,
24
+ "hellaswag_pt": 1,
25
+ "truthfulqa_pt": 1
26
+ },
27
+ "config": {
28
+ "model": "hf-auto",
29
+ "model_args": "pretrained=/lustre/mlnvme/data/asen_hpc-mula/checkpoints-llama/slurm_job_17032104/step_400000",
30
+ "batch_size": 1,
31
+ "device": "cuda:0",
32
+ "no_cache": false,
33
+ "limit": null,
34
+ "bootstrap_iters": 100000,
35
+ "description_dict": {}
36
+ }
37
+ }