henryL7 committed on
Commit
97950bf
·
1 Parent(s): 9767697

clean up repo

Browse files
Files changed (1) hide show
  1. src/populate.py +2 -1
src/populate.py CHANGED
@@ -6,6 +6,7 @@ import yaml
6
  from sklearn.metrics import cohen_kappa_score
7
  import numpy as np
8
  from datasets import load_dataset
 
9
 
10
  TYPES = ["str", "number", "number", "number", "number", "number"]
11
 
@@ -84,7 +85,7 @@ def load_leaderboard() -> pd.DataFrame:
84
  """Loads the leaderboard from the file system"""
85
  with open("./data/models.yaml") as fp:
86
  models = yaml.safe_load(fp)
87
- human_responses = load_dataset("salesforce/instrusum", "human_eval_pairwise")["data"]
88
  human_responses = [x for x in human_responses]
89
 
90
  predictions = {k: [] for k in ["Model", "Accuracy", "Agreement", "Self-Accuracy", "Self-Agreement"]}
 
6
  from sklearn.metrics import cohen_kappa_score
7
  import numpy as np
8
  from datasets import load_dataset
9
+ from envs import TOKEN
10
 
11
  TYPES = ["str", "number", "number", "number", "number", "number"]
12
 
 
85
  """Loads the leaderboard from the file system"""
86
  with open("./data/models.yaml") as fp:
87
  models = yaml.safe_load(fp)
88
+ human_responses = load_dataset("salesforce/instrusum", "human_eval_pairwise", token=TOKEN)["data"]
89
  human_responses = [x for x in human_responses]
90
 
91
  predictions = {k: [] for k in ["Model", "Accuracy", "Agreement", "Self-Accuracy", "Self-Agreement"]}