LiveBench / src /populate.py
pufanyi's picture
Refactor load_dataset to include split parameter in populate.py
95e674a
raw
history blame
744 Bytes
import json
import os
import pandas as pd
from src.display.formatting import has_no_nan_values, make_clickable_model
from src.display.utils import AutoEvalColumn, EvalQueueColumn
from datasets import load_dataset, get_dataset_config_names
def get_leaderboard_df(results_repo):
subsets = get_dataset_config_names(results_repo)
subset_dfs = {}
for subset in subsets:
subset_data = load_dataset(results_repo, subset, split="test")
subset_df = subset_data.to_pandas()
subset_df = subset_df.sort_values(by="Total", ascending=False)
subset_df = subset_df.round(2) # Round all numeric columns to two decimal places
print(subset_df)
subset_dfs[subset] = subset_df
return subset_dfs