Update src/populate.py
Browse files- src/populate.py +8 -7
src/populate.py
CHANGED
@@ -10,18 +10,19 @@ from src.leaderboard.read_evals import get_raw_eval_results
|
|
10 |
|
11 |
def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchmark_cols: list) -> pd.DataFrame:
|
12 |
"""Creates a dataframe from all the individual experiment results"""
|
13 |
-
|
14 |
-
|
15 |
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
|
20 |
-
|
21 |
import os
|
22 |
print(os.getcwd()) # 获取并打印当前工作目录
|
23 |
|
24 |
-
df = pd.read_csv('model_performance.csv')#
|
|
|
25 |
return df
|
26 |
|
27 |
|
|
|
10 |
|
11 |
def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchmark_cols: list) -> pd.DataFrame:
|
12 |
"""Creates a dataframe from all the individual experiment results"""
|
13 |
+
raw_data = get_raw_eval_results(results_path, requests_path)
|
14 |
+
all_data_json = [v.to_dict() for v in raw_data]
|
15 |
|
16 |
+
df = pd.DataFrame.from_records(all_data_json)
|
17 |
+
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
18 |
+
df = df[cols].round(decimals=2)
|
19 |
|
20 |
+
# filter out if any of the benchmarks have not been produced
|
21 |
import os
|
22 |
print(os.getcwd()) # 获取并打印当前工作目录
|
23 |
|
24 |
+
df = df[has_no_nan_values(df, benchmark_cols)] #pd.read_csv('model_performance.csv')#
|
25 |
+
print(df)
|
26 |
return df
|
27 |
|
28 |
|