Spaces:
Running
Running
Update the formatting and links
Browse files- _header.md +1 -1
- app.py +3 -2
_header.md
CHANGED
@@ -2,4 +2,4 @@
|
|
2 |
|
3 |
# 🦓 ZebraLogic: On the Scaling Limits of LLMs for Logical Reasoning
|
4 |
<!-- [📑 FnF Paper](https://arxiv.org/abs/2305.18654) | -->
|
5 |
-
[
|
|
|
2 |
|
3 |
# 🦓 ZebraLogic: On the Scaling Limits of LLMs for Logical Reasoning
|
4 |
<!-- [📑 FnF Paper](https://arxiv.org/abs/2305.18654) | -->
|
5 |
+
[📑 Paper](https://arxiv.org/abs/2502.01100) | [💻 GitHub](https://github.com/WildEval/ZeroEval) | [🤗 Dataset](https://huggingface.co/datasets/WildEval/ZebraLogic) | Updated: **{LAST_UPDATED}**
|
app.py
CHANGED
@@ -190,7 +190,7 @@ def data_load(result_file):
|
|
190 |
main_ordered_columns = ORDERED_COLUMN_NAMES
|
191 |
# filter the data with Total Puzzles == 1000
|
192 |
|
193 |
-
click_url =
|
194 |
# read json file from the result_file
|
195 |
with open(result_file, "r") as f:
|
196 |
raw_data = json.load(f)
|
@@ -203,7 +203,8 @@ def data_load(result_file):
|
|
203 |
pass
|
204 |
original_df = pd.DataFrame(raw_data)
|
205 |
original_df = original_df[original_df["Total Puzzles"] == 1000]
|
206 |
-
|
|
|
207 |
original_df = post_processing(original_df, column_names_main, ordered_columns=main_ordered_columns, click_url=click_url, rank_column=RANKING_COLUMN)
|
208 |
print(f"original_df.columns: {original_df.columns}")
|
209 |
# print(original_df.columns)
|
|
|
190 |
main_ordered_columns = ORDERED_COLUMN_NAMES
|
191 |
# filter the data with Total Puzzles == 1000
|
192 |
|
193 |
+
click_url = False
|
194 |
# read json file from the result_file
|
195 |
with open(result_file, "r") as f:
|
196 |
raw_data = json.load(f)
|
|
|
203 |
pass
|
204 |
original_df = pd.DataFrame(raw_data)
|
205 |
original_df = original_df[original_df["Total Puzzles"] == 1000]
|
206 |
+
# let's remove some models in the list: ["o1-preview-2024-09-12-v2", "o1-mini-2024-09-12-v2", "o1-mini-2024-09-12"]
|
207 |
+
original_df = original_df[~original_df["Model"].isin(["o1-preview-2024-09-12-v2", "o1-mini-2024-09-12-v2", "o1-mini-2024-09-12"])]
|
208 |
original_df = post_processing(original_df, column_names_main, ordered_columns=main_ordered_columns, click_url=click_url, rank_column=RANKING_COLUMN)
|
209 |
print(f"original_df.columns: {original_df.columns}")
|
210 |
# print(original_df.columns)
|