yuchenlin committed on
Commit
42bdfa0
·
1 Parent(s): 29abfee

update the formatting. and links

Browse files
Files changed (2) hide show
  1. _header.md +1 -1
  2. app.py +3 -2
_header.md CHANGED
@@ -2,4 +2,4 @@
2
 
3
  # 🦓 ZebraLogic: On the Scaling Limits of LLMs for Logical Reasoning
4
  <!-- [📑 FnF Paper](https://arxiv.org/abs/2305.18654) | -->
5
- [📰 Blog](https://huggingface.co/blog/yuchenlin/zebra-logic) [💻 GitHub](https://github.com/WildEval/ZeroEval) | [🤗 HuggingFace](https://huggingface.co/collections/allenai/zebra-logic-bench-6697137cbaad0b91e635e7b0) | [🐦 X](https://twitter.com/billyuchenlin/) | [💬 Discussion](https://huggingface.co/spaces/allenai/ZebraLogicBench-Leaderboard/discussions) | Updated: **{LAST_UPDATED}**
 
2
 
3
  # 🦓 ZebraLogic: On the Scaling Limits of LLMs for Logical Reasoning
4
  <!-- [📑 FnF Paper](https://arxiv.org/abs/2305.18654) | -->
5
+ [📑 Paper](https://arxiv.org/abs/2502.01100) | [💻 GitHub](https://github.com/WildEval/ZeroEval) | [🤗 Dataset](https://huggingface.co/datasets/WildEval/ZebraLogic) | Updated: **{LAST_UPDATED}**
app.py CHANGED
@@ -190,7 +190,7 @@ def data_load(result_file):
190
  main_ordered_columns = ORDERED_COLUMN_NAMES
191
  # filter the data with Total Puzzles == 1000
192
 
193
- click_url = True
194
  # read json file from the result_file
195
  with open(result_file, "r") as f:
196
  raw_data = json.load(f)
@@ -203,7 +203,8 @@ def data_load(result_file):
203
  pass
204
  original_df = pd.DataFrame(raw_data)
205
  original_df = original_df[original_df["Total Puzzles"] == 1000]
206
-
 
207
  original_df = post_processing(original_df, column_names_main, ordered_columns=main_ordered_columns, click_url=click_url, rank_column=RANKING_COLUMN)
208
  print(f"original_df.columns: {original_df.columns}")
209
  # print(original_df.columns)
 
190
  main_ordered_columns = ORDERED_COLUMN_NAMES
191
  # filter the data with Total Puzzles == 1000
192
 
193
+ click_url = False
194
  # read json file from the result_file
195
  with open(result_file, "r") as f:
196
  raw_data = json.load(f)
 
203
  pass
204
  original_df = pd.DataFrame(raw_data)
205
  original_df = original_df[original_df["Total Puzzles"] == 1000]
206
+ # let's remove some models in the list: ["o1-preview-2024-09-12-v2", "o1-mini-2024-09-12-v2", "o1-mini-2024-09-12"]
207
+ original_df = original_df[~original_df["Model"].isin(["o1-preview-2024-09-12-v2", "o1-mini-2024-09-12-v2", "o1-mini-2024-09-12"])]
208
  original_df = post_processing(original_df, column_names_main, ordered_columns=main_ordered_columns, click_url=click_url, rank_column=RANKING_COLUMN)
209
  print(f"original_df.columns: {original_df.columns}")
210
  # print(original_df.columns)