kaz-llm-lb

Running

hi-melnikov committed on May 24

Commit

b7741fd

•

1 Parent(s): b19c539

More verbose

Files changed (2) hide show

app.py CHANGED Viewed

@@ -108,7 +108,7 @@ def update_board():
     show_result_file = os.path.join(HF_HOME, "src/gen/show_result.py")
     subprocess.run(["python3", show_result_file, "--output"], check=True)
-    # update the gr item
     # TODO

     show_result_file = os.path.join(HF_HOME, "src/gen/show_result.py")
     subprocess.run(["python3", show_result_file, "--output"], check=True)
+    # update the gr item with leaderboard
     # TODO

src/leaderboard/build_leaderboard.py CHANGED Viewed

@@ -61,14 +61,17 @@ def download_openbench():
     # download answers of different models that we trust
     download_dataset("Vikhrmodels/openbench-eval", EVAL_RESULTS_PATH)
-    subprocess.run(["ls", EVAL_RESULTS_PATH], check=True)
     # copy the trusted model answers to data
     subprocess.run(
         [
             "rsync",
-            "-azP",
-            "--ignore-existing",
             f"{EVAL_RESULTS_PATH}/internal/*",
             f"{DATA_ARENA_PATH}/model_answer/internal/",
         ],
@@ -79,8 +82,7 @@ def download_openbench():
     subprocess.run(
         [
             "rsync",
-            "-azP",
-            "--ignore-existing",
             f"{EVAL_RESULTS_PATH}/model_judgment/*",
             f"{DATA_ARENA_PATH}/model_judgement/",
         ],

     # download answers of different models that we trust
     download_dataset("Vikhrmodels/openbench-eval", EVAL_RESULTS_PATH)
+    logging.info("\nInternal models in openbench-eval:")
+    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/internal/"], check=True)
+    logging.info("\nJudgement in openbench-eval")
+    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/model_judgment/"], check=True)
     # copy the trusted model answers to data
     subprocess.run(
         [
             "rsync",
+            "-azPvh",
             f"{EVAL_RESULTS_PATH}/internal/*",
             f"{DATA_ARENA_PATH}/model_answer/internal/",
         ],
     subprocess.run(
         [
             "rsync",
+            "-azPvh",
             f"{EVAL_RESULTS_PATH}/model_judgment/*",
             f"{DATA_ARENA_PATH}/model_judgement/",
         ],