kaz-llm-lb

Paused

hi-melnikov committed on May 24, 2024

Commit

9ee8875

1 Parent(s): 103ed5f

Still trying to find out why it crashes

Files changed (1) hide show

src/leaderboard/build_leaderboard.py CHANGED Viewed

@@ -61,14 +61,16 @@ def download_openbench():
     # download answers of different models that we trust
     download_dataset("Vikhrmodels/openbench-eval", EVAL_RESULTS_PATH)
-    logging.info("\nFiles openbench-eval:")
-    subprocess.run(["ls", EVAL_RESULTS_PATH], check=True)
-    logging.info("\nInternal models in openbench-eval:")
-    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/internal/"], check=True)
-    logging.info("\nJudgement in openbench-eval")
-    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/model_judgment/"], check=True)
     # copy the trusted model answers to data
     subprocess.run(

     # download answers of different models that we trust
     download_dataset("Vikhrmodels/openbench-eval", EVAL_RESULTS_PATH)
+    subprocess.run(["pwd"], check=False)
+    logging.info(EVAL_RESULTS_PATH)
+    print("\nFiles openbench-eval:")
+    subprocess.run(["ls", EVAL_RESULTS_PATH], check=False)
+    print("\nInternal models in openbench-eval:")
+    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/internal/"], check=False)
+    print("\nJudgement in openbench-eval")
+    subprocess.run(["ls", f"{EVAL_RESULTS_PATH}/model_judgment/gpt-4-1106-preview"], check=False)
     # copy the trusted model answers to data
     subprocess.run(