Spaces:

babylm
/

leaderboard-2024

Running

Aaron Mueller committed on Dec 2, 2024

Commit

d162626

1 Parent(s): 31b9f7c

debugging

Files changed (2) hide show

src/leaderboard/read_evals.py CHANGED Viewed

@@ -56,7 +56,6 @@ class EvalResult:
         def _get_task_results(task):
             # We average all scores of a given metric (not all metrics are present in all files)
-            print(data["results"].items())
             accs = np.array([v.get(task.metric, None) for k, v in data["results"].items() if task.benchmark == k])
             if accs.size == 0 or any([acc is None for acc in accs]):
                 return None

         def _get_task_results(task):
             # We average all scores of a given metric (not all metrics are present in all files)
             accs = np.array([v.get(task.metric, None) for k, v in data["results"].items() if task.benchmark == k])
             if accs.size == 0 or any([acc is None for acc in accs]):
                 return None

src/submission/submit.py CHANGED Viewed

@@ -47,19 +47,25 @@ def add_new_eval(
     out_message = ""
     # Is the model info correctly filled?
     try:
         model_info = API.model_info(repo_id=model_id, revision=revision)
     except Exception:
         out_message += styled_warning("Could not get your model information. The leaderboard entry will not have a link to its HF repo.") + "<br>"
     modelcard_OK, error_msg = check_model_card(model_name)
     if not modelcard_OK:
         out_message += styled_warning(error_msg) + "<br>"
     predictions_OK, error_msg = is_valid_predictions(predictions)
     if not predictions_OK:
         return styled_error(error_msg) + "<br>"
     # Seems good, creating the eval
     print("Adding new eval")
@@ -74,6 +80,8 @@ def add_new_eval(
         "private": False,
     }
     # Check for duplicate submission
     if f"{model_name}_{revision}_{track}" in REQUESTED_MODELS:
         return styled_error("A model with this name has been already submitted.")
@@ -83,6 +91,8 @@ def add_new_eval(
     os.makedirs(OUT_DIR, exist_ok=True)
     out_path = f"{OUT_DIR}/{model_path}_{revision}_eval_request_False_{track}.json"
     with open(out_path, "w") as f:
         f.write(json.dumps(eval_entry))
@@ -95,6 +105,8 @@ def add_new_eval(
         commit_message=f"Add {model_name} to eval queue",
     )
     # Remove the local file
     os.remove(out_path)

     out_message = ""
     # Is the model info correctly filled?
+    print("Made it before 1")
     try:
         model_info = API.model_info(repo_id=model_id, revision=revision)
     except Exception:
         out_message += styled_warning("Could not get your model information. The leaderboard entry will not have a link to its HF repo.") + "<br>"
+    print("Made it after 1")
     modelcard_OK, error_msg = check_model_card(model_name)
     if not modelcard_OK:
         out_message += styled_warning(error_msg) + "<br>"
+    print("Made it after 2")
     predictions_OK, error_msg = is_valid_predictions(predictions)
     if not predictions_OK:
         return styled_error(error_msg) + "<br>"
+    print("Made it after 3")
     # Seems good, creating the eval
     print("Adding new eval")
         "private": False,
     }
+    print("Made it after 4")
     # Check for duplicate submission
     if f"{model_name}_{revision}_{track}" in REQUESTED_MODELS:
         return styled_error("A model with this name has been already submitted.")
     os.makedirs(OUT_DIR, exist_ok=True)
     out_path = f"{OUT_DIR}/{model_path}_{revision}_eval_request_False_{track}.json"
+    print("Made it after 5")
     with open(out_path, "w") as f:
         f.write(json.dumps(eval_entry))
         commit_message=f"Add {model_name} to eval queue",
     )
+    print("Made it after 6")
     # Remove the local file
     os.remove(out_path)