Spaces:
Runtime error
Runtime error
Commit
·
25e9dcd
1
Parent(s):
92ec2a2
Correct comp id computation
Browse files
utils.py
CHANGED
@@ -337,6 +337,9 @@ def get_benchmarks() -> Tuple[pd.DataFrame, Dict[str, Dict[str, float]]]:
|
|
337 |
for run in runs:
|
338 |
uid = run.config.get("uid", None)
|
339 |
model = run.config.get("model", None)
|
|
|
|
|
|
|
340 |
if not uid or not model:
|
341 |
continue
|
342 |
samples = list(
|
@@ -360,9 +363,7 @@ def get_benchmarks() -> Tuple[pd.DataFrame, Dict[str, Dict[str, float]]]:
|
|
360 |
if not has_all_keys:
|
361 |
continue
|
362 |
|
363 |
-
|
364 |
-
comp_name = sample.get("competition_id", "B7_MULTI_CHOICE")
|
365 |
-
comp_ids.append(COMP_NAME_TO_ID.get(comp_name, 2))
|
366 |
timestamps.append(datetime.datetime.fromtimestamp(sample["_timestamp"]))
|
367 |
mmlu.append(sample["mmlu.acc,none"])
|
368 |
mmlu_pro.append(sample["mmlu_pro"])
|
|
|
337 |
for run in runs:
|
338 |
uid = run.config.get("uid", None)
|
339 |
model = run.config.get("model", None)
|
340 |
+
# Any run without a competition_id was for competition 2.
|
341 |
+
comp_name = run.config.get("competition_id", "B7_MULTI_CHOICE")
|
342 |
+
comp_id = COMP_NAME_TO_ID.get(comp_name, 2)
|
343 |
if not uid or not model:
|
344 |
continue
|
345 |
samples = list(
|
|
|
363 |
if not has_all_keys:
|
364 |
continue
|
365 |
|
366 |
+
comp_ids.append(comp_id)
|
|
|
|
|
367 |
timestamps.append(datetime.datetime.fromtimestamp(sample["_timestamp"]))
|
368 |
mmlu.append(sample["mmlu.acc,none"])
|
369 |
mmlu_pro.append(sample["mmlu_pro"])
|