Spaces:
Runtime error
Runtime error
Aaron Mueller
committed on
Commit
·
af94ea7
1
Parent(s):
c8abe7b
testing once more
Browse files
- src/leaderboard/read_evals.py +0 -3
- src/populate.py +2 -1
src/leaderboard/read_evals.py
CHANGED
@@ -109,7 +109,6 @@ class EvalResult:
|
|
109 |
AutoEvalColumn.still_on_hub.name: self.still_on_hub,
|
110 |
}
|
111 |
|
112 |
-
print(self.track, self.results.keys())
|
113 |
if self.track.lower() == "multimodal":
|
114 |
taskset = TasksMultimodal
|
115 |
else:
|
@@ -117,7 +116,6 @@ class EvalResult:
|
|
117 |
for task in taskset:
|
118 |
data_dict[task.value.col_name] = self.results[task.value.benchmark]
|
119 |
|
120 |
-
print("Made it for track", self.track)
|
121 |
return data_dict
|
122 |
|
123 |
|
@@ -181,5 +179,4 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
181 |
except KeyError: # not all eval values present
|
182 |
continue
|
183 |
|
184 |
-
print(results, len(results))
|
185 |
return results
|
|
|
109 |
AutoEvalColumn.still_on_hub.name: self.still_on_hub,
|
110 |
}
|
111 |
|
|
|
112 |
if self.track.lower() == "multimodal":
|
113 |
taskset = TasksMultimodal
|
114 |
else:
|
|
|
116 |
for task in taskset:
|
117 |
data_dict[task.value.col_name] = self.results[task.value.benchmark]
|
118 |
|
|
|
119 |
return data_dict
|
120 |
|
121 |
|
|
|
179 |
except KeyError: # not all eval values present
|
180 |
continue
|
181 |
|
|
|
182 |
return results
|
src/populate.py
CHANGED
@@ -14,13 +14,14 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
14 |
all_data_json = [v.to_dict() for v in raw_data]
|
15 |
all_data_json_filtered = []
|
16 |
for item in all_data_json:
|
|
|
17 |
if "VQA" in benchmark_cols and "vqa" in item:
|
18 |
all_data_json_filtered.append(item)
|
19 |
if "VQA" not in benchmark_cols and "vqa" not in item:
|
20 |
all_data_json_filtered.append(item)
|
21 |
all_data_json = all_data_json_filtered
|
22 |
|
23 |
-
print(all_data_json)
|
24 |
df = pd.DataFrame.from_records(all_data_json)
|
25 |
print(df)
|
26 |
# df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
|
|
14 |
all_data_json = [v.to_dict() for v in raw_data]
|
15 |
all_data_json_filtered = []
|
16 |
for item in all_data_json:
|
17 |
+
print(benchmark_cols, "|||", item.keys())
|
18 |
if "VQA" in benchmark_cols and "vqa" in item:
|
19 |
all_data_json_filtered.append(item)
|
20 |
if "VQA" not in benchmark_cols and "vqa" not in item:
|
21 |
all_data_json_filtered.append(item)
|
22 |
all_data_json = all_data_json_filtered
|
23 |
|
24 |
+
print("Filtered:", all_data_json, len(all_data_json))
|
25 |
df = pd.DataFrame.from_records(all_data_json)
|
26 |
print(df)
|
27 |
# df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|