Spaces:
Running
Running
Aaron Mueller
committed on
Commit
·
8f1a599
1
Parent(s):
5285ff5
fix order of averages
Browse files
- src/display/utils.py +2 -1
- src/leaderboard/read_evals.py +1 -1
src/display/utils.py
CHANGED
@@ -38,7 +38,8 @@ auto_eval_column_dict_multimodal.append(["model", ColumnContent, ColumnContent("
|
|
38 |
auto_eval_column_dict_multimodal.append(["track", ColumnContent, ColumnContent("Track", "markdown", False)])
|
39 |
for task in TasksMultimodal:
|
40 |
auto_eval_column_dict_multimodal.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
|
41 |
-
|
|
|
42 |
auto_eval_column_dict_multimodal.append(["vision_average", ColumnContent, ColumnContent("Vision Average", "number", True)])
|
43 |
auto_eval_column_dict_multimodal.append(["still_on_hub", ColumnContent, ColumnContent("Available on the hub", "bool", False)])
|
44 |
auto_eval_column_dict_multimodal.append(["revision", ColumnContent, ColumnContent("Model sha", "str", False, False)])
|
|
|
38 |
auto_eval_column_dict_multimodal.append(["track", ColumnContent, ColumnContent("Track", "markdown", False)])
|
39 |
for task in TasksMultimodal:
|
40 |
auto_eval_column_dict_multimodal.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
|
41 |
+
if task.name in ("ewok", "EWoK"): # make sure this appears in the right order
|
42 |
+
auto_eval_column_dict_multimodal.append(["text_average", ColumnContent, ColumnContent("Text Average", "number", True)])
|
43 |
auto_eval_column_dict_multimodal.append(["vision_average", ColumnContent, ColumnContent("Vision Average", "number", True)])
|
44 |
auto_eval_column_dict_multimodal.append(["still_on_hub", ColumnContent, ColumnContent("Available on the hub", "bool", False)])
|
45 |
auto_eval_column_dict_multimodal.append(["revision", ColumnContent, ColumnContent("Model sha", "str", False, False)])
|
src/leaderboard/read_evals.py
CHANGED
@@ -102,7 +102,7 @@ class EvalResult:
|
|
102 |
def to_dict(self):
|
103 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
104 |
eval_column = AutoEvalColumnMultimodal if self.track.lower() == "multimodal" else AutoEvalColumn
|
105 |
-
vision_tasks = ("VQA", "Winoground", "DevBench")
|
106 |
text_average = sum([v for k, v in self.results.items() if v is not None and k not in vision_tasks]) / len(Tasks)
|
107 |
data_dict = {
|
108 |
"eval_name": self.eval_name, # not a column, just a save name,
|
|
|
102 |
def to_dict(self):
|
103 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
104 |
eval_column = AutoEvalColumnMultimodal if self.track.lower() == "multimodal" else AutoEvalColumn
|
105 |
+
vision_tasks = ("VQA", "Winoground", "DevBench", "vqa", "winoground", "devbench")
|
106 |
text_average = sum([v for k, v in self.results.items() if v is not None and k not in vision_tasks]) / len(Tasks)
|
107 |
data_dict = {
|
108 |
"eval_name": self.eval_name, # not a column, just a save name,
|