Aaron Mueller committed on
Commit
8f1a599
·
1 Parent(s): 5285ff5

fix order of averages

Browse files
src/display/utils.py CHANGED
@@ -38,7 +38,8 @@ auto_eval_column_dict_multimodal.append(["model", ColumnContent, ColumnContent("
38
  auto_eval_column_dict_multimodal.append(["track", ColumnContent, ColumnContent("Track", "markdown", False)])
39
  for task in TasksMultimodal:
40
  auto_eval_column_dict_multimodal.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
41
- auto_eval_column_dict_multimodal.append(["text_average", ColumnContent, ColumnContent("Text Average", "number", True)])
 
42
  auto_eval_column_dict_multimodal.append(["vision_average", ColumnContent, ColumnContent("Vision Average", "number", True)])
43
  auto_eval_column_dict_multimodal.append(["still_on_hub", ColumnContent, ColumnContent("Available on the hub", "bool", False)])
44
  auto_eval_column_dict_multimodal.append(["revision", ColumnContent, ColumnContent("Model sha", "str", False, False)])
 
38
  auto_eval_column_dict_multimodal.append(["track", ColumnContent, ColumnContent("Track", "markdown", False)])
39
  for task in TasksMultimodal:
40
  auto_eval_column_dict_multimodal.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
41
+ if task.name in ("ewok", "EWoK"): # make sure this appears in the right order
42
+ auto_eval_column_dict_multimodal.append(["text_average", ColumnContent, ColumnContent("Text Average", "number", True)])
43
  auto_eval_column_dict_multimodal.append(["vision_average", ColumnContent, ColumnContent("Vision Average", "number", True)])
44
  auto_eval_column_dict_multimodal.append(["still_on_hub", ColumnContent, ColumnContent("Available on the hub", "bool", False)])
45
  auto_eval_column_dict_multimodal.append(["revision", ColumnContent, ColumnContent("Model sha", "str", False, False)])
src/leaderboard/read_evals.py CHANGED
@@ -102,7 +102,7 @@ class EvalResult:
102
  def to_dict(self):
103
  """Converts the Eval Result to a dict compatible with our dataframe display"""
104
  eval_column = AutoEvalColumnMultimodal if self.track.lower() == "multimodal" else AutoEvalColumn
105
- vision_tasks = ("VQA", "Winoground", "DevBench")
106
  text_average = sum([v for k, v in self.results.items() if v is not None and k not in vision_tasks]) / len(Tasks)
107
  data_dict = {
108
  "eval_name": self.eval_name, # not a column, just a save name,
 
102
  def to_dict(self):
103
  """Converts the Eval Result to a dict compatible with our dataframe display"""
104
  eval_column = AutoEvalColumnMultimodal if self.track.lower() == "multimodal" else AutoEvalColumn
105
+ vision_tasks = ("VQA", "Winoground", "DevBench", "vqa", "winoground", "devbench")
106
  text_average = sum([v for k, v in self.results.items() if v is not None and k not in vision_tasks]) / len(Tasks)
107
  data_dict = {
108
  "eval_name": self.eval_name, # not a column, just a save name,