brunneis committed on
Commit
8a1fb40
·
verified ·
1 Parent(s): 256be18

Update src/leaderboard/read_evals.py

Browse files
Files changed (1) hide show
  1. src/leaderboard/read_evals.py +2 -2
src/leaderboard/read_evals.py CHANGED
@@ -131,9 +131,9 @@ class EvalResult:
131
  non_zero_scores = {k: v for k, v in scores.items() if v != 0}
132
  if non_zero_scores:
133
  weights = {
134
- 'naive_judge': 0.3,
135
  'human_eval_solidity_pass_1': 0.5,
136
- 'human_eval_solidity_pass_3': 0.2
137
  }
138
  total_weight = sum(weights[k] for k in non_zero_scores)
139
  soliditybench = sum(scores[k] * weights[k] / total_weight for k in non_zero_scores)
 
131
  non_zero_scores = {k: v for k, v in scores.items() if v != 0}
132
  if non_zero_scores:
133
  weights = {
134
+ 'naive_judge': 0.1,
135
  'human_eval_solidity_pass_1': 0.5,
136
+ 'human_eval_solidity_pass_3': 0.4
137
  }
138
  total_weight = sum(weights[k] for k in non_zero_scores)
139
  soliditybench = sum(scores[k] * weights[k] / total_weight for k in non_zero_scores)