djstrong committed on
Commit
2be0a05
·
1 Parent(s): 6a07d0b
Files changed (1) hide show
  1. src/leaderboard/read_evals.py +1 -1
src/leaderboard/read_evals.py CHANGED
@@ -106,7 +106,7 @@ class EvalResult:
106
  task = task.value
107
 
108
  task_n_shot_num = n_shot_num
109
- if 'perplexity' in task.metric: # perplexity is the same for 0-shot and 5-shot and is calculated only with 0-shot
110
  task_n_shot_num = 0
111
 
112
  # We average all scores of a given metric (not all metrics are present in all files)
 
106
  task = task.value
107
 
108
  task_n_shot_num = n_shot_num
109
+ if 'perplexity' in task.metric or task.benchmark=='polish_eq_bench': # perplexity is the same for 0-shot and 5-shot and is calculated only with 0-shot
110
  task_n_shot_num = 0
111
 
112
  # We average all scores of a given metric (not all metrics are present in all files)