lixuejing committed on
Commit
9a1514a
·
1 Parent(s): 7bf32d2
Files changed (2) hide show
  1. src/leaderboard/read_evals.py +1 -1
  2. src/populate.py +1 -0
src/leaderboard/read_evals.py CHANGED
@@ -80,7 +80,7 @@ class EvalResult:
80
  if accs.size == 0 or any([acc is None for acc in accs]):
81
  continue
82
 
83
- mean_acc = np.mean(accs) * 100.0
84
  results[task.benchmark] = mean_acc
85
 
86
  return self(
 
80
  if accs.size == 0 or any([acc is None for acc in accs]):
81
  continue
82
 
83
+ mean_acc = np.mean(accs) if len(accs) > 0 else 0
84
  results[task.benchmark] = mean_acc
85
 
86
  return self(
src/populate.py CHANGED
@@ -13,6 +13,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, dynamic_path: str,
13
  """Creates a dataframe from all the individual experiment results"""
14
  raw_data = get_raw_eval_results(results_path, requests_path, dynamic_path)
15
  all_data_json = [v.to_dict() for v in raw_data]
 
16
  #all_data_json.append(baseline_row)
17
  filter_models_flags(all_data_json)
18
 
 
13
  """Creates a dataframe from all the individual experiment results"""
14
  raw_data = get_raw_eval_results(results_path, requests_path, dynamic_path)
15
  all_data_json = [v.to_dict() for v in raw_data]
16
+ print("all_data_json", all_data_json)
17
  #all_data_json.append(baseline_row)
18
  filter_models_flags(all_data_json)
19