lixuejing
committed on
Commit
·
9a1514a
1
Parent(s):
7bf32d2
fix acc
Browse files
- src/leaderboard/read_evals.py +1 -1
- src/populate.py +1 -0
src/leaderboard/read_evals.py
CHANGED
@@ -80,7 +80,7 @@ class EvalResult:
|
|
80 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
81 |
continue
|
82 |
|
83 |
-
mean_acc = np.mean(accs)
|
84 |
results[task.benchmark] = mean_acc
|
85 |
|
86 |
return self(
|
|
|
80 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
81 |
continue
|
82 |
|
83 |
+
mean_acc = np.mean(accs) if len(accs) > 0 else 0
|
84 |
results[task.benchmark] = mean_acc
|
85 |
|
86 |
return self(
|
src/populate.py
CHANGED
@@ -13,6 +13,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, dynamic_path: str,
|
|
13 |
"""Creates a dataframe from all the individual experiment results"""
|
14 |
raw_data = get_raw_eval_results(results_path, requests_path, dynamic_path)
|
15 |
all_data_json = [v.to_dict() for v in raw_data]
|
|
|
16 |
#all_data_json.append(baseline_row)
|
17 |
filter_models_flags(all_data_json)
|
18 |
|
|
|
13 |
"""Creates a dataframe from all the individual experiment results"""
|
14 |
raw_data = get_raw_eval_results(results_path, requests_path, dynamic_path)
|
15 |
all_data_json = [v.to_dict() for v in raw_data]
|
16 |
+
print("all_data_json", all_data_json)
|
17 |
#all_data_json.append(baseline_row)
|
18 |
filter_models_flags(all_data_json)
|
19 |
|