choco9966 committed on
Commit
632706f
·
verified ·
1 Parent(s): 07cd8a1

Update src/tools/plots.py

Browse files
Files changed (1) hide show
  1. src/tools/plots.py +0 -16
src/tools/plots.py CHANGED
@@ -37,22 +37,6 @@ def create_scores_df(raw_data: list[EvalResult]) -> pd.DataFrame:
37
  current_date = row["date"]
38
  if task.benchmark == "Average":
39
  avg_skip_len = 0
40
- if row["results"]["ko_winogrande"] == 0.0:
41
- avg_skip_len += 1
42
- if row["results"]["ko_gsm8k"] == 0.0:
43
- avg_skip_len += 1
44
- if row["results"]["ko_eq_bench"] == 0.0:
45
- avg_skip_len += 1
46
- if row["results"]["ko_inst_follow"] == 0.0:
47
- avg_skip_len += 1
48
- if row["results"]["kor_nat_cka"] == 0.0:
49
- avg_skip_len += 1
50
- if row["results"]["kor_nat_sva"] == 0.0:
51
- avg_skip_len += 1
52
- if row["results"]["ko_harmlessness"] == 0.0:
53
- avg_skip_len += 1
54
- if row["results"]["ko_helpfulness"] == 0.0:
55
- avg_skip_len += 1
56
 
57
  current_score = np.sum(list(row["results"].values())) / (len(row["results"]) - avg_skip_len)
58
  else:
 
37
  current_date = row["date"]
38
  if task.benchmark == "Average":
39
  avg_skip_len = 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
 
41
  current_score = np.sum(list(row["results"].values())) / (len(row["results"]) - avg_skip_len)
42
  else: