natolambert committed on
Commit
9a9d913
·
2 Parent(s): 51d7804 bc5408b

Merge branch 'main' of https://huggingface.co/spaces/allenai/reward-bench-v2

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -41,8 +41,8 @@ repo = snapshot_download(
41
  ###########################################
42
 
43
  def avg_over_rewardbench_v2(dataframe_core):
44
- domain_cols = ["chat", "factuality", "safety", "math", "precise if", "ties"]
45
- domain_weights = [0, 1, 1, 1, 1, 1]
46
  new_df = dataframe_core.copy()
47
 
48
  # for main subsets, keys in subset_mapping, take the weighted avg by example_counts and store for the models
@@ -58,6 +58,8 @@ def avg_over_rewardbench_v2(dataframe_core):
58
  keep_columns = ["model", "model_type", "average"] + domain_cols
59
  new_df = new_df[keep_columns]
60
 
 
 
61
  return new_df
62
 
63
  def avg_over_rewardbench(dataframe_core, dataframe_prefs):
 
41
  ###########################################
42
 
43
  def avg_over_rewardbench_v2(dataframe_core):
44
+ domain_cols = ["factuality", "precise if", "math", "safety", "chat", "ties"]
45
+ domain_weights = [1, 1, 1, 1, 1, 1]
46
  new_df = dataframe_core.copy()
47
 
48
  # for main subsets, keys in subset_mapping, take the weighted avg by example_counts and store for the models
 
58
  keep_columns = ["model", "model_type", "average"] + domain_cols
59
  new_df = new_df[keep_columns]
60
 
61
+ # TODO: if the final dataset version renames these domains, update domain_cols to the new names and comment out the rename below
62
+ new_df = new_df.rename(columns={"factuality": "Factuality", "precise if": "Precise IF", "math": "Math", "safety": "Safety", "chat": "Focus", "ties": "Ties"})
63
  return new_df
64
 
65
  def avg_over_rewardbench(dataframe_core, dataframe_prefs):