Spaces:
Running
Running
Merge branch 'main' of https://huggingface.co/spaces/allenai/reward-bench-v2
Browse files
app.py
CHANGED
@@ -41,8 +41,8 @@ repo = snapshot_download(
|
|
41 |
###########################################
|
42 |
|
43 |
def avg_over_rewardbench_v2(dataframe_core):
|
44 |
-
domain_cols = ["
|
45 |
-
domain_weights = [
|
46 |
new_df = dataframe_core.copy()
|
47 |
|
48 |
# for main subsets, keys in subset_mapping, take the weighted avg by example_counts and store for the models
|
@@ -58,6 +58,8 @@ def avg_over_rewardbench_v2(dataframe_core):
|
|
58 |
keep_columns = ["model", "model_type", "average"] + domain_cols
|
59 |
new_df = new_df[keep_columns]
|
60 |
|
|
|
|
|
61 |
return new_df
|
62 |
|
63 |
def avg_over_rewardbench(dataframe_core, dataframe_prefs):
|
|
|
41 |
###########################################
|
42 |
|
43 |
def avg_over_rewardbench_v2(dataframe_core):
|
44 |
+
domain_cols = ["factuality", "precise if", "math", "safety", "chat", "ties"]
|
45 |
+
domain_weights = [1, 1, 1, 1, 1, 1]
|
46 |
new_df = dataframe_core.copy()
|
47 |
|
48 |
# for main subsets, keys in subset_mapping, take the weighted avg by example_counts and store for the models
|
|
|
58 |
keep_columns = ["model", "model_type", "average"] + domain_cols
|
59 |
new_df = new_df[keep_columns]
|
60 |
|
61 |
+
# TODO: if the final dataset version changes these column names, update domain_cols and comment out the rename below
|
62 |
+
new_df = new_df.rename(columns={"factuality": "Factuality", "precise if": "Precise IF", "math": "Math", "safety": "Safety", "chat": "Focus", "ties": "Ties"})
|
63 |
return new_df
|
64 |
|
65 |
def avg_over_rewardbench(dataframe_core, dataframe_prefs):
|