Update src/leaderboard/read_evals.py
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -173,7 +173,7 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
173 |
# Creation of result
|
174 |
eval_result = EvalResult.init_from_json_file(model_result_filepath)
|
175 |
eval_result.update_with_request_file(requests_path)
|
176 |
-
|
177 |
# Store results of same eval together
|
178 |
eval_name = eval_result.eval_name
|
179 |
if eval_name in eval_results.keys():
|
@@ -182,6 +182,7 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
182 |
eval_results[eval_name] = eval_result
|
183 |
|
184 |
results = []
|
|
|
185 |
for v in eval_results.values():
|
186 |
try:
|
187 |
v.to_dict() # we test if the dict version is complete
|
|
|
173 |
# Creation of result
|
174 |
eval_result = EvalResult.init_from_json_file(model_result_filepath)
|
175 |
eval_result.update_with_request_file(requests_path)
|
176 |
+
|
177 |
# Store results of same eval together
|
178 |
eval_name = eval_result.eval_name
|
179 |
if eval_name in eval_results.keys():
|
|
|
182 |
eval_results[eval_name] = eval_result
|
183 |
|
184 |
results = []
|
185 |
+
print(eval_results.values())
|
186 |
for v in eval_results.values():
|
187 |
try:
|
188 |
v.to_dict() # we test if the dict version is complete
|