yentinglin
committed on
Commit
•
5711a3c
1
Parent(s):
9b53393
add
Browse files
- src/leaderboard/read_evals.py +3 -0
- src/populate.py +0 -2
src/leaderboard/read_evals.py
CHANGED
@@ -175,7 +175,9 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
175 |
eval_results = {}
|
176 |
for model_result_filepath in model_result_filepaths:
|
177 |
# Creation of result
|
|
|
178 |
eval_result = EvalResult.init_from_json_file(model_result_filepath)
|
|
|
179 |
eval_result.update_with_request_file(requests_path)
|
180 |
|
181 |
# Store results of same eval together
|
@@ -184,6 +186,7 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
184 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
185 |
else:
|
186 |
eval_results[eval_name] = eval_result
|
|
|
187 |
|
188 |
results = []
|
189 |
for v in eval_results.values():
|
|
|
175 |
eval_results = {}
|
176 |
for model_result_filepath in model_result_filepaths:
|
177 |
# Creation of result
|
178 |
+
print(f"Model result filepath: {model_result_filepath}")
|
179 |
eval_result = EvalResult.init_from_json_file(model_result_filepath)
|
180 |
+
print(eval_result)
|
181 |
eval_result.update_with_request_file(requests_path)
|
182 |
|
183 |
# Store results of same eval together
|
|
|
186 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
187 |
else:
|
188 |
eval_results[eval_name] = eval_result
|
189 |
+
print(eval_results)
|
190 |
|
191 |
results = []
|
192 |
for v in eval_results.values():
|
src/populate.py
CHANGED
@@ -14,8 +14,6 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
14 |
all_data_json = [v.to_dict() for v in raw_data]
|
15 |
|
16 |
df = pd.DataFrame.from_records(all_data_json)
|
17 |
-
print(df.head())
|
18 |
-
print(df)
|
19 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
20 |
df = df[cols].round(decimals=2)
|
21 |
|
|
|
14 |
all_data_json = [v.to_dict() for v in raw_data]
|
15 |
|
16 |
df = pd.DataFrame.from_records(all_data_json)
|
|
|
|
|
17 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
18 |
df = df[cols].round(decimals=2)
|
19 |
|