Spaces:
Sleeping
Sleeping
IliaLarchenko
committed on
Commit
·
dd8cb56
1
Parent(s):
fae1562
Sorting by performance
Browse files
- tests/analysis.py +5 -1
tests/analysis.py
CHANGED
@@ -98,7 +98,11 @@ def generate_and_display_tables(df):
|
|
98 |
|
99 |
total_llm_scores = df.groupby("agent_llm")[prefix_columns].mean().mean(axis=1).sort_values(ascending=False)
|
100 |
# Grouped by unique interviewer model and sorted by descending total score
|
101 |
-
grouped_by_interviewer =
|
|
|
|
|
|
|
|
|
102 |
grouped_by_interviewer_styled = grouped_by_interviewer.style.map(highlight_color)
|
103 |
grouped_by_interviewer_styled.set_caption("Scores Grouped by Unique Interviewer Model")
|
104 |
|
|
|
98 |
|
99 |
total_llm_scores = df.groupby("agent_llm")[prefix_columns].mean().mean(axis=1).sort_values(ascending=False)
|
100 |
# Grouped by unique interviewer model and sorted by descending total score
|
101 |
+
grouped_by_interviewer = (
|
102 |
+
df.groupby("agent_llm")[["overall_score", "average_response_time_seconds", "number_of_messages"]]
|
103 |
+
.mean()
|
104 |
+
.reindex(total_llm_scores.index)
|
105 |
+
)
|
106 |
grouped_by_interviewer_styled = grouped_by_interviewer.style.map(highlight_color)
|
107 |
grouped_by_interviewer_styled.set_caption("Scores Grouped by Unique Interviewer Model")
|
108 |
|