Spaces: Running on CPU Upgrade
feat: implement anonymous displaying for long-doc
Browse files
- app.py +17 -7
- src/utils.py +8 -10
app.py
CHANGED
@@ -41,13 +41,14 @@ print(f'QA data loaded: {original_df_qa.shape}')
|
|
41 |
print(f'Long-Doc data loaded: {len(original_df_long_doc)}')
|
42 |
|
43 |
leaderboard_df_qa = original_df_qa.copy()
|
44 |
-
shown_columns_qa, types_qa = get_default_cols(
|
|
|
45 |
leaderboard_df_qa = leaderboard_df_qa[~leaderboard_df_qa[COL_NAME_IS_ANONYMOUS]][shown_columns_qa]
|
46 |
|
47 |
leaderboard_df_long_doc = original_df_long_doc.copy()
|
48 |
-
shown_columns_long_doc, types_long_doc = get_default_cols(
|
49 |
-
|
50 |
-
leaderboard_df_long_doc = leaderboard_df_long_doc[shown_columns_long_doc]
|
51 |
|
52 |
|
53 |
def update_metric_qa(
|
@@ -67,8 +68,9 @@ def update_metric_long_doc(
|
|
67 |
langs: list,
|
68 |
reranking_model: list,
|
69 |
query: str,
|
|
|
70 |
):
|
71 |
-
return update_metric(raw_data, "long-doc", metric, domains, langs, reranking_model, query)
|
72 |
|
73 |
|
74 |
demo = gr.Blocks(css=custom_css)
|
@@ -243,6 +245,12 @@ with demo:
|
|
243 |
multiselect=True,
|
244 |
interactive=True
|
245 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
246 |
|
247 |
leaderboard_table_long_doc = gr.components.Dataframe(
|
248 |
value=leaderboard_df_long_doc,
|
@@ -254,7 +262,7 @@ with demo:
|
|
254 |
|
255 |
# Dummy leaderboard for handling the case when the user uses backspace key
|
256 |
hidden_leaderboard_table_for_search = gr.components.Dataframe(
|
257 |
-
value=
|
258 |
datatype=types_long_doc,
|
259 |
visible=False,
|
260 |
)
|
@@ -274,7 +282,7 @@ with demo:
|
|
274 |
|
275 |
# Set column-wise listener
|
276 |
for selector in [
|
277 |
-
selected_domains, selected_langs, selected_rerankings
|
278 |
]:
|
279 |
selector.change(
|
280 |
update_table_long_doc,
|
@@ -284,6 +292,7 @@ with demo:
|
|
284 |
selected_langs,
|
285 |
selected_rerankings,
|
286 |
search_bar,
|
|
|
287 |
],
|
288 |
leaderboard_table_long_doc,
|
289 |
queue=True,
|
@@ -298,6 +307,7 @@ with demo:
|
|
298 |
selected_langs,
|
299 |
selected_rerankings,
|
300 |
search_bar,
|
|
|
301 |
],
|
302 |
leaderboard_table_long_doc,
|
303 |
queue=True
|
|
|
41 |
print(f'Long-Doc data loaded: {len(original_df_long_doc)}')
|
42 |
|
43 |
leaderboard_df_qa = original_df_qa.copy()
|
44 |
+
shown_columns_qa, types_qa = get_default_cols(
|
45 |
+
'qa', leaderboard_df_qa.columns, add_fix_cols=True)
|
46 |
leaderboard_df_qa = leaderboard_df_qa[~leaderboard_df_qa[COL_NAME_IS_ANONYMOUS]][shown_columns_qa]
|
47 |
|
48 |
leaderboard_df_long_doc = original_df_long_doc.copy()
|
49 |
+
shown_columns_long_doc, types_long_doc = get_default_cols(
|
50 |
+
'long-doc', leaderboard_df_long_doc.columns, add_fix_cols=True)
|
51 |
+
leaderboard_df_long_doc = leaderboard_df_long_doc[~leaderboard_df_long_doc[COL_NAME_IS_ANONYMOUS]][shown_columns_long_doc]
|
52 |
|
53 |
|
54 |
def update_metric_qa(
|
|
|
68 |
langs: list,
|
69 |
reranking_model: list,
|
70 |
query: str,
|
71 |
+
show_anonymous: bool
|
72 |
):
|
73 |
+
return update_metric(raw_data, "long-doc", metric, domains, langs, reranking_model, query, show_anonymous)
|
74 |
|
75 |
|
76 |
demo = gr.Blocks(css=custom_css)
|
|
|
245 |
multiselect=True,
|
246 |
interactive=True
|
247 |
)
|
248 |
+
with gr.Row():
|
249 |
+
show_anonymous = gr.Checkbox(
|
250 |
+
label="Show anonymous submissions",
|
251 |
+
value=False,
|
252 |
+
info="The anonymous submissions might have invalid model information."
|
253 |
+
)
|
254 |
|
255 |
leaderboard_table_long_doc = gr.components.Dataframe(
|
256 |
value=leaderboard_df_long_doc,
|
|
|
262 |
|
263 |
# Dummy leaderboard for handling the case when the user uses backspace key
|
264 |
hidden_leaderboard_table_for_search = gr.components.Dataframe(
|
265 |
+
value=original_df_long_doc,
|
266 |
datatype=types_long_doc,
|
267 |
visible=False,
|
268 |
)
|
|
|
282 |
|
283 |
# Set column-wise listener
|
284 |
for selector in [
|
285 |
+
selected_domains, selected_langs, selected_rerankings, show_anonymous
|
286 |
]:
|
287 |
selector.change(
|
288 |
update_table_long_doc,
|
|
|
292 |
selected_langs,
|
293 |
selected_rerankings,
|
294 |
search_bar,
|
295 |
+
show_anonymous,
|
296 |
],
|
297 |
leaderboard_table_long_doc,
|
298 |
queue=True,
|
|
|
307 |
selected_langs,
|
308 |
selected_rerankings,
|
309 |
search_bar,
|
310 |
+
show_anonymous,
|
311 |
],
|
312 |
leaderboard_table_long_doc,
|
313 |
queue=True
|
src/utils.py
CHANGED
@@ -107,15 +107,12 @@ def update_table(
|
|
107 |
query: str,
|
108 |
show_anonymous: bool
|
109 |
):
|
110 |
-
print(f"shown_anonymous: {show_anonymous}")
|
111 |
filtered_df = hidden_df
|
112 |
if not show_anonymous:
|
113 |
-
print(filtered_df[COL_NAME_IS_ANONYMOUS])
|
114 |
filtered_df = filtered_df[~filtered_df[COL_NAME_IS_ANONYMOUS]]
|
115 |
-
print(f"filtered_df: {len(filtered_df)}")
|
116 |
filtered_df = filter_models(filtered_df, reranking_query)
|
117 |
filtered_df = filter_queries(query, filtered_df)
|
118 |
-
df = select_columns(filtered_df, domains, langs)
|
119 |
return df
|
120 |
|
121 |
|
@@ -125,13 +122,14 @@ def update_table_long_doc(
|
|
125 |
langs: list,
|
126 |
reranking_query: list,
|
127 |
query: str,
|
128 |
-
|
129 |
):
|
130 |
-
filtered_df =
|
|
|
|
|
|
|
131 |
filtered_df = filter_queries(query, filtered_df)
|
132 |
df = select_columns(filtered_df, domains, langs, task='long_doc')
|
133 |
-
# if not show_anonymous:
|
134 |
-
# df = df[~df[COL_NAME_IS_ANONYMOUS]]
|
135 |
return df
|
136 |
|
137 |
|
@@ -143,7 +141,7 @@ def update_metric(
|
|
143 |
langs: list,
|
144 |
reranking_model: list,
|
145 |
query: str,
|
146 |
-
show_anonymous: bool
|
147 |
) -> pd.DataFrame:
|
148 |
if task == 'qa':
|
149 |
leaderboard_df = get_leaderboard_df(raw_data, task=task, metric=metric)
|
@@ -163,7 +161,7 @@ def update_metric(
|
|
163 |
langs,
|
164 |
reranking_model,
|
165 |
query,
|
166 |
-
|
167 |
)
|
168 |
|
169 |
|
|
|
107 |
query: str,
|
108 |
show_anonymous: bool
|
109 |
):
|
|
|
110 |
filtered_df = hidden_df
|
111 |
if not show_anonymous:
|
|
|
112 |
filtered_df = filtered_df[~filtered_df[COL_NAME_IS_ANONYMOUS]]
|
|
|
113 |
filtered_df = filter_models(filtered_df, reranking_query)
|
114 |
filtered_df = filter_queries(query, filtered_df)
|
115 |
+
df = select_columns(filtered_df, domains, langs, task='qa')
|
116 |
return df
|
117 |
|
118 |
|
|
|
122 |
langs: list,
|
123 |
reranking_query: list,
|
124 |
query: str,
|
125 |
+
show_anonymous: bool
|
126 |
):
|
127 |
+
filtered_df = hidden_df
|
128 |
+
if not show_anonymous:
|
129 |
+
filtered_df = filtered_df[~filtered_df[COL_NAME_IS_ANONYMOUS]]
|
130 |
+
filtered_df = filter_models(filtered_df, reranking_query)
|
131 |
filtered_df = filter_queries(query, filtered_df)
|
132 |
df = select_columns(filtered_df, domains, langs, task='long_doc')
|
|
|
|
|
133 |
return df
|
134 |
|
135 |
|
|
|
141 |
langs: list,
|
142 |
reranking_model: list,
|
143 |
query: str,
|
144 |
+
show_anonymous: bool = False
|
145 |
) -> pd.DataFrame:
|
146 |
if task == 'qa':
|
147 |
leaderboard_df = get_leaderboard_df(raw_data, task=task, metric=metric)
|
|
|
161 |
langs,
|
162 |
reranking_model,
|
163 |
query,
|
164 |
+
show_anonymous
|
165 |
)
|
166 |
|
167 |
|