Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
fix: fix the long-doc version updating bug
Browse files
app.py
CHANGED
@@ -122,17 +122,28 @@ def update_qa_domains(version):
|
|
122 |
return domain_elem
|
123 |
|
124 |
|
|
|
|
|
|
|
|
|
|
|
125 |
def update_qa_langs(version):
|
126 |
datastore = update_datastore(version)
|
127 |
lang_elem = get_language_dropdown(QABenchmarks[datastore.slug])
|
128 |
return lang_elem
|
129 |
|
130 |
|
|
|
|
|
|
|
|
|
|
|
131 |
def update_qa_models(version):
|
132 |
datastore = update_datastore(version)
|
133 |
model_elem = get_reranking_dropdown(datastore.reranking_models)
|
134 |
return model_elem
|
135 |
|
|
|
136 |
def update_qa_df_ret_rerank(version):
|
137 |
datastore = update_datastore(version)
|
138 |
return get_leaderboard_table(datastore.qa_fmt_df, datastore.qa_types)
|
@@ -142,6 +153,16 @@ def update_qa_hidden_df_ret_rerank(version):
|
|
142 |
return get_leaderboard_table(datastore.qa_raw_df, datastore.qa_types, visible=False)
|
143 |
|
144 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
145 |
def filter_df_ret(df):
|
146 |
df_ret = df[df[COL_NAME_RERANKING_MODEL] == "NoReranker"]
|
147 |
df_ret = reset_rank(df_ret)
|
@@ -152,12 +173,24 @@ def update_qa_df_ret(version):
|
|
152 |
df_ret = filter_df_ret(datastore.qa_fmt_df)
|
153 |
return get_leaderboard_table(df_ret, datastore.qa_types)
|
154 |
|
|
|
155 |
def update_qa_hidden_df_ret(version):
|
156 |
datastore = update_datastore(version)
|
157 |
df_ret_hidden = filter_df_ret(datastore.qa_raw_df)
|
158 |
return get_leaderboard_table(df_ret_hidden, datastore.qa_types, visible=False)
|
159 |
|
160 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
161 |
def filter_df_rerank(df):
|
162 |
df_rerank = df[df[COL_NAME_RETRIEVAL_MODEL] == BM25_LINK]
|
163 |
df_rerank = reset_rank(df_rerank)
|
@@ -173,17 +206,26 @@ def update_qa_hidden_df_rerank(version):
|
|
173 |
df_rerank_hidden = filter_df_rerank(datastore.qa_raw_df)
|
174 |
return get_leaderboard_table(df_rerank_hidden, datastore.qa_types, visible=False)
|
175 |
|
|
|
|
|
|
|
|
|
176 |
|
177 |
-
def
|
178 |
-
|
179 |
-
|
180 |
-
datastore =
|
181 |
-
|
182 |
-
|
183 |
-
|
184 |
-
|
185 |
-
|
186 |
-
|
|
|
|
|
|
|
|
|
|
|
187 |
|
188 |
|
189 |
demo = gr.Blocks(css=custom_css)
|
@@ -409,9 +451,19 @@ with demo:
|
|
409 |
# select domain
|
410 |
with gr.Row():
|
411 |
domains = get_domain_dropdown(LongDocBenchmarks[datastore.slug])
|
|
|
|
|
|
|
|
|
|
|
412 |
# select language
|
413 |
with gr.Row():
|
414 |
langs = get_language_dropdown(LongDocBenchmarks[datastore.slug])
|
|
|
|
|
|
|
|
|
|
|
415 |
with gr.Column():
|
416 |
# select the metric
|
417 |
with gr.Row():
|
@@ -427,18 +479,28 @@ with demo:
|
|
427 |
search_bar = get_search_bar()
|
428 |
with gr.Column():
|
429 |
models = get_reranking_dropdown(datastore.reranking_models)
|
|
|
|
|
|
|
|
|
|
|
430 |
|
431 |
doc_df_elem_ret_rerank = get_leaderboard_table(datastore.doc_fmt_df, datastore.doc_types)
|
432 |
|
433 |
-
|
|
|
|
|
|
|
|
|
|
|
434 |
doc_df_elem_ret_rerank_hidden = get_leaderboard_table(
|
435 |
datastore.doc_raw_df, datastore.doc_types, visible=False
|
436 |
)
|
437 |
|
438 |
version.change(
|
439 |
-
|
440 |
version,
|
441 |
-
|
442 |
)
|
443 |
|
444 |
set_listeners(
|
@@ -475,31 +537,22 @@ with demo:
|
|
475 |
search_bar_ret = get_search_bar()
|
476 |
with gr.Column(scale=1):
|
477 |
models_ret = get_noreranking_dropdown()
|
478 |
-
|
479 |
-
_doc_df_ret = datastore.doc_fmt_df[
|
480 |
-
datastore.doc_fmt_df[COL_NAME_RERANKING_MODEL] == "NoReranker"
|
481 |
-
]
|
482 |
-
_doc_df_ret = reset_rank(_doc_df_ret)
|
483 |
doc_df_elem_ret = get_leaderboard_table(_doc_df_ret, datastore.doc_types)
|
|
|
|
|
|
|
|
|
|
|
484 |
|
485 |
-
_doc_df_ret_hidden = datastore.doc_raw_df
|
486 |
-
datastore.doc_raw_df[COL_NAME_RERANKING_MODEL] == "NoReranker"
|
487 |
-
]
|
488 |
-
_doc_df_ret_hidden = reset_rank(_doc_df_ret_hidden)
|
489 |
doc_df_elem_ret_hidden = get_leaderboard_table(
|
490 |
_doc_df_ret_hidden, datastore.doc_types, visible=False
|
491 |
)
|
492 |
-
|
493 |
version.change(
|
494 |
-
|
495 |
version,
|
496 |
-
|
497 |
-
domains,
|
498 |
-
langs,
|
499 |
-
models_ret,
|
500 |
-
doc_df_elem_ret,
|
501 |
-
doc_df_elem_ret_hidden
|
502 |
-
],
|
503 |
)
|
504 |
|
505 |
set_listeners(
|
@@ -530,10 +583,7 @@ with demo:
|
|
530 |
queue=True,
|
531 |
)
|
532 |
with gr.TabItem("Reranking Only", id=22):
|
533 |
-
_doc_df_rerank = datastore.doc_fmt_df
|
534 |
-
datastore.doc_fmt_df[COL_NAME_RETRIEVAL_MODEL] == BM25_LINK
|
535 |
-
]
|
536 |
-
_doc_df_rerank = reset_rank(_doc_df_rerank)
|
537 |
doc_rerank_models = (
|
538 |
_doc_df_rerank[COL_NAME_RERANKING_MODEL].apply(remove_html).unique().tolist()
|
539 |
)
|
@@ -543,18 +593,21 @@ with demo:
|
|
543 |
with gr.Column(scale=1):
|
544 |
doc_search_bar_rerank = gr.Textbox(show_label=False, visible=False)
|
545 |
doc_df_elem_rerank = get_leaderboard_table(_doc_df_rerank, datastore.doc_types)
|
546 |
-
|
547 |
-
|
548 |
-
|
549 |
-
|
|
|
|
|
|
|
550 |
doc_df_elem_rerank_hidden = get_leaderboard_table(
|
551 |
_doc_df_rerank_hidden, datastore.doc_types, visible=False
|
552 |
)
|
553 |
|
554 |
version.change(
|
555 |
-
|
556 |
version,
|
557 |
-
|
558 |
)
|
559 |
|
560 |
set_listeners(
|
|
|
122 |
return domain_elem
|
123 |
|
124 |
|
125 |
+
def update_doc_domains(version):
|
126 |
+
datastore = update_datastore(version)
|
127 |
+
domain_elem = get_domain_dropdown(LongDocBenchmarks[datastore.slug])
|
128 |
+
return domain_elem
|
129 |
+
|
130 |
def update_qa_langs(version):
|
131 |
datastore = update_datastore(version)
|
132 |
lang_elem = get_language_dropdown(QABenchmarks[datastore.slug])
|
133 |
return lang_elem
|
134 |
|
135 |
|
136 |
+
def update_doc_langs(version):
|
137 |
+
datastore = update_datastore(version)
|
138 |
+
lang_elem = get_language_dropdown(LongDocBenchmarks[datastore.slug])
|
139 |
+
return lang_elem
|
140 |
+
|
141 |
def update_qa_models(version):
|
142 |
datastore = update_datastore(version)
|
143 |
model_elem = get_reranking_dropdown(datastore.reranking_models)
|
144 |
return model_elem
|
145 |
|
146 |
+
|
147 |
def update_qa_df_ret_rerank(version):
|
148 |
datastore = update_datastore(version)
|
149 |
return get_leaderboard_table(datastore.qa_fmt_df, datastore.qa_types)
|
|
|
153 |
return get_leaderboard_table(datastore.qa_raw_df, datastore.qa_types, visible=False)
|
154 |
|
155 |
|
156 |
+
def update_doc_df_ret_rerank(version):
|
157 |
+
datastore = update_datastore(version)
|
158 |
+
return get_leaderboard_table(datastore.doc_fmt_df, datastore.doc_types)
|
159 |
+
|
160 |
+
|
161 |
+
def update_doc_hidden_df_ret_rerank(version):
|
162 |
+
datastore = update_datastore(version)
|
163 |
+
return get_leaderboard_table(datastore.doc_raw_df, datastore.doc_types, visible=False)
|
164 |
+
|
165 |
+
|
166 |
def filter_df_ret(df):
|
167 |
df_ret = df[df[COL_NAME_RERANKING_MODEL] == "NoReranker"]
|
168 |
df_ret = reset_rank(df_ret)
|
|
|
173 |
df_ret = filter_df_ret(datastore.qa_fmt_df)
|
174 |
return get_leaderboard_table(df_ret, datastore.qa_types)
|
175 |
|
176 |
+
|
177 |
def update_qa_hidden_df_ret(version):
|
178 |
datastore = update_datastore(version)
|
179 |
df_ret_hidden = filter_df_ret(datastore.qa_raw_df)
|
180 |
return get_leaderboard_table(df_ret_hidden, datastore.qa_types, visible=False)
|
181 |
|
182 |
|
183 |
+
def update_doc_df_ret(version):
|
184 |
+
datastore = update_datastore(version)
|
185 |
+
df_ret = filter_df_ret(datastore.doc_fmt_df)
|
186 |
+
return get_leaderboard_table(df_ret, datastore.doc_types)
|
187 |
+
|
188 |
+
|
189 |
+
def update_doc_hidden_df_ret(version):
|
190 |
+
datastore = update_datastore(version)
|
191 |
+
df_ret_hidden = filter_df_ret(datastore.doc_raw_df)
|
192 |
+
return get_leaderboard_table(df_ret_hidden, datastore.doc_types, visible=False)
|
193 |
+
|
194 |
def filter_df_rerank(df):
|
195 |
df_rerank = df[df[COL_NAME_RETRIEVAL_MODEL] == BM25_LINK]
|
196 |
df_rerank = reset_rank(df_rerank)
|
|
|
206 |
df_rerank_hidden = filter_df_rerank(datastore.qa_raw_df)
|
207 |
return get_leaderboard_table(df_rerank_hidden, datastore.qa_types, visible=False)
|
208 |
|
209 |
+
def update_doc_df_rerank(version):
|
210 |
+
datastore = update_datastore(version)
|
211 |
+
df_rerank = filter_df_rerank(datastore.doc_fmt_df)
|
212 |
+
return get_leaderboard_table(df_rerank, datastore.doc_types)
|
213 |
|
214 |
+
def update_doc_hidden_df_rerank(version):
|
215 |
+
datastore = update_datastore(version)
|
216 |
+
df_rerank_hidden = filter_df_rerank(datastore.doc_raw_df)
|
217 |
+
return get_leaderboard_table(df_rerank_hidden, datastore.doc_types, visible=False)
|
218 |
+
|
219 |
+
# def update_doc_version(version):
|
220 |
+
# global datastore
|
221 |
+
# global ds_dict
|
222 |
+
# datastore = ds_dict[version]
|
223 |
+
# # domain_elem = get_domain_dropdown(LongDocBenchmarks[datastore.slug])
|
224 |
+
# # lang_elem = get_language_dropdown(LongDocBenchmarks[datastore.slug])
|
225 |
+
# # model_elem = get_reranking_dropdown(datastore.reranking_models)
|
226 |
+
# df_elem = get_leaderboard_table(datastore.doc_fmt_df, datastore.doc_types)
|
227 |
+
# hidden_df_elem = get_leaderboard_table(datastore.doc_raw_df, datastore.doc_types, visible=False)
|
228 |
+
# return domain_elem, lang_elem, model_elem, df_elem, hidden_df_elem
|
229 |
|
230 |
|
231 |
demo = gr.Blocks(css=custom_css)
|
|
|
451 |
# select domain
|
452 |
with gr.Row():
|
453 |
domains = get_domain_dropdown(LongDocBenchmarks[datastore.slug])
|
454 |
+
version.change(
|
455 |
+
update_doc_domains,
|
456 |
+
version,
|
457 |
+
domains
|
458 |
+
)
|
459 |
# select language
|
460 |
with gr.Row():
|
461 |
langs = get_language_dropdown(LongDocBenchmarks[datastore.slug])
|
462 |
+
version.change(
|
463 |
+
update_doc_langs,
|
464 |
+
version,
|
465 |
+
langs
|
466 |
+
)
|
467 |
with gr.Column():
|
468 |
# select the metric
|
469 |
with gr.Row():
|
|
|
479 |
search_bar = get_search_bar()
|
480 |
with gr.Column():
|
481 |
models = get_reranking_dropdown(datastore.reranking_models)
|
482 |
+
version.change(
|
483 |
+
update_qa_models,
|
484 |
+
version,
|
485 |
+
models
|
486 |
+
)
|
487 |
|
488 |
doc_df_elem_ret_rerank = get_leaderboard_table(datastore.doc_fmt_df, datastore.doc_types)
|
489 |
|
490 |
+
version.change(
|
491 |
+
update_doc_df_ret_rerank,
|
492 |
+
version,
|
493 |
+
doc_df_elem_ret_rerank
|
494 |
+
)
|
495 |
+
|
496 |
doc_df_elem_ret_rerank_hidden = get_leaderboard_table(
|
497 |
datastore.doc_raw_df, datastore.doc_types, visible=False
|
498 |
)
|
499 |
|
500 |
version.change(
|
501 |
+
update_doc_hidden_df_ret_rerank,
|
502 |
version,
|
503 |
+
doc_df_elem_ret_rerank_hidden
|
504 |
)
|
505 |
|
506 |
set_listeners(
|
|
|
537 |
search_bar_ret = get_search_bar()
|
538 |
with gr.Column(scale=1):
|
539 |
models_ret = get_noreranking_dropdown()
|
540 |
+
_doc_df_ret = filter_df_ret(datastore.doc_fmt_df)
|
|
|
|
|
|
|
|
|
541 |
doc_df_elem_ret = get_leaderboard_table(_doc_df_ret, datastore.doc_types)
|
542 |
+
version.change(
|
543 |
+
update_doc_df_ret,
|
544 |
+
version,
|
545 |
+
doc_df_elem_ret
|
546 |
+
)
|
547 |
|
548 |
+
_doc_df_ret_hidden = filter_df_ret(datastore.doc_raw_df)
|
|
|
|
|
|
|
549 |
doc_df_elem_ret_hidden = get_leaderboard_table(
|
550 |
_doc_df_ret_hidden, datastore.doc_types, visible=False
|
551 |
)
|
|
|
552 |
version.change(
|
553 |
+
update_doc_hidden_df_ret,
|
554 |
version,
|
555 |
+
doc_df_elem_ret_hidden
|
|
|
|
|
|
|
|
|
|
|
|
|
556 |
)
|
557 |
|
558 |
set_listeners(
|
|
|
583 |
queue=True,
|
584 |
)
|
585 |
with gr.TabItem("Reranking Only", id=22):
|
586 |
+
_doc_df_rerank = filter_df_rerank(datastore.doc_fmt_df)
|
|
|
|
|
|
|
587 |
doc_rerank_models = (
|
588 |
_doc_df_rerank[COL_NAME_RERANKING_MODEL].apply(remove_html).unique().tolist()
|
589 |
)
|
|
|
593 |
with gr.Column(scale=1):
|
594 |
doc_search_bar_rerank = gr.Textbox(show_label=False, visible=False)
|
595 |
doc_df_elem_rerank = get_leaderboard_table(_doc_df_rerank, datastore.doc_types)
|
596 |
+
version.change(
|
597 |
+
update_doc_df_rerank,
|
598 |
+
version,
|
599 |
+
doc_df_elem_rerank
|
600 |
+
)
|
601 |
+
|
602 |
+
_doc_df_rerank_hidden = filter_df_rerank(datastore.doc_raw_df)
|
603 |
doc_df_elem_rerank_hidden = get_leaderboard_table(
|
604 |
_doc_df_rerank_hidden, datastore.doc_types, visible=False
|
605 |
)
|
606 |
|
607 |
version.change(
|
608 |
+
update_doc_hidden_df_rerank,
|
609 |
version,
|
610 |
+
doc_df_elem_rerank_hidden
|
611 |
)
|
612 |
|
613 |
set_listeners(
|