Spaces:
Running
Running
Update src/streamlit_app.py
Browse files- src/streamlit_app.py +33 -1
src/streamlit_app.py
CHANGED
@@ -4,6 +4,38 @@ import pandas as pd
|
|
4 |
# ─── Page config ──────────────────────────────────────────────────────────────
|
5 |
st.set_page_config(page_title="ExpertLongBench Leaderboard", layout="wide")
|
6 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7 |
# ─── Load data ────────────────────────────────────────────────────────────────
|
8 |
@st.cache_data
|
9 |
def load_data(path="src/models.json"):
|
@@ -25,7 +57,7 @@ max_ranks = {col: df[f"{col}_rank"].max() for col in score_cols}
|
|
25 |
tab1, tab2 = st.tabs(["Leaderboard", "Benchmark Details"])
|
26 |
|
27 |
with tab1:
|
28 |
-
st.markdown("**Leaderboard:** higher scores shaded green; best models bolded.")
|
29 |
# Build raw HTML table
|
30 |
cols = ["Model"] + [f"T{i}" for i in range(1,12)] + ["Avg"]
|
31 |
html = "<table style='border-collapse:collapse; width:100%; font-size:14px;'>"
|
|
|
4 |
# ─── Page config ──────────────────────────────────────────────────────────────
|
5 |
st.set_page_config(page_title="ExpertLongBench Leaderboard", layout="wide")
|
6 |
|
7 |
+
|
8 |
+
logo_image = Image.open("./expertlongbench.png")
|
9 |
+
|
10 |
+
# Display logo
|
11 |
+
buffered = BytesIO()
|
12 |
+
logo_image.save(buffered, format="PNG")
|
13 |
+
img_data = base64.b64encode(buffered.getvalue()).decode("utf-8")
|
14 |
+
|
15 |
+
st.markdown(
|
16 |
+
f"""
|
17 |
+
<div class="logo-container" style="display:flex; justify-content: center;">
|
18 |
+
<img src="data:image/png;base64,{img_data}" style="width:50%; max-width:700px;"/>
|
19 |
+
</div>
|
20 |
+
""",
|
21 |
+
unsafe_allow_html=True
|
22 |
+
)
|
23 |
+
|
24 |
+
st.markdown(
|
25 |
+
'''
|
26 |
+
<div class="header">
|
27 |
+
<br/>
|
28 |
+
<p style="font-size:22px;">
|
29 |
+
VERIFACT: Enhancing Long-Form Factuality Evaluation with Refined Fact Extraction and Reference Facts
|
30 |
+
</p>
|
31 |
+
<p style="font-size:20px;">
|
32 |
+
# 📑 <a href="">Paper</a> | 💻 <a href="">GitHub</a> | 🤗 <a href="">HuggingFace</a>
|
33 |
+
⚙️ <strong>Version</strong>: <strong>V1</strong> | <strong># Models</strong>: 12 | Updated: <strong>April 2025</strong>
|
34 |
+
</p>
|
35 |
+
</div>
|
36 |
+
''',
|
37 |
+
unsafe_allow_html=True
|
38 |
+
)
|
39 |
# ─── Load data ────────────────────────────────────────────────────────────────
|
40 |
@st.cache_data
|
41 |
def load_data(path="src/models.json"):
|
|
|
57 |
tab1, tab2 = st.tabs(["Leaderboard", "Benchmark Details"])
|
58 |
|
59 |
with tab1:
|
60 |
+
# st.markdown("**Leaderboard:** higher scores shaded green; best models bolded.")
|
61 |
# Build raw HTML table
|
62 |
cols = ["Model"] + [f"T{i}" for i in range(1,12)] + ["Avg"]
|
63 |
html = "<table style='border-collapse:collapse; width:100%; font-size:14px;'>"
|