Spaces:

LLM360
/

de-arena

Running

App Files Files Community

yzabc007 committed on Oct 21, 2024

Commit

11b03a4

1 Parent(s): accff44

Update space

Browse files

Files changed (1) hide show

app.py +25 -2

app.py CHANGED Viewed

@@ -128,6 +128,29 @@ def overall_leaderboard(dataframe):
     )
 demo = gr.Blocks(css=custom_css)
 with demo:
@@ -139,7 +162,7 @@ with demo:
     INTRODUCTION_TEXT_FONT_SIZE = 16
     INTRODUCTION_TEXT = (
         f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
-        '<strong>Decentralized Arena</strong> automates,  scales, and accelerates "<a href="https://lmarena.ai/">Chatbot Arena</a>" '
         'for large language model (LLM) evaluation across diverse, fine-grained dimensions, '
         'such as mathematics (algebra, geometry, probability), logical reasoning, social reasoning, science (chemistry, physics, biology), or any user-defined dimensions. '
         'The evaluation is decentralized and democratic, with all participating LLMs assessing each other to ensure unbiased and fair results. '
@@ -175,7 +198,7 @@ with demo:
             TEXT = (
                 f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
-                'Total #models: 57 (Last updated: 2024-10-21)'
                 '</p>'
                 f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
                 'This page prvovides a comprehensive overview of model ranks across various dimensions, based on their averaged ranks. '

     )
+# Your leaderboard name
+TITLE = """<h1 align="center" id="space-title">Decentralized Arena Leaderboard</h1>"""
+SUB_TITLE = """<h2 align="center" id="space-subtitle">Automated, Robust, and Transparent LLM Evaluation for Numerous Dimensions</h2>"""
+EXTERNAL_LINKS = """
+<h2 align="center" id="space-links">
+    <a href="https://de-arena.maitrix.org/" target="_blank">Blog</a> |
+    <a href="https://github.com/maitrix-org/de-arena" target="_blank">GitHub</a> |
+    <a href="https://de-arena.maitrix.org/images/Heading.mp4" target="">Video</a> |
+    <a href="https://maitrix.org/" target="_blank">@Maitrix.org</a> |
+    <a href="https://www.llm360.ai/" target="_blank">@LLM360</a>
+</h2>
+"""
+# What does your leaderboard evaluate?
+INTRODUCTION_TEXT = """
+**Decentralized Arena** automates and scales "Chatbot Arena" for LLM evaluation across various fine-grained dimensions
+(e.g., math – algebra, geometry, probability; logical reasoning, social reasoning, biology, chemistry, …).
+The evaluation is decentralized and democratic, with all LLMs participating in evaluating others.
+It achieves a 95\% correlation with Chatbot Arena's overall rankings, while being fully transparent and reproducible.
+"""
 demo = gr.Blocks(css=custom_css)
 with demo:
     INTRODUCTION_TEXT_FONT_SIZE = 16
     INTRODUCTION_TEXT = (
         f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
+        '<strong>Decentralized Arena</strong> automates,  scales, and accelerates <a href="https://lmarena.ai/">Chatbot Arena</a> '
         'for large language model (LLM) evaluation across diverse, fine-grained dimensions, '
         'such as mathematics (algebra, geometry, probability), logical reasoning, social reasoning, science (chemistry, physics, biology), or any user-defined dimensions. '
         'The evaluation is decentralized and democratic, with all participating LLMs assessing each other to ensure unbiased and fair results. '
             TEXT = (
                 f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
+                '<b>Total #models: 57 (Last updated: 2024-10-21)</b>'
                 '</p>'
                 f'<p style="font-size:{INTRODUCTION_TEXT_FONT_SIZE}px;">'
                 'This page prvovides a comprehensive overview of model ranks across various dimensions, based on their averaged ranks. '