Spaces:
Running
Running
intro added with paper/artifacts
Browse files
app.py
CHANGED
@@ -4,10 +4,24 @@ import numpy as np
|
|
4 |
from gradio_leaderboard import Leaderboard, SelectColumns, ColumnFilter
|
5 |
|
6 |
# Define constants and enums
|
7 |
-
TITLE = "<h1>M-RewardBench Leaderboard</h1>"
|
8 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9 |
GOOGLE_SHEET_URL = "https://docs.google.com/spreadsheets/d/1qrD7plUdrBwAw7G6UeDVZAaV9ihxaNAcoiKwSaqotR4/export?gid=0&format=csv"
|
10 |
-
ABOUT_TEXT = """
|
|
|
|
|
|
|
|
|
|
|
11 |
|
12 |
|
13 |
class AutoEvalColumn:
|
@@ -111,6 +125,7 @@ def format_with_color(val, min_val=50, max_val=100):
|
|
111 |
return str(val)
|
112 |
|
113 |
demo = gr.Blocks(theme=gr.themes.Soft())
|
|
|
114 |
with demo:
|
115 |
gr.HTML(TITLE)
|
116 |
gr.Markdown(INTRODUCTION_TEXT)
|
@@ -153,6 +168,23 @@ with demo:
|
|
153 |
AutoEvalColumn.add_columns_from_df(df, numeric_cols)
|
154 |
|
155 |
leaderboard = init_leaderboard(df)
|
156 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
157 |
|
158 |
demo.launch(ssr_mode=False)
|
|
|
4 |
from gradio_leaderboard import Leaderboard, SelectColumns, ColumnFilter
|
5 |
|
6 |
# Define constants and enums
|
7 |
+
# TITLE = "<h1>M-RewardBench Leaderboard</h1>"
|
8 |
+
TITLE = '''<h1>
|
9 |
+
<span style="font-variant: small-caps;">M-RewardBench</span>: Evaluating Reward Models in Multilingual Settings
|
10 |
+
</h1>'''
|
11 |
+
INTRODUCTION_TEXT = '''
|
12 |
+
Evaluating the chat, safety, reasoning, and translation capabilities of Multilingual Reward Models.
|
13 |
+
|
14 |
+
📄 [Paper](https://arxiv.org/pdf/2410.15522.pdf) | 💻 [Code](https://github.com/for-ai/m-rewardbench) | 🤗 [Dataset](https://hf.co/datasets/C4AI-Community/multilingual-reward-bench) | 📚 [arXiv](https://arxiv.org/abs/2410.15522) | 🏆 [Leaderboard](https://c4ai-community-m-rewardbench.hf.space/)
|
15 |
+
|
16 |
+
🌐 https://m-rewardbench.github.io/'''
|
17 |
+
|
18 |
GOOGLE_SHEET_URL = "https://docs.google.com/spreadsheets/d/1qrD7plUdrBwAw7G6UeDVZAaV9ihxaNAcoiKwSaqotR4/export?gid=0&format=csv"
|
19 |
+
# ABOUT_TEXT = """
|
20 |
+
# <h1>
|
21 |
+
# <span style="font-variant: small-caps;">M-RewardBench</span>: Evaluating Reward Models in Multilingual Settings
|
22 |
+
# </h1>
|
23 |
+
|
24 |
+
# Welcome to M-RewardBench Leaderboard!"""
|
25 |
|
26 |
|
27 |
class AutoEvalColumn:
|
|
|
125 |
return str(val)
|
126 |
|
127 |
demo = gr.Blocks(theme=gr.themes.Soft())
|
128 |
+
|
129 |
with demo:
|
130 |
gr.HTML(TITLE)
|
131 |
gr.Markdown(INTRODUCTION_TEXT)
|
|
|
168 |
AutoEvalColumn.add_columns_from_df(df, numeric_cols)
|
169 |
|
170 |
leaderboard = init_leaderboard(df)
|
171 |
+
|
172 |
+
with gr.Row():
|
173 |
+
with gr.Accordion("π Citation", open=False):
|
174 |
+
citation_button = gr.Textbox(
|
175 |
+
value=r"""@misc{gureja2024mrewardbench,
|
176 |
+
title={M-RewardBench: Evaluating Reward Models in Multilingual Settings},
|
177 |
+
author={Srishti Gureja and Lester James V. Miranda and Shayekh Bin Islam and Rishabh Maheshwary and Drishti Sharma and Gusti Winata and Nathan Lambert and Sebastian Ruder and Sara Hooker and Marzieh Fadaee},
|
178 |
+
year={2024},
|
179 |
+
eprint={2410.15522},
|
180 |
+
archivePrefix={arXiv},
|
181 |
+
primaryClass={cs.CL},
|
182 |
+
url={https://arxiv.org/abs/2410.15522},
|
183 |
+
}""",
|
184 |
+
lines=7,
|
185 |
+
label="BibTeX",
|
186 |
+
elem_id="citation-button",
|
187 |
+
show_copy_button=True,
|
188 |
+
)
|
189 |
|
190 |
demo.launch(ssr_mode=False)
|