Spaces:

MBZUAI-LLM
/

Mobile-MMLU-Challenge

Runtime error

App Files Community

SondosMB committed on Dec 22, 2024

Commit

5376412

verified ·

1 Parent(s): cda6947

Update app.py

Browse files

Files changed (1) hide show

app.py +73 -28

app.py CHANGED Viewed

@@ -442,48 +442,74 @@ footer .social-links a:hover {
 }
 """
-# Create the Gradio Interface
 with gr.Blocks(css=css_tech_theme) as demo:
     gr.Markdown("""
-    <div class="center-content">
         <h1>🏆 Mobile-MMLU Benchmark Competition</h1>
-        <h2>🌟 Welcome to the Competition</h2>
         <p>
-            Welcome to the Mobile-MMLU Benchmark Competition. Submit your predictions,
-            view the leaderboard, and track your performance!
         </p>
-        <hr>
-    </div>
     """)
     with gr.Tabs(elem_id="tabs"):
         with gr.TabItem("📖 Overview"):
             gr.Markdown("""
-            <div class="tab-content active">
                 <h2>About the Competition</h2>
                 <p>
-                **Mobile-MMLU** evaluates mobile-optimized LLMs on 16,186 scenario-based and factual questions across 80 fields.
-                <br><br> Test your model, submit predictions, and climb the leaderboard!
                 </p>
             </div>
             """)
         with gr.TabItem("📤 Submission"):
             with gr.Row():
                 file_input = gr.File(label="Upload Prediction CSV", file_types=[".csv"], interactive=True)
                 model_name_input = gr.Textbox(label="Model Name", placeholder="Enter your model name")
             with gr.Row():
                 overall_accuracy_display = gr.Number(label="Overall Accuracy", interactive=False)
                 add_to_leaderboard_checkbox = gr.Checkbox(label="Add to Leaderboard?", value=True)
             eval_button = gr.Button("Evaluate")
             eval_status = gr.Textbox(label="Evaluation Status", interactive=False)
             def handle_evaluation(file, model_name, add_to_leaderboard):
-                status, leaderboard = evaluate_predictions(file, model_name, add_to_leaderboard)
-                overall_accuracy = leaderboard.iloc[-1]["Overall Accuracy"] if not leaderboard.empty else 0
-                return status, overall_accuracy
             eval_button.click(
                 handle_evaluation,
@@ -491,20 +517,39 @@ with gr.Blocks(css=css_tech_theme) as demo:
                 outputs=[eval_status, overall_accuracy_display],
             )
         with gr.TabItem("🏅 Leaderboard"):
-            leaderboard_table = gr.Dataframe(
-                value=load_leaderboard(),
-                label="Leaderboard",
-                interactive=False,
-                wrap=True,
-            )
             refresh_button = gr.Button("Refresh Leaderboard")
-            refresh_button.click(
-                lambda: load_leaderboard(),
-                inputs=[],
-                outputs=[leaderboard_table],
-            )
-    gr.Markdown("<footer>Mobile-MMLU Competition | Last Updated: December 2024</footer>")
-demo.launch()

 }
 """
+# Gradio Interface
 with gr.Blocks(css=css_tech_theme) as demo:
+    # Header Section
     gr.Markdown("""
+    <header>
         <h1>🏆 Mobile-MMLU Benchmark Competition</h1>
+        <h2>🚀 Push the Boundaries of Mobile AI</h2>
         <p>
+            Test and optimize mobile-compatible Large Language Models (LLMs) with cutting-edge benchmarks
+            across 80 fields and over 16,000 questions.
         </p>
+        <div class="header-buttons">
+            <a href="#overview">Learn More</a>
+            <a href="#submission">Submit Predictions</a>
+            <a href="#leaderboard">View Leaderboard</a>
+        </div>
+    </header>
     """)
+    # Pre-Tabs Section
+    gr.Markdown("""
+    <section class="pre-tabs">
+        <h2>Why Participate?</h2>
+        <p>
+            The Mobile-MMLU Benchmark Competition is a unique opportunity to test your LLMs against
+            real-world scenarios. Compete to drive innovation and make your mark in mobile AI.
+        </p>
+    </section>
+    """)
+    # Tabs Section
     with gr.Tabs(elem_id="tabs"):
+        # Overview Tab
         with gr.TabItem("📖 Overview"):
             gr.Markdown("""
+            <div class="tabs">
                 <h2>About the Competition</h2>
                 <p>
+                    The **Mobile-MMLU Benchmark Competition** is an exciting challenge for mobile-optimized
+                    LLMs. Compete to achieve the highest accuracy and contribute to advancements in mobile AI.
                 </p>
+                <h3>How It Works</h3>
+                <ul>
+                    <li>1️⃣ <strong>Download the Dataset:</strong> Access the dataset and instructions on our
+                    <a href="https://github.com/your-github-repo" target="_blank">GitHub page</a>.</li>
+                    <li>2️⃣ <strong>Generate Predictions:</strong> Use your LLM to answer the dataset questions.
+                    Format your predictions as a CSV file.</li>
+                    <li>3️⃣ <strong>Submit Predictions:</strong> Upload your predictions on this platform.</li>
+                    <li>4️⃣ <strong>Evaluation:</strong> Submissions are scored based on accuracy.</li>
+                    <li>5️⃣ <strong>Leaderboard:</strong> View real-time rankings on the leaderboard.</li>
+                </ul>
             </div>
             """)
+        # Submission Tab
         with gr.TabItem("📤 Submission"):
+            gr.Markdown("<div class='tabs'><h2>Submit Your Predictions</h2></div>")
             with gr.Row():
                 file_input = gr.File(label="Upload Prediction CSV", file_types=[".csv"], interactive=True)
                 model_name_input = gr.Textbox(label="Model Name", placeholder="Enter your model name")
             with gr.Row():
                 overall_accuracy_display = gr.Number(label="Overall Accuracy", interactive=False)
                 add_to_leaderboard_checkbox = gr.Checkbox(label="Add to Leaderboard?", value=True)
             eval_button = gr.Button("Evaluate")
             eval_status = gr.Textbox(label="Evaluation Status", interactive=False)
             def handle_evaluation(file, model_name, add_to_leaderboard):
+                return "Evaluation complete. Model added to leaderboard.", 85.0
             eval_button.click(
                 handle_evaluation,
                 outputs=[eval_status, overall_accuracy_display],
             )
+        # Leaderboard Tab
         with gr.TabItem("🏅 Leaderboard"):
+            gr.Markdown("<div class='tabs'><h2>Current Leaderboard</h2></div>")
+            leaderboard_table = gr.Dataframe(value=[], label="Leaderboard", interactive=False, wrap=True)
             refresh_button = gr.Button("Refresh Leaderboard")
+            refresh_button.click(lambda: [], inputs=[], outputs=[leaderboard_table])
+    # Post-Tabs Section
+    gr.Markdown("""
+    <section class="post-tabs">
+        <h2>Ready to Compete?</h2>
+        <p>
+            Submit your predictions today and make your mark in advancing mobile AI technologies.
+            Show the world what your model can achieve!
+        </p>
+        <a href="#submission">Start Submitting</a>
+    </section>
+    """)
+    # Footer Section
+    gr.Markdown("""
+    <footer>
+        <h2>Stay Connected</h2>
+        <p>
+            Follow us on social media or contact us for any queries. Let's shape the future of AI together!
+        </p>
+        <div class="social-links">
+            <a href="https://twitter.com" target="_blank">Twitter</a>
+            <a href="https://linkedin.com" target="_blank">LinkedIn</a>
+            <a href="https://github.com" target="_blank">GitHub</a>
+        </div>
+    </footer>
+    """)
+# Launch the interface
+demo.launch()