H2H-eval-comparator

Sleeping

App Files Files Community

rohansampath committed on Feb 26

Commit

e136af0

verified ·

1 Parent(s): eb1aa5a

Create modules/ui_components.py

Browse files

Files changed (1) hide show

modules/ui_components.py +99 -0

modules/ui_components.py ADDED Viewed

	@@ -0,0 +1,99 @@

+import gradio as gr
+# Custom stylesheet for the app: spaces #preview_header, styles #preview_table, centers h1 headings, and defines the .section-divider, .config-box, .center-divider and .error-message classes (presumably passed to the Gradio app's css option - confirm at the call site).
+CSS = """
+#preview_header {
+    margin-bottom: 10px;
+    margin-top: 5px;
+}
+#preview_table {
+    background-color: #f8f9fa;
+    border-radius: 8px;
+    padding: 10px;
+}
+h1 {
+    text-align: center;
+}
+.section-divider {
+    border-top: 1px solid #ddd;
+    margin: 12px 0;
+}
+.config-box {
+    border: 1px solid #ddd;
+    border-radius: 8px;
+    padding: 15px;
+    margin: 10px;
+    background-color: #f9f9f9;
+}
+.center-divider {
+    display: flex;
+    justify-content: center;
+    height: 100%;
+}
+.error-message {
+    color: #d32f2f;
+    background-color: #ffebee;
+    padding: 10px;
+    border-radius: 4px;
+    margin: 10px 0;
+}
+"""
+def create_header():
+    """
+    Creates the main application header.
+    Returns:
+        list: List of header components.
+    """
+    title = gr.Markdown("# Head-to-Head Model Evaluation Comparator")
+    description = gr.Markdown("""
+    This demo evaluates two models (or one model with two different configs), head-to-head, on a benchmark dataset.
+    Available Datasets: [MMLU-Pro](https://huggingface.co/datasets/TIGER-Lab/MMLU-Pro)
+    """)
+    return [title, description]
+def create_results_section():
+    """
+    Creates the results section of the UI.
+    Returns:
+        dict: Dictionary containing results components.
+    """
+    with gr.Column(visible=False) as results_container:
+        results_output = gr.Markdown(label="Evaluation Results")
+        # Results table - Initially hidden until evaluation completes
+        with gr.Column(visible=False) as results_table_container:
+            with gr.Row():
+                results_table = gr.DataFrame(
+                    interactive=True,
+                    label="Detailed Results (Sortable)",
+                    visible=True
+                )
+    return {
+        'container': results_container,
+        'output': results_output,
+        'table_container': results_table_container,
+        'table': results_table
+    }
+def create_action_buttons():
+    """
+    Creates the action buttons for evaluation.
+    Returns:
+        dict: Dictionary containing button components.
+    """
+    with gr.Row():
+        with gr.Column(scale=1):
+            eval_button = gr.Button("Run MMLU-Pro Evaluation", variant="primary", interactive=False)
+            cancel_button = gr.Button("Cancel Evaluation", variant="stop", visible=False)
+    return {
+        'eval_button': eval_button,
+        'cancel_button': cancel_button
+    }