Spaces:

CultriX
/

Tiny-LeaderBoard

Running

CultriX committed on Dec 23, 2024

Commit

144fe6c

verified ·

1 Parent(s): 38e1340

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -166,10 +166,12 @@ def process_and_visualize(file_content):
     output_text = f"Average Performance per Model:\n{averages.sort_values(by='Average Performance').to_string()}"
-    return output_text, image_avg, image_line, image_heatmap, image_boxplot, plotly_avg, plotly_tasks
 if __name__ == "__main__":
     iface = gr.Interface(
         fn=process_and_visualize,
         inputs=gr.Textbox(lines=10, label="Paste your data here"),
@@ -180,8 +182,10 @@ if __name__ == "__main__":
             gr.Image(label="Matplotlib Task Performance Heatmap"),
             gr.Image(label="Matplotlib Performance Distribution Boxplot"),
             gr.HTML(label="Plotly Average Performance Chart"),
-            gr.Accordion(
-                [gr.HTML(label=f"Plotly {task} Chart") for task in ['tinyArc', 'tinyHellaswag', 'tinyMMLU', 'tinyTruthfulQA', 'tinyTruthfulQA_mc1', 'tinyWinogrande']], label="Task Charts"),
         ],
         title="LLM Benchmark Visualizer",
         description="Upload your LLM benchmark data and visualize the results."

     output_text = f"Average Performance per Model:\n{averages.sort_values(by='Average Performance').to_string()}"
+    return output_text, image_avg, image_line, image_heatmap, image_boxplot, plotly_avg, plotly_tasks, plotly_tasks
 if __name__ == "__main__":
+    task_names = ['tinyArc', 'tinyHellaswag', 'tinyMMLU', 'tinyTruthfulQA', 'tinyTruthfulQA_mc1', 'tinyWinogrande']
     iface = gr.Interface(
         fn=process_and_visualize,
         inputs=gr.Textbox(lines=10, label="Paste your data here"),
             gr.Image(label="Matplotlib Task Performance Heatmap"),
             gr.Image(label="Matplotlib Performance Distribution Boxplot"),
             gr.HTML(label="Plotly Average Performance Chart"),
+            gr.TabbedInterface(
+                [gr.HTML(label=f"Plotly {task} Chart") for task in task_names],
+                label="Task Charts"
+            ),
         ],
         title="LLM Benchmark Visualizer",
         description="Upload your LLM benchmark data and visualize the results."