Leaderboard_test

Sleeping

App Files Files Community

bgamazay committed on Feb 6

Commit

077e5da

verified ·

1 Parent(s): 090369e

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -38

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ CITATION_BUTTON_TEXT = r"""@misc{aienergyscore-leaderboard,
     howpublished = "\url{https://huggingface.co/spaces/AIEnergyScore/Leaderboard}",
 }"""
-# List of tasks (CSV filenames)
 tasks = [
     'asr.csv',
     'object_detection.csv',
@@ -30,49 +30,68 @@ def format_stars(score):
         score_int = int(score)
     except Exception:
         score_int = 0
-    return f'<span style="color: #3fa45bff !important; font-size:2em !important;">{"★" * score_int}</span>'
 def make_link(mname):
     parts = str(mname).split('/')
     display_name = parts[1] if len(parts) > 1 else mname
     return f'[{display_name}](https://huggingface.co/{mname})'
 def get_plots(task):
     df = pd.read_csv('data/energy/' + task)
     if df.columns[0].startswith("Unnamed:"):
         df = df.iloc[:, 1:]
-    df['energy_score'] = df['energy_score'].astype(int)
     df['Display Model'] = df['model'].apply(lambda m: m.split('/')[-1])
     color_map = {1: "red", 2: "orange", 3: "yellow", 4: "lightgreen", 5: "green"}
     fig = px.scatter(
         df,
-        x="total_gpu_energy",  # Ensure correct column for x-axis
-        y="Display Model",  # Keep model name for y-axis
-        color="energy_score",  # Ensure correct column for point color
-        custom_data=['energy_score'],
         height=500,
         width=800,
-        color_discrete_map=color_map
     )
     fig.update_traces(
-        hovertemplate="<br>".join([
-            "Model: %{y}",
-            "GPU Energy (Wh): %{x}",
-            "Energy Score: %{customdata[0]}"
-        ])
     )
-    fig.update_layout(xaxis_title="GPU Energy (Wh)", yaxis_title="Model")
     return fig
 def get_all_plots():
     all_df = pd.DataFrame()
     for task in tasks:
         df = pd.read_csv('data/energy/' + task)
         if df.columns[0].startswith("Unnamed:"):
             df = df.iloc[:, 1:]
-        df['energy_score'] = df['energy_score'].astype(int)
         df['Display Model'] = df['model'].apply(lambda m: m.split('/')[-1])
         all_df = pd.concat([all_df, df], ignore_index=True)
     all_df = all_df.drop_duplicates(subset=['model'])
@@ -81,38 +100,41 @@ def get_all_plots():
     fig = px.scatter(
         all_df,
-        x="total_gpu_energy",  # Ensure correct column for x-axis
         y="Display Model",
-        color="energy_score",  # Ensure correct column for point color
-        custom_data=['energy_score'],
         height=500,
         width=800,
-        color_discrete_map=color_map
     )
     fig.update_traces(
-        hovertemplate="<br>".join([
-            "Model: %{y}",
-            "GPU Energy (Wh): %{x}",
-            "Energy Score: %{customdata[0]}"
-        ])
     )
-    fig.update_layout(xaxis_title="GPU Energy (Wh)", yaxis_title="Model")
     return fig
 def get_model_names(task):
     """
     For a given task, load the energy CSV and return a dataframe with the following columns:
       - Model (a markdown link)
-      - GPU Energy (Wh) formatted as a string with 4 decimal places
       - Score (a star rating based on energy_score)
-    For text_generation.csv only, also add the "Class" column from the CSV.
-    The final column order is: Model, GPU Energy (Wh), Score, [Class].
     """
     df = pd.read_csv('data/energy/' + task)
     if df.columns[0].startswith("Unnamed:"):
         df = df.iloc[:, 1:]
-    df['energy_score'] = df['energy_score'].astype(int)
-    # Format the energy as a string with 4 decimals
     df['GPU Energy (Wh)'] = df['total_gpu_energy'].apply(lambda x: f"{x:.4f}")
     df['Model'] = df['model'].apply(make_link)
     df['Score'] = df['energy_score'].apply(format_stars)
@@ -123,13 +145,14 @@ def get_model_names(task):
     else:
         df = df[['Model', 'GPU Energy (Wh)', 'Score']]
-    df = df.sort_values(by='GPU Energy (Wh)')
     return df
 def get_all_model_names():
     """
     Combine data from all tasks and return a leaderboard table with:
-      - Model, GPU Energy (Wh), Score
     Duplicate models are dropped.
     """
     all_df = pd.DataFrame()
@@ -137,17 +160,18 @@ def get_all_model_names():
         df = pd.read_csv('data/energy/' + task)
         if df.columns[0].startswith("Unnamed:"):
             df = df.iloc[:, 1:]
-        df['energy_score'] = df['energy_score'].astype(int)
         df['GPU Energy (Wh)'] = df['total_gpu_energy'].apply(lambda x: f"{x:.4f}")
         df['Model'] = df['model'].apply(make_link)
         df['Score'] = df['energy_score'].apply(format_stars)
         all_df = pd.concat([all_df, df], ignore_index=True)
     all_df = all_df.drop_duplicates(subset=['model'])
-    all_df = all_df.sort_values(by='GPU Energy (Wh)')
     return all_df[['Model', 'GPU Energy (Wh)', 'Score']]
 # Build the Gradio interface.
-# The css argument below makes all tables (e.g. leaderboard) use a fixed layout with narrower columns.
 demo = gr.Blocks(css="""
 .gr-dataframe table {
     table-layout: fixed;
@@ -257,8 +281,6 @@ Click through the tasks below to see how different models measure up in terms of
             lines=10,
             show_copy_button=True,
         )
-    gr.Markdown(
-        """Last updated: February 2025"""
-    )
 demo.launch()

     howpublished = "\url{https://huggingface.co/spaces/AIEnergyScore/Leaderboard}",
 }"""
+# List of CSV filenames (one per task)
 tasks = [
     'asr.csv',
     'object_detection.csv',
         score_int = int(score)
     except Exception:
         score_int = 0
+    # Display a star rating (★) based on the energy score.
+    return f'<span style="color: #3fa45bff; font-size:2em;">{"★" * score_int}</span>'
 def make_link(mname):
+    # Make a Markdown link from the model name.
     parts = str(mname).split('/')
     display_name = parts[1] if len(parts) > 1 else mname
     return f'[{display_name}](https://huggingface.co/{mname})'
 def get_plots(task):
+    # Read the CSV for the given task.
     df = pd.read_csv('data/energy/' + task)
+    # If the first column is unnamed (the extra blank column), drop it.
     if df.columns[0].startswith("Unnamed:"):
         df = df.iloc[:, 1:]
+    # Convert the numeric columns
+    df['total_gpu_energy'] = pd.to_numeric(df['total_gpu_energy'], errors='coerce')
+    df['energy_score'] = pd.to_numeric(df['energy_score'], errors='coerce').astype(int)
+    # Create a short version of the model name for display on the y-axis.
     df['Display Model'] = df['model'].apply(lambda m: m.split('/')[-1])
+    # Define a discrete color mapping for energy scores.
     color_map = {1: "red", 2: "orange", 3: "yellow", 4: "lightgreen", 5: "green"}
+    # Build a scatter plot:
+    #  - x-axis: total_gpu_energy
+    #  - y-axis: Display Model (short model name)
+    #  - Color: energy_score
+    #  - Custom tooltip will include the full model name, energy value and energy score.
     fig = px.scatter(
         df,
+        x="total_gpu_energy",
+        y="Display Model",
+        color="energy_score",
+        custom_data=['model', 'total_gpu_energy', 'energy_score'],
         height=500,
         width=800,
+        color_discrete_map=color_map,
     )
     fig.update_traces(
+        hovertemplate=(
+            "Model: %{customdata[0]}<br>" +
+            "Total GPU Energy (Wh): %{customdata[1]:.4f}<br>" +
+            "Energy Score: %{customdata[2]}"
+        )
+    )
+    fig.update_layout(
+        xaxis_title="Total GPU Energy (Wh)",
+        yaxis_title="Model",
+        margin=dict(l=40, r=40, t=40, b=40)
     )
     return fig
 def get_all_plots():
+    # Combine data from all tasks.
     all_df = pd.DataFrame()
     for task in tasks:
         df = pd.read_csv('data/energy/' + task)
         if df.columns[0].startswith("Unnamed:"):
             df = df.iloc[:, 1:]
+        df['total_gpu_energy'] = pd.to_numeric(df['total_gpu_energy'], errors='coerce')
+        df['energy_score'] = pd.to_numeric(df['energy_score'], errors='coerce').astype(int)
         df['Display Model'] = df['model'].apply(lambda m: m.split('/')[-1])
         all_df = pd.concat([all_df, df], ignore_index=True)
     all_df = all_df.drop_duplicates(subset=['model'])
     fig = px.scatter(
         all_df,
+        x="total_gpu_energy",
         y="Display Model",
+        color="energy_score",
+        custom_data=['model', 'total_gpu_energy', 'energy_score'],
         height=500,
         width=800,
+        color_discrete_map=color_map,
     )
     fig.update_traces(
+        hovertemplate=(
+            "Model: %{customdata[0]}<br>" +
+            "Total GPU Energy (Wh): %{customdata[1]:.4f}<br>" +
+            "Energy Score: %{customdata[2]}"
+        )
+    )
+    fig.update_layout(
+        xaxis_title="Total GPU Energy (Wh)",
+        yaxis_title="Model",
+        margin=dict(l=40, r=40, t=40, b=40)
     )
     return fig
 def get_model_names(task):
     """
     For a given task, load the energy CSV and return a dataframe with the following columns:
       - Model (a markdown link)
+      - GPU Energy (Wh) (formatted to 4 decimal places)
       - Score (a star rating based on energy_score)
+    For text_generation.csv only, also include the "Class" column if it exists.
     """
     df = pd.read_csv('data/energy/' + task)
     if df.columns[0].startswith("Unnamed:"):
         df = df.iloc[:, 1:]
+    df['total_gpu_energy'] = pd.to_numeric(df['total_gpu_energy'], errors='coerce')
+    df['energy_score'] = pd.to_numeric(df['energy_score'], errors='coerce').astype(int)
     df['GPU Energy (Wh)'] = df['total_gpu_energy'].apply(lambda x: f"{x:.4f}")
     df['Model'] = df['model'].apply(make_link)
     df['Score'] = df['energy_score'].apply(format_stars)
     else:
         df = df[['Model', 'GPU Energy (Wh)', 'Score']]
+    # Sort by the numeric energy value.
+    df = df.sort_values(by='total_gpu_energy')
     return df
 def get_all_model_names():
     """
     Combine data from all tasks and return a leaderboard table with:
+      - Model, GPU Energy (Wh), Score.
     Duplicate models are dropped.
     """
     all_df = pd.DataFrame()
         df = pd.read_csv('data/energy/' + task)
         if df.columns[0].startswith("Unnamed:"):
             df = df.iloc[:, 1:]
+        df['total_gpu_energy'] = pd.to_numeric(df['total_gpu_energy'], errors='coerce')
+        df['energy_score'] = pd.to_numeric(df['energy_score'], errors='coerce').astype(int)
         df['GPU Energy (Wh)'] = df['total_gpu_energy'].apply(lambda x: f"{x:.4f}")
         df['Model'] = df['model'].apply(make_link)
         df['Score'] = df['energy_score'].apply(format_stars)
         all_df = pd.concat([all_df, df], ignore_index=True)
     all_df = all_df.drop_duplicates(subset=['model'])
+    all_df = all_df.sort_values(by='total_gpu_energy')
     return all_df[['Model', 'GPU Energy (Wh)', 'Score']]
 # Build the Gradio interface.
+# The CSS below sets fixed layouts for tables.
 demo = gr.Blocks(css="""
 .gr-dataframe table {
     table-layout: fixed;
             lines=10,
             show_copy_button=True,
         )
+    gr.Markdown("Last updated: February 2025")
 demo.launch()