Update src/leaderboard_formatting.py
src/leaderboard_formatting.py
CHANGED
@@ -1,5 +1,6 @@
 from typing import List
 
+# Common dictionary to map the columns names
 COLUMNS_PRETTY = {
     "bleu": "BLEU",
     "chrf": "ChrF",
@@ -25,7 +26,7 @@ COLUMNS_PRETTY = {
     "context": "Context",
 }
 
-
+# Add your metrics
 METRICS_PER_TASK = {
     "commit_message_generation": [
         "BLEU",
@@ -58,6 +59,9 @@ METRICS_PER_TASK = {
         "ChrF",
         "API Recall",
     ],
+    "ci_builds_repair": [
+        "Pass@1",
+    ]
 }
 
 
@@ -67,6 +71,7 @@ SORT_COLUMN_PER_TASK = {
     "bug_localization": "Model Name",
     "module_summarization": "CompScore",
     "library_based_code_generation": "API Recall",
+    "ci_builds_repair": "Pass@1"
 }
 
 
@@ -83,6 +88,9 @@ def get_columns_per_task(task_id: str) -> List[str]:
     if task_id == 'library_based_code_generation':
         return ["Model Name", "Context"] + metrics_per_task + ["Availability", "Submitted By", "Resources"]
 
+    if task_id == 'ci_builds_repair':
+        return ["Model Name", "Context Size"] + metrics_per_task + ["Availability", "Submitted By", "Resources"]
+
     return ["Model Name", "Context Size", "Availability"] + metrics_per_task + ["Submitted By", "Resources"]
 
 
@@ -92,4 +100,6 @@ def get_types_per_task(task_id: str) -> List[str]:
         return ["html", "markdown", "markdown", "html"] + ["number" for _ in metrics_per_task] + ["markdown", "markdown", "html"]
     if task_id == 'bug_localization':
         return ["html", "markdown", "markdown", "html"] + ["number" for _ in metrics_per_task] + ["markdown", "html"]
+    if task_id == 'ci_builds_repair':
+        return ["html", "markdown"] + ["number" for _ in metrics_per_task] + ["markdown", "markdown", "html"]
     return ["html", "markdown", "markdown"] + ["number" for _ in metrics_per_task] + ["markdown", "html"]
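
As a quick sanity check, here is a minimal sketch of how the new ci_builds_repair entries line up with each other. It assumes the module is importable as src.leaderboard_formatting from the repository root and that metrics_per_task inside the helpers is looked up from METRICS_PER_TASK, which is not visible in these hunks; the exact call sites in the leaderboard app are not shown in this commit.

from src.leaderboard_formatting import (
    METRICS_PER_TASK,
    SORT_COLUMN_PER_TASK,
    get_columns_per_task,
    get_types_per_task,
)

# Column headers and per-column datatypes for the new CI builds repair tab.
columns = get_columns_per_task("ci_builds_repair")
types = get_types_per_task("ci_builds_repair")

# Expected, given the branches added in this commit:
# columns -> ["Model Name", "Context Size", "Pass@1", "Availability", "Submitted By", "Resources"]
# types   -> ["html", "markdown", "number", "markdown", "markdown", "html"]
assert len(columns) == len(types), "every column needs a matching datatype"

# The default sort column should be one of the task's metric columns.
assert SORT_COLUMN_PER_TASK["ci_builds_repair"] in METRICS_PER_TASK["ci_builds_repair"]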