Spaces:

alexandrainst
/

zero-shot-classification

Running

App Files Files Community

saattrupdan committed on Dec 1, 2022

Commit

41bb40c

1 Parent(s): efd38a2

feat: Update app

Browse files

Files changed (1) hide show

app.py +37 -13

app.py CHANGED Viewed

@@ -11,6 +11,15 @@ classifier = pipeline(
 )
 def classification(task: str, doc: str) -> str:
     """Classify text into categories.
@@ -93,40 +102,55 @@ def classification(task: str, doc: str) -> str:
                 "sport",
             ]
-    # Else if the task is offensive text detection, classify the text into offensive
-    # or not offensive
-    elif task == "Offensive text detection":
         if language == "sv":
-            hypothesis_template = "Detta exempel er {}."
-            candidate_labels = ["stötande", "inte stötande"]
         elif language == "no":
-            hypothesis_template = "Dette eksemplet er {}."
-            candidate_labels = ["støtende", "ikke støtende"]
         else:
-            hypothesis_template = "Dette eksempel er {}."
-            candidate_labels = ["anstødig tale", "ikke anstødig tale"]
     # Else the task is not supported, so raise an error
     else:
         raise ValueError(f"Task {task} not supported.")
     # Run the classifier on the text
     result = classifier(
-        doc, candidate_labels=candidate_labels, hypothesis_template=hypothesis_template
     )
     print(result)
     # Return the predicted label
     return (
-        f"{result['labels'][0].capitalize()}\n"
         f"({confidence_str}: {result['scores'][0]:.0%})"
     )
 # Create a dropdown menu for the task
 dropdown = gr.inputs.Dropdown(
     label="Task",
-    choices=["Sentiment classification", "News topic classification", "Offensive text detection"],
     default="Sentiment classification",
 )
@@ -136,7 +160,7 @@ interface = gr.Interface(
     inputs=[dropdown, gr.inputs.Textbox(label="Text")],
     outputs=gr.outputs.Label(type="text"),
     title="Scandinavian zero-shot text classification",
-    description="Classify text in Danish, Swedish or Norwegian into categories, without any training data!",
 )
 # Run the app

 )
+# Set the description for the interface
+DESCRIPTION = """Classify text in Danish, Swedish or Norwegian into categories, without
+any training data!
+Note that the models will most likely *not* work as well as a finetuned model on your
+specific data, but they can be used as a starting point for your own classification
+task ✨"""
 def classification(task: str, doc: str) -> str:
     """Classify text into categories.
                 "sport",
             ]
+    # Else if the task is spam detection, classify the text into spam or not spam
+    elif task == "Spam detection":
         if language == "sv":
+            hypothesis_template = "Det här e-postmeddelandet ser {}"
+            candidate_labels = {
+                "ut som ett skräppostmeddelande": "Spam",
+                "inte ut som ett skräppostmeddelande": "Inte spam",
+            }
         elif language == "no":
+            hypothesis_template = "Denne e-posten ser {}"
+            candidate_labels = {
+                "ut som en spam-e-post": "Spam",
+                "ikke ut som en spam-e-post": "Ikke spam",
+            }
         else:
+            hypothesis_template = "Denne e-mail ligner {}"
+            candidate_labels = {
+                "en spam e-mail": "Spam",
+                "ikke en spam e-mail": "Ikke spam",
+            }
     # Else the task is not supported, so raise an error
     else:
         raise ValueError(f"Task {task} not supported.")
+    # If `candidate_labels` is a list, convert it to a dictionary that maps each label
+    # to its capitalized form, which is the text returned as the predicted label
+    if isinstance(candidate_labels, list):
+        candidate_labels = {label: label.capitalize() for label in candidate_labels}
     # Run the classifier on the text
     result = classifier(
+        doc,
+        candidate_labels=list(candidate_labels.keys()),
+        hypothesis_template=hypothesis_template,
     )
     print(result)
     # Return the predicted label
     return (
+        f"{candidate_labels[result['labels'][0]]}\n"
         f"({confidence_str}: {result['scores'][0]:.0%})"
     )
 # Create a dropdown menu for the task
 dropdown = gr.inputs.Dropdown(
     label="Task",
+    choices=["Sentiment classification", "News topic classification", "Spam detection"],
     default="Sentiment classification",
 )
     inputs=[dropdown, gr.inputs.Textbox(label="Text")],
     outputs=gr.outputs.Label(type="text"),
     title="Scandinavian zero-shot text classification",
+    description=DESCRIPTION,
 )
 # Run the app