param-bharat
/

ModernBERT-large-nli-scorer

Text Classification

Transformers

Safetensors

modernbert

Generated from Trainer

Model card Files Files and versions Community

param-bharat commited on Dec 27, 2024

Commit

727c481

verified ·

1 Parent(s): b4e5d0a

Upload NLIScorer

Browse files

Files changed (1) hide show

pipeline.py +36 -7

pipeline.py CHANGED Viewed

@@ -330,28 +330,57 @@ TASK_CLASSES = {
     "Quality/Response/Verbosity": QualityResponseVerbosity,
 }
 class NLIScorer(Pipeline):
     def _sanitize_parameters(self, **kwargs):
         preprocess_kwargs = {}
         postprocess_kwargs = {}
-        if "threshold" in kwargs:
-            postprocess_kwargs["threshold"] = kwargs["threshold"]
         return preprocess_kwargs, {}, postprocess_kwargs
     def preprocess(self, inputs):
         task_name = inputs.pop("task_type")
         TaskClass = TASK_CLASSES[task_name]
         task_class = TaskClass(tokenizer=self.tokenizer, **inputs)
-        return task_class.as_model_inputs
     def _forward(self, model_inputs):
-        outputs = self.model(**model_inputs)
-        return outputs
-    def postprocess(self, model_outputs, threshold=0.5):
         pos_scores = model_outputs["logits"].softmax(-1)[0][1]
-        best_class = int(pos_scores > threshold)
         if best_class == 1:
             score = pos_scores
         else:

     "Quality/Response/Verbosity": QualityResponseVerbosity,
 }
+TASK_THRESHOLDS = {
+    "Detection/Hallucination/Factual Consistency": 0.5895,
+    "Detection/Prompt Injection": 0.4147,
+    "Detection/Source Code": 0.4001,
+    "Detection/Toxicity/Disability": 0.5547,
+    "Detection/Toxicity/Gender": 0.4007,
+    "Detection/Toxicity/Identity Hate": 0.5502,
+    "Detection/Toxicity/Insult": 0.4913,
+    "Detection/Toxicity/Obscene": 0.448,
+    "Detection/Toxicity/Race": 0.5983,
+    "Detection/Toxicity/Religion": 0.4594,
+    "Detection/Toxicity/Toxic": 0.5034,
+    "Detection/Toxicity/Violence": 0.4031,
+    "Quality/Context/Document Relevance": 0.5809,
+    "Quality/Context/Document Utilization": 0.4005,
+    "Quality/Context/Sentence Relevance": 0.6003,
+    "Quality/Context/Sentence Utilization": 0.5417,
+    "Quality/Response/Adherence": 0.59,
+    "Quality/Response/Attribution": 0.5304,
+    "Quality/Response/Coherence": 0.6891,
+    "Quality/Response/Complexity": 0.7235,
+    "Quality/Response/Correctness": 0.6535,
+    "Quality/Response/Helpfulness": 0.4445,
+    "Quality/Response/Instruction Following": 0.5323,
+    "Quality/Response/Relevance": 0.4011,
+    "Quality/Response/Verbosity": 0.4243,
+}
 class NLIScorer(Pipeline):
     def _sanitize_parameters(self, **kwargs):
         preprocess_kwargs = {}
         postprocess_kwargs = {}
         return preprocess_kwargs, {}, postprocess_kwargs
     def preprocess(self, inputs):
         task_name = inputs.pop("task_type")
         TaskClass = TASK_CLASSES[task_name]
         task_class = TaskClass(tokenizer=self.tokenizer, **inputs)
+        return {
+            "model_inputs": task_class.as_model_inputs,
+            "threshold": TASK_THRESHOLDS[task_name],
+        }
     def _forward(self, model_inputs):
+        outputs = self.model(**model_inputs["model_inputs"])
+        return {"logits": outputs["logits"], "threshold": model_inputs["threshold"]}
+    def postprocess(self, model_outputs):
         pos_scores = model_outputs["logits"].softmax(-1)[0][1]
+        best_class = int(pos_scores > model_outputs["threshold"])
         if best_class == 1:
             score = pos_scores
         else: