add custom layernorm patch
tasks/text.py CHANGED (+23 -13)
@@ -7,6 +7,7 @@ import os
 from concurrent.futures import ThreadPoolExecutor
 from typing import List, Dict, Tuple
 import torch
+import torch.nn as nn
 from transformers import AutoTokenizer, AutoModelForSequenceClassification, AutoConfig
 from huggingface_hub import login
 from dotenv import load_dotenv
@@ -30,6 +31,11 @@ router = APIRouter()
 DESCRIPTION = "Climate Guard Toxic Agent Classifier"
 ROUTE = "/text"
 
+# Custom LayerNorm that ignores bias parameter
+class CustomLayerNorm(nn.LayerNorm):
+    def __init__(self, normalized_shape, eps=1e-5, **kwargs):
+        super().__init__(normalized_shape, eps=eps)
+
 class TextClassifier:
     def __init__(self):
         self.device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -38,27 +44,31 @@ class TextClassifier:
 
         for attempt in range(max_retries):
             try:
-                # Load config
+                # Load config
                 self.config = AutoConfig.from_pretrained(model_name)
 
-                # Remove problematic bias parameters
-                if hasattr(self.config, 'norm_bias'):
-                    delattr(self.config, 'norm_bias')
-
                 # Initialize tokenizer
                 self.tokenizer = AutoTokenizer.from_pretrained(
                     model_name,
-                    model_max_length=
+                    model_max_length=512,
                     padding_side='right',
                     truncation_side='right'
                 )
 
-                # Initialize model
-                self.model = AutoModelForSequenceClassification.from_pretrained(
-                    model_name,
-                    config=self.config,
-                    ignore_mismatched_sizes=True
-                )
+                # Patch LayerNorm
+                original_layernorm = nn.LayerNorm
+                nn.LayerNorm = CustomLayerNorm
+
+                try:
+                    # Initialize model with patched LayerNorm
+                    self.model = AutoModelForSequenceClassification.from_pretrained(
+                        model_name,
+                        config=self.config,
+                        ignore_mismatched_sizes=True
+                    )
+                finally:
+                    # Restore original LayerNorm
+                    nn.LayerNorm = original_layernorm
 
                 self.model.to(self.device)
                 self.model.eval()
@@ -81,7 +91,7 @@ class TextClassifier:
                 batch,
                 return_tensors="pt",
                 truncation=True,
-                max_length=
+                max_length=512,
                 padding='max_length'
             ).to(self.device)
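
For context on the patch itself: the commit's comments indicate the checkpoint's config drives a bias argument (the removed code referenced `norm_bias`) into layer construction that the stock `nn.LayerNorm` signature may not accept, so `CustomLayerNorm` silently drops unknown keyword arguments, and the global rebinding is reverted in `finally` so the rest of the process sees the original class. The same swap-and-restore pattern can be packaged as a context manager. The sketch below is a minimal illustration of that pattern only; the `patched_layernorm` helper is a name invented here, not part of the diff.

from contextlib import contextmanager

import torch.nn as nn

@contextmanager
def patched_layernorm(replacement):
    # Temporarily rebind torch.nn.LayerNorm; the finally block restores
    # the original class even if model loading raises.
    original = nn.LayerNorm
    nn.LayerNorm = replacement
    try:
        yield
    finally:
        nn.LayerNorm = original

class CustomLayerNorm(nn.LayerNorm):
    # As in the diff: accept and discard unsupported keyword arguments
    # (e.g. a bias flag) and build a standard LayerNorm.
    def __init__(self, normalized_shape, eps=1e-5, **kwargs):
        super().__init__(normalized_shape, eps=eps)

# Hypothetical usage mirroring __init__ in the diff:
# with patched_layernorm(CustomLayerNorm):
#     model = AutoModelForSequenceClassification.from_pretrained(model_name)

One caveat worth noting: rebinding `nn.LayerNorm` only affects code that resolves the attribute at call time. Any module that ran `from torch.nn import LayerNorm` at import time keeps a reference to the original class, so the patch is best-effort rather than guaranteed.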