submission-template

Sleeping

csk99 committed on Jan 23

Commit

a8c9010

verified ·

1 Parent(s): e324040

Update tasks/text.py

Add inference code with sentence transformer and XGBoost model

Files changed (1) hide show

tasks/text.py CHANGED Viewed

@@ -7,6 +7,12 @@ import random
 from .utils.evaluation import TextEvaluationRequest
 from .utils.emissions import tracker, clean_emissions_data, get_space_info
 router = APIRouter()
 DESCRIPTION = "Random Baseline"
@@ -53,12 +59,26 @@ async def evaluate_text(request: TextEvaluationRequest):
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE CODE HERE
     # Update the code below to replace the random baseline by your model inference within the inference pass where the energy consumption and emissions are tracked.
     #--------------------------------------------------------------------------------------------
     # Make random predictions (placeholder for actual model inference)
     true_labels = test_dataset["label"]
-    predictions = [random.randint(0, 7) for _ in range(len(true_labels))]
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE STOPS HERE

 from .utils.evaluation import TextEvaluationRequest
 from .utils.emissions import tracker, clean_emissions_data, get_space_info
+#packages needed for inference
+from sentence_transformers import SentenceTransformer
+from xgboost import XGBClassifier
+import pickle
 router = APIRouter()
 DESCRIPTION = "Random Baseline"
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE CODE HERE
+    #Load the embedding model
+    model = SentenceTransformer("dunzhang/stella_en_400M_v5",trust_remote_code=True)
+    # Convert each sentence into a vector representation (embedding)
+    embeddings = model.encode(test_dataset['quote'].tolist())
     # Update the code below to replace the random baseline by your model inference within the inference pass where the energy consumption and emissions are tracked.
     #--------------------------------------------------------------------------------------------
     # Make random predictions (placeholder for actual model inference)
     true_labels = test_dataset["label"]
+    #load the xgboost model
+    with open("models/stella_400_xgb_500.pkl",'rb') as f:
+        xgbclassifier = pickle.load(f)
+    #make inference
+    predictions = xgbclassifier.predict(embeddings)
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE STOPS HERE