takanezawa committed on
Commit
4af82f4
·
1 Parent(s): a03b9b6

スパースベクトル化に対応する

Browse files
Files changed (2) hide show
  1. .gitignore +1 -0
  2. handler.py +20 -12
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ test*
handler.py CHANGED
@@ -1,15 +1,14 @@
1
  from typing import Dict, List, Any
2
- from optimum.onnxruntime import ORTModelForSequenceClassification
3
- from transformers import pipeline, AutoTokenizer
 
4
 
5
 
6
  class EndpointHandler():
7
- def __init__(self, path="./onnx"):
8
  # load the optimized model
9
- model = ORTModelForSequenceClassification.from_pretrained(path)
10
- tokenizer = AutoTokenizer.from_pretrained(path)
11
- # create inference pipeline
12
- self.pipeline = pipeline("text-classification", model=model, tokenizer=tokenizer)
13
 
14
 
15
  def __call__(self, data: Any) -> List[List[Dict[str, float]]]:
@@ -24,11 +23,20 @@ class EndpointHandler():
24
  """
25
  inputs = data.pop("inputs", data)
26
  parameters = data.pop("parameters", None)
 
 
 
 
 
 
 
 
 
27
 
28
  # pass inputs with all kwargs in data
29
- if parameters is not None:
30
- prediction = self.pipeline(inputs, **parameters)
31
- else:
32
- prediction = self.pipeline(inputs)
33
  # postprocess the prediction
34
- return prediction
 
1
  from typing import Dict, List, Any
2
+ # from optimum.onnxruntime import ORTModelForSequenceClassification
3
+ # from transformers import pipeline, AutoTokenizer
4
+ from FlagEmbedding import BGEM3FlagModel
5
 
6
 
7
class EndpointHandler():
    """Inference endpoint handler producing BGE-M3 sparse embeddings.

    Loads a ``BGEM3FlagModel`` once at startup and, for each request,
    returns the sparse (lexical-weight) representation of every input
    text as a ``(values, dimensions)`` pair.
    """

    def __init__(self, path="./"):
        # Prepare the model from the checkpoint directory.
        # BUGFIX: the original bound the model to a local variable, so
        # __call__'s self.model raised AttributeError; it also hard-coded
        # "./" instead of honoring the `path` argument.
        self.model = BGEM3FlagModel(path, use_fp16=False)

    def __call__(self, data: Any) -> List[Any]:
        """Handle one inference request.

        Args:
            data: Request payload — a dict with key ``"inputs"`` (a text or
                list of texts) and an optional ``"parameters"`` key.

        Returns:
            A list with one ``(values, dimensions)`` tuple per input, where
            ``values`` are the lexical weights (floats) and ``dimensions``
            the matching token ids (ints) of the sparse vector.
        """
        inputs = data.pop("inputs", data)
        # Accepted for endpoint-interface compatibility; currently unused
        # (the old text-classification pipeline consumed it).
        parameters = data.pop("parameters", None)

        # Sparse-only encoding: "lexical_weights" maps token-id -> weight
        # for each input text.
        result = self.model.encode(inputs, return_dense=False, return_sparse=True)
        sparse_vectors = result["lexical_weights"]

        # BUGFIX: the original returned the raw sparse_vectors dicts,
        # leaving this conversion loop dead code; the (values, dimensions)
        # pairs are the intended response format.
        sparse_embs = []
        for sparse_vector in sparse_vectors:
            sparse_values = list(sparse_vector.values())
            sparse_dimensions = [int(key) for key in sparse_vector.keys()]
            sparse_embs.append((sparse_values, sparse_dimensions))
        return sparse_embs