JohnKouf committed on
Commit
5a09914
·
verified ·
1 Parent(s): 2d7f83d

Update Similarity.py

Browse files
Files changed (1) hide show
  1. Similarity.py +15 -11
Similarity.py CHANGED
@@ -1,15 +1,19 @@
1
- from sentence_transformers import SentenceTransformer
 
2
 
3
class Similarity:
    """Lazily-initialised wrapper around a SentenceTransformer model.

    The model is not created in the constructor; it is instantiated the
    first time ``load_model`` (or ``embed_text``, which calls it) runs.
    """

    def __init__(self):
        # No model yet; ``load_model`` fills this in on first use.
        self.model = None

    def load_model(self):
        """Create the SentenceTransformer model unless one is already set."""
        if self.model is not None:
            return
        print("Loading SentenceTransformer model...")
        self.model = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")
        print("Model loaded.")

    def embed_text(self, text):
        """Return ``self.model.encode(text, convert_to_tensor=True)``.

        Ensures the model has been loaded before encoding.
        """
        self.load_model()
        encoder = self.model
        return encoder.encode(text, convert_to_tensor=True)
 
 
 
 
 
 
 
1
+ from transformers import AutoTokenizer, AutoModel
2
+ import torch
3
 
4
class SimpleEmbedder:
    """Sentence embedder built from a Hugging Face tokenizer and encoder.

    Embeddings are the attention-mask-weighted mean of the encoder's last
    hidden state, so padding positions never contribute to the average.
    """

    def __init__(self, model_name='sentence-transformers/all-MiniLM-L6-v2'):
        """Load the tokenizer and encoder weights for ``model_name``.

        Args:
            model_name: Checkpoint identifier passed to ``from_pretrained``
                for both the tokenizer and the model. Defaults to the
                checkpoint this class originally hard-coded.
        """
        print("Loading tokenizer and model...")
        self.tokenizer = AutoTokenizer.from_pretrained(model_name)
        self.model = AutoModel.from_pretrained(model_name)
        print("Loaded.")

    def embed_text(self, text):
        """Embed one string or a list of strings.

        Args:
            text: A single string or a list of strings.

        Returns:
            A tensor with one pooled embedding row per input text, detached
            from the autograd graph.
        """
        # padding=True lets a list of differently sized texts form one batch;
        # truncation=True keeps over-long texts within the tokenizer's limit.
        inputs = self.tokenizer(
            text, return_tensors='pt', padding=True, truncation=True
        )
        # Inference only: skip building an autograd graph.
        with torch.no_grad():
            outputs = self.model(**inputs)
            hidden = outputs.last_hidden_state
            # Mean pooling over real tokens only: zero out padded positions
            # and divide by the number of unmasked tokens per row.
            mask = inputs['attention_mask'].unsqueeze(-1).to(hidden.dtype)
            summed = (hidden * mask).sum(dim=1)
            counts = mask.sum(dim=1).clamp(min=1e-9)
            embeddings = summed / counts
        return embeddings
17
+
18
# Module-level smoke check: build one embedder and print a sample embedding.
embedder = SimpleEmbedder()
_sample = embedder.embed_text("Hello world")
print(_sample)