File size: 515 Bytes
eb90fa0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
import numpy as np
from sentence_transformers import SentenceTransformer


# Sentence encoder used to embed every tag; the checkpoint is loaded by name.
encoder = SentenceTransformer("hfl/chinese-roberta-wwm-ext-large")

# Read one tag per line, stripping surrounding whitespace. The context manager
# closes the file even if reading fails.
# NOTE(review): assumes tags.txt is UTF-8 encoded -- confirm; without an
# explicit encoding the result depends on the platform locale.
with open('tags.txt', 'r', encoding='utf-8') as f:
    tags = [line.strip() for line in f]

# One embedding row per tag (row i corresponds to line i of tags.txt).
tags_embed = encoder.encode(tags)

# Euclidean (L2) norm of each embedding row, i.e. sqrt(v . v) per tag.
# Computed as an ndarray (not a Python list) so that `.shape` below works;
# the original list had no `.shape` and crashed before anything was saved.
tags_dis = np.linalg.norm(tags_embed, axis=1)

print(tags_embed.shape, tags_dis.shape)

# Persist both arrays in NumPy's .npy format for later reuse.
with open('./tags_embed.npy', 'wb') as f:
    np.save(f, tags_embed)

with open('./tags_dis.npy', 'wb') as f:
    np.save(f, tags_dis)