Commit
·
ada136d
1
Parent(s):
b55b5d0
model improved
Browse files
- maker.py +8 -2
- pytorch_model.bin +1 -1
maker.py
CHANGED
@@ -36,7 +36,7 @@ class UDEmbedsDataset(object):
|
|
36 |
self.tokenizer=tokenizer
|
37 |
self.embeddings=embeddings
|
38 |
self.seeks=[0]
|
39 |
-
label=set(["SYM","SYM."])
|
40 |
dep=set()
|
41 |
s=self.conllu.readline()
|
42 |
while s!="":
|
@@ -86,8 +86,9 @@ class UDEmbedsDataset(object):
|
|
86 |
emb=self.embeddings
|
87 |
else:
|
88 |
import torch
|
89 |
-
if len(x)<
|
90 |
x=[True]*len(x)
|
|
|
91 |
else:
|
92 |
w=sum([len(x)-i+1 if b else 0 for i,b in enumerate(x)])+1
|
93 |
for i in range(len(x)):
|
@@ -104,6 +105,11 @@ class UDEmbedsDataset(object):
|
|
104 |
for j in range(i+1,len(x)):
|
105 |
ids.append(j)
|
106 |
upos.append(p[j]+"|"+d[j] if int(c[j][6])==i+1 else p[i]+"|"+d[i] if int(c[i][6])==j+1 else p[j]+"|_")
|
|
|
|
|
|
|
|
|
|
|
107 |
ids.append(-1)
|
108 |
upos.append("SYM|_")
|
109 |
with torch.no_grad():
|
|
|
36 |
self.tokenizer=tokenizer
|
37 |
self.embeddings=embeddings
|
38 |
self.seeks=[0]
|
39 |
+
label=set(["SYM","SYM.","SYM|_"])
|
40 |
dep=set()
|
41 |
s=self.conllu.readline()
|
42 |
while s!="":
|
|
|
86 |
emb=self.embeddings
|
87 |
else:
|
88 |
import torch
|
89 |
+
if len(x)<127:
|
90 |
x=[True]*len(x)
|
91 |
+
w=(len(x)+2)*(len(x)+1)/2
|
92 |
else:
|
93 |
w=sum([len(x)-i+1 if b else 0 for i,b in enumerate(x)])+1
|
94 |
for i in range(len(x)):
|
|
|
105 |
for j in range(i+1,len(x)):
|
106 |
ids.append(j)
|
107 |
upos.append(p[j]+"|"+d[j] if int(c[j][6])==i+1 else p[i]+"|"+d[i] if int(c[i][6])==j+1 else p[j]+"|_")
|
108 |
+
if w>8192 and i>0:
|
109 |
+
while w>8192 and upos[-1].endswith("|_"):
|
110 |
+
upos.pop(-1)
|
111 |
+
ids.pop(-1)
|
112 |
+
w-=1
|
113 |
ids.append(-1)
|
114 |
upos.append("SYM|_")
|
115 |
with torch.no_grad():
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 611030258
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0736e9bfbba2fc216739f47298aded53cd9ee3a725ef02f1958d556deaa03518
|
3 |
size 611030258
|