KoichiYasuoka committed on
Commit
ada136d
·
1 Parent(s): b55b5d0

model improved

Browse files
Files changed (2) hide show
  1. maker.py +8 -2
  2. pytorch_model.bin +1 -1
maker.py CHANGED
@@ -36,7 +36,7 @@ class UDEmbedsDataset(object):
36
  self.tokenizer=tokenizer
37
  self.embeddings=embeddings
38
  self.seeks=[0]
39
- label=set(["SYM","SYM."])
40
  dep=set()
41
  s=self.conllu.readline()
42
  while s!="":
@@ -86,8 +86,9 @@ class UDEmbedsDataset(object):
86
  emb=self.embeddings
87
  else:
88
  import torch
89
- if len(x)<128:
90
  x=[True]*len(x)
 
91
  else:
92
  w=sum([len(x)-i+1 if b else 0 for i,b in enumerate(x)])+1
93
  for i in range(len(x)):
@@ -104,6 +105,11 @@ class UDEmbedsDataset(object):
104
  for j in range(i+1,len(x)):
105
  ids.append(j)
106
  upos.append(p[j]+"|"+d[j] if int(c[j][6])==i+1 else p[i]+"|"+d[i] if int(c[i][6])==j+1 else p[j]+"|_")
 
 
 
 
 
107
  ids.append(-1)
108
  upos.append("SYM|_")
109
  with torch.no_grad():
 
36
  self.tokenizer=tokenizer
37
  self.embeddings=embeddings
38
  self.seeks=[0]
39
+ label=set(["SYM","SYM.","SYM|_"])
40
  dep=set()
41
  s=self.conllu.readline()
42
  while s!="":
 
86
  emb=self.embeddings
87
  else:
88
  import torch
89
+ if len(x)<127:
90
  x=[True]*len(x)
91
+ w=(len(x)+2)*(len(x)+1)/2
92
  else:
93
  w=sum([len(x)-i+1 if b else 0 for i,b in enumerate(x)])+1
94
  for i in range(len(x)):
 
105
  for j in range(i+1,len(x)):
106
  ids.append(j)
107
  upos.append(p[j]+"|"+d[j] if int(c[j][6])==i+1 else p[i]+"|"+d[i] if int(c[i][6])==j+1 else p[j]+"|_")
108
+ if w>8192 and i>0:
109
+ while w>8192 and upos[-1].endswith("|_"):
110
+ upos.pop(-1)
111
+ ids.pop(-1)
112
+ w-=1
113
  ids.append(-1)
114
  upos.append("SYM|_")
115
  with torch.no_grad():
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04c10ef1bc02136241e060e8e040ed06a23d1ce74b96ada894e1fcebd8886dcb
3
  size 611030258
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0736e9bfbba2fc216739f47298aded53cd9ee3a725ef02f1958d556deaa03518
3
  size 611030258