Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
File size: 1,420 Bytes
63858e7 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
from spacyface import *
import pytest
def load_sample_en_sents():
from .EN_TEST_SENTS import SPACY_EN_TEST_SENTS
return SPACY_EN_TEST_SENTS
sentences = load_sample_en_sents()
@pytest.mark.parametrize("model_name,alnr_class",
[('bert-base-uncased', BertAligner),
('bert-base-cased', BertAligner),
('gpt2', GPT2Aligner),
('roberta-base', RobertaAligner),
('distilbert-base-uncased', DistilBertAligner),
('transfo-xl-wt103', TransfoXLAligner),
('xlnet-base-cased', XLNetAligner),
('xlm-mlm-en-2048', XLMAligner),
('ctrl', CTRLAligner),
('albert-base-v1', AlbertAligner),
('openai-gpt', OpenAIGPTAligner),
('xlm-roberta-base', XLMRobertaAligner),
# ('t5-small', T5Aligner), # This does not currently work
])
def test_aligner(model_name, alnr_class):
"""NOTE: Will be obsolete when the aligner is able to work with transformer auto model"""
a = alnr_class.from_pretrained(model_name)
for s in sentences:
mtokens = [m['token'] for m in a.meta_tokenize(s)]
tokens = a.tokenize(s)
assert tokens == mtokens, f"{tokens} \n {mtokens}"
|