Skip to content
This repository was archived by the owner on May 3, 2023. It is now read-only.

Commit b3c0989

Browse files
author
Markus Konrad
committed
test_corpus: don't fail when certain language models are not installed
1 parent 4aa68d6 commit b3c0989

File tree

1 file changed

+17
-8
lines changed

1 file changed

+17
-8
lines changed

tests/test_corpus.py

Lines changed: 17 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -176,15 +176,18 @@ def test_corpus_init():
176176
_check_copies(corp, copy(corp), same_nlp_instance=True)
177177
_check_copies(corp, deepcopy(corp), same_nlp_instance=False)
178178

179-
corp = c.Corpus(textdata_en, language='en', load_features={'vectors', 'tok2vec', 'tagger', 'morphologizer',
180-
'parser', 'attribute_ruler', 'lemmatizer', 'ner'})
181-
assert corp.has_sents
182-
assert corp.language_model == 'en_core_web_md'
183-
_check_corpus_docs(corp, has_sents=True)
184-
assert 'ner' in corp.nlp.pipe_names
179+
if 'en_core_web_md' in spacy.util.get_installed_models():
180+
corp = c.Corpus(textdata_en, language='en', load_features={'vectors', 'tok2vec', 'tagger', 'morphologizer',
181+
'parser', 'attribute_ruler', 'lemmatizer', 'ner'})
182+
assert corp.has_sents
183+
assert corp.language_model == 'en_core_web_md'
184+
_check_corpus_docs(corp, has_sents=True)
185+
assert 'ner' in corp.nlp.pipe_names
185186

186-
_check_copies(corp, copy(corp), same_nlp_instance=True)
187-
_check_copies(corp, deepcopy(corp), same_nlp_instance=False)
187+
_check_copies(corp, copy(corp), same_nlp_instance=True)
188+
_check_copies(corp, deepcopy(corp), same_nlp_instance=False)
189+
else:
190+
raise RuntimeWarning('language model "en_core_web_md" not installed')
188191

189192
corp = c.Corpus(textdata_en, language='en', load_features={'tok2vec', 'senter'})
190193
assert corp.has_sents
@@ -821,6 +824,8 @@ def test_doc_frequencies(corpora_en_serial_and_parallel_module, proportions, sel
821824
assert set(res['token']) == c.vocabulary(corp, select=select, sort=False)
822825

823826

827+
@pytest.mark.skipif('en_core_web_md' not in spacy.util.get_installed_models(),
828+
reason='language model "en_core_web_md" not installed')
824829
@settings(deadline=None)
825830
@given(select=st.sampled_from([None, 'empty', 'small2', 'nonexistent', ['small1', 'small2'], []]),
826831
omit_empty=st.booleans())
@@ -852,6 +857,8 @@ def test_doc_vectors(corpora_en_serial_and_parallel_also_w_vectors_module, selec
852857
assert len(vec) > 0
853858

854859

860+
@pytest.mark.skipif('en_core_web_md' not in spacy.util.get_installed_models(),
861+
reason='language model "en_core_web_md" not installed')
855862
@settings(deadline=None)
856863
@given(select=st.sampled_from([None, 'empty', 'small2', 'nonexistent', ['small1', 'small2'], []]),
857864
omit_oov=st.booleans())
@@ -889,6 +896,8 @@ def test_token_vectors(corpora_en_serial_and_parallel_also_w_vectors_module, sel
889896
assert mat.ndim == 2
890897

891898

899+
@pytest.mark.skipif('en_core_web_md' not in spacy.util.get_installed_models(),
900+
reason='language model "en_core_web_md" not installed')
892901
@settings(deadline=None)
893902
@given(select=st.sampled_from([None, 'empty', 'small2', 'nonexistent', ['small1', 'small2'], []]),
894903
collapse=st.sampled_from([None, ' ']))

0 commit comments

Comments
 (0)