@@ -176,15 +176,18 @@ def test_corpus_init():
176
176
_check_copies (corp , copy (corp ), same_nlp_instance = True )
177
177
_check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
178
178
179
- corp = c .Corpus (textdata_en , language = 'en' , load_features = {'vectors' , 'tok2vec' , 'tagger' , 'morphologizer' ,
180
- 'parser' , 'attribute_ruler' , 'lemmatizer' , 'ner' })
181
- assert corp .has_sents
182
- assert corp .language_model == 'en_core_web_md'
183
- _check_corpus_docs (corp , has_sents = True )
184
- assert 'ner' in corp .nlp .pipe_names
179
+ if 'en_core_web_md' in spacy .util .get_installed_models ():
180
+ corp = c .Corpus (textdata_en , language = 'en' , load_features = {'vectors' , 'tok2vec' , 'tagger' , 'morphologizer' ,
181
+ 'parser' , 'attribute_ruler' , 'lemmatizer' , 'ner' })
182
+ assert corp .has_sents
183
+ assert corp .language_model == 'en_core_web_md'
184
+ _check_corpus_docs (corp , has_sents = True )
185
+ assert 'ner' in corp .nlp .pipe_names
185
186
186
- _check_copies (corp , copy (corp ), same_nlp_instance = True )
187
- _check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
187
+ _check_copies (corp , copy (corp ), same_nlp_instance = True )
188
+ _check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
189
+ else :
190
+ raise RuntimeWarning ('language model "en_core_web_md" not installed' )
188
191
189
192
corp = c .Corpus (textdata_en , language = 'en' , load_features = {'tok2vec' , 'senter' })
190
193
assert corp .has_sents
@@ -821,6 +824,8 @@ def test_doc_frequencies(corpora_en_serial_and_parallel_module, proportions, sel
821
824
assert set (res ['token' ]) == c .vocabulary (corp , select = select , sort = False )
822
825
823
826
827
+ @pytest .mark .skipif ('en_core_web_md' not in spacy .util .get_installed_models (),
828
+ reason = 'language model "en_core_web_md" not installed' )
824
829
@settings (deadline = None )
825
830
@given (select = st .sampled_from ([None , 'empty' , 'small2' , 'nonexistent' , ['small1' , 'small2' ], []]),
826
831
omit_empty = st .booleans ())
@@ -852,6 +857,8 @@ def test_doc_vectors(corpora_en_serial_and_parallel_also_w_vectors_module, selec
852
857
assert len (vec ) > 0
853
858
854
859
860
+ @pytest .mark .skipif ('en_core_web_md' not in spacy .util .get_installed_models (),
861
+ reason = 'language model "en_core_web_md" not installed' )
855
862
@settings (deadline = None )
856
863
@given (select = st .sampled_from ([None , 'empty' , 'small2' , 'nonexistent' , ['small1' , 'small2' ], []]),
857
864
omit_oov = st .booleans ())
@@ -889,6 +896,8 @@ def test_token_vectors(corpora_en_serial_and_parallel_also_w_vectors_module, sel
889
896
assert mat .ndim == 2
890
897
891
898
899
+ @pytest .mark .skipif ('en_core_web_md' not in spacy .util .get_installed_models (),
900
+ reason = 'language model "en_core_web_md" not installed' )
892
901
@settings (deadline = None )
893
902
@given (select = st .sampled_from ([None , 'empty' , 'small2' , 'nonexistent' , ['small1' , 'small2' ], []]),
894
903
collapse = st .sampled_from ([None , ' ' ]))
0 commit comments