@@ -176,19 +176,6 @@ def test_corpus_init():
176
176
_check_copies (corp , copy (corp ), same_nlp_instance = True )
177
177
_check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
178
178
179
- if 'en_core_web_md' in spacy .util .get_installed_models ():
180
- corp = c .Corpus (textdata_en , language = 'en' , load_features = {'vectors' , 'tok2vec' , 'tagger' , 'morphologizer' ,
181
- 'parser' , 'attribute_ruler' , 'lemmatizer' , 'ner' })
182
- assert corp .has_sents
183
- assert corp .language_model == 'en_core_web_md'
184
- _check_corpus_docs (corp , has_sents = True )
185
- assert 'ner' in corp .nlp .pipe_names
186
-
187
- _check_copies (corp , copy (corp ), same_nlp_instance = True )
188
- _check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
189
- else :
190
- raise RuntimeWarning ('language model "en_core_web_md" not installed' )
191
-
192
179
corp = c .Corpus (textdata_en , language = 'en' , load_features = {'tok2vec' , 'senter' })
193
180
assert corp .has_sents
194
181
assert corp .language_model == 'en_core_web_sm'
@@ -261,6 +248,20 @@ def test_corpus_init():
261
248
_check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
262
249
263
250
251
+ @pytest .mark .skipif ('en_core_web_md' not in spacy .util .get_installed_models (),
252
+ reason = 'language model "en_core_web_md" not installed' )
253
+ def test_corpus_init_md_model_required ():
254
+ corp = c .Corpus (textdata_en , language = 'en' , load_features = {'vectors' , 'tok2vec' , 'tagger' , 'morphologizer' ,
255
+ 'parser' , 'attribute_ruler' , 'lemmatizer' , 'ner' })
256
+ assert corp .has_sents
257
+ assert corp .language_model == 'en_core_web_md'
258
+ _check_corpus_docs (corp , has_sents = True )
259
+ assert 'ner' in corp .nlp .pipe_names
260
+
261
+ _check_copies (corp , copy (corp ), same_nlp_instance = True )
262
+ _check_copies (corp , deepcopy (corp ), same_nlp_instance = False )
263
+
264
+
264
265
@settings (deadline = None )
265
266
@given (docs = strategy_str_str_dict_printable (),
266
267
punctuation = st .one_of (st .none (), st .lists (st .text (string .punctuation , min_size = 1 , max_size = 1 ))),
0 commit comments