diff --git a/spacy/cli/pretrain.py b/spacy/cli/pretrain.py index 598739246..9a9d9e213 100644 --- a/spacy/cli/pretrain.py +++ b/spacy/cli/pretrain.py @@ -110,7 +110,7 @@ def pretrain( msg.row(("#", "# Words", "Total Loss", "Loss", "w/s"), **row_settings) for epoch in range(nr_iter): for batch in util.minibatch_by_words( - ((text, None) for text in texts), size=5000 + ((text, None) for text in texts), size=3000 ): docs = make_docs(nlp, [text for (text, _) in batch]) loss = make_update(model, docs, optimizer, drop=dropout)