From c675746ca2ffbe13c06751cd30168c55b7d372fc Mon Sep 17 00:00:00 2001 From: Ines Montani Date: Wed, 5 Aug 2020 20:29:46 +0200 Subject: [PATCH] Update docstrings and types --- spacy/gold/batchers.py | 7 +++++-- spacy/gold/corpus.py | 1 - 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/spacy/gold/batchers.py b/spacy/gold/batchers.py index d1b8e6b55..57c6b4b3a 100644 --- a/spacy/gold/batchers.py +++ b/spacy/gold/batchers.py @@ -45,7 +45,9 @@ def configure_minibatch_by_words( @registry.batchers("batch_by_sequence.v1") -def configure_minibatch(size: Sizing, get_length=None) -> BatcherT: +def configure_minibatch( + size: Sizing, get_length: Optional[Callable[[ItemT], int]] = None +) -> BatcherT: optionals = {"get_length": get_length} if get_length is not None else {} return partial(minibatch, size=size, **optionals) @@ -79,7 +81,8 @@ def minibatch_by_words( """Create minibatches of roughly a given number of words. If any examples are longer than the specified batch length, they will appear in a batch by themselves, or be discarded if discard_oversize=True. - The argument 'docs' can be a list of strings, Doc's or Example's. """ + The argument 'docs' can be a list of strings, Docs or Examples. + """ if isinstance(size, int): size_ = itertools.repeat(size) elif isinstance(size, List): diff --git a/spacy/gold/corpus.py b/spacy/gold/corpus.py index 758fe021e..4a65d8885 100644 --- a/spacy/gold/corpus.py +++ b/spacy/gold/corpus.py @@ -74,7 +74,6 @@ class Corpus: """Yield examples from the data. nlp (Language): The current nlp object. - loc (Path): The file or directory to read from. YIELDS (Example): The examples. DOCS: https://spacy.io/api/corpus#call