mirror of https://github.com/explosion/spaCy.git
* Pass the string to Tokens
This commit is contained in:
parent
45264e356b
commit
5928d158ce
|
@@ -33,7 +33,7 @@ cdef class Tokenizer:
|
||||||
|
|
||||||
cpdef Tokens tokens_from_list(self, list strings):
|
cpdef Tokens tokens_from_list(self, list strings):
|
||||||
cdef int length = sum([len(s) for s in strings])
|
cdef int length = sum([len(s) for s in strings])
|
||||||
cdef Tokens tokens = Tokens(self.vocab, length)
|
cdef Tokens tokens = Tokens(self.vocab, ' '.join(strings))
|
||||||
if length == 0:
|
if length == 0:
|
||||||
return tokens
|
return tokens
|
||||||
cdef UniStr string_struct
|
cdef UniStr string_struct
|
||||||
|
@@ -66,7 +66,7 @@ cdef class Tokenizer:
|
||||||
tokens (Tokens): A Tokens object, giving access to a sequence of LexemeCs.
|
tokens (Tokens): A Tokens object, giving access to a sequence of LexemeCs.
|
||||||
"""
|
"""
|
||||||
cdef int length = len(string)
|
cdef int length = len(string)
|
||||||
cdef Tokens tokens = Tokens(self.vocab, length)
|
cdef Tokens tokens = Tokens(self.vocab, string)
|
||||||
if length == 0:
|
if length == 0:
|
||||||
return tokens
|
return tokens
|
||||||
cdef int i = 0
|
cdef int i = 0
|
||||||
|
|
Loading…
Reference in New Issue