2014-07-07 02:21:06 +00:00
|
|
|
from libcpp.vector cimport vector
|
2014-07-05 18:51:42 +00:00
|
|
|
|
2014-07-07 02:21:06 +00:00
|
|
|
from spacy.spacy cimport StringHash
|
|
|
|
from spacy.spacy cimport Vocab
|
|
|
|
from spacy.lexeme cimport Lexeme
|
|
|
|
from spacy.lexeme cimport Lexeme_addr
|
2014-07-05 18:51:42 +00:00
|
|
|
|
|
|
|
|
2014-07-07 05:36:43 +00:00
|
|
|
# Module-level C pointer to a Vocab (type cimported from spacy.spacy).
# Being a raw pointer, it is only reachable from Cython/C code, not from Python.
# NOTE(review): presumably the shared vocabulary table backing lookup()/tokenize();
# allocation and ownership are not visible in this declaration — confirm in the implementation.
cdef Vocab* VOCAB
|
2014-07-07 02:21:06 +00:00
|
|
|
# Module-level Python dict, typed so Cython can use direct dict operations on it.
# NOTE(review): the name is VOCAB reversed, so this is presumably the reverse
# mapping consulted by unhash(); key/value types are not shown here — confirm
# against the implementation.
cdef dict BACOV
|
2014-07-05 18:51:42 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Declaration only: takes a unicode word and returns a Lexeme_addr.
# cpdef makes it callable both from Python and, without Python-call overhead, from Cython.
# `except 0` reserves 0 as the error return value: a result of 0 tells C-level
# callers that an exception was raised, so a successful call must never return 0.
cpdef Lexeme_addr lookup(unicode word) except 0
|
2014-07-07 02:21:06 +00:00
|
|
|
# Declaration only: takes a unicode string and returns a C++ vector of Lexeme_addr
# values (converted to a Python list when called from Python).
# `except *` reserves no error return value; instead Cython checks for a pending
# exception after every call so that errors still propagate to C-level callers.
# NOTE(review): splitting rules and the order of the returned addresses are
# defined by the implementation, which is not visible here.
cpdef vector[Lexeme_addr] tokenize(unicode string) except *
|
2014-07-05 18:51:42 +00:00
|
|
|
# Declaration only: takes a StringHash and returns a unicode object.
# The return type is a Python object, so exceptions propagate in the normal way
# and no `except` clause is needed.
# NOTE(review): presumably recovers the original string for a hash value;
# behaviour for an unknown hash is not visible here — confirm in the implementation.
cpdef unicode unhash(StringHash hash_value)
|