spaCy/spacy/strings.pxd

34 lines
771 B
Cython
Raw Normal View History

from cymem.cymem cimport Pool
from preshed.maps cimport PreshMap
from murmurhash.mrmr cimport hash64
from .typedefs cimport attr_t
from libc.stdint cimport int64_t
2015-07-20 10:06:10 +00:00
from .structs cimport UniStr
from .typedefs cimport hash_t
cpdef hash_t hash_string(unicode string) except 0
2015-07-20 10:06:10 +00:00
ctypedef union Utf8Str:
unsigned char[8] s
unsigned char* p
cdef inline void slice_unicode(UniStr* s, Py_UNICODE* chars, int start, int end) nogil:
s.chars = &chars[start]
s.n = end - start
2014-12-20 18:36:29 +00:00
s.key = hash64(s.chars, <int>(s.n * sizeof(Py_UNICODE)), 0)
cdef class StringStore:
cdef Pool mem
2015-07-20 10:06:10 +00:00
cdef Utf8Str* c
cdef int64_t size
cdef PreshMap _map
cdef size_t _resize_at
2015-07-20 10:06:10 +00:00
cdef const Utf8Str* intern(self, unsigned char* chars, int length) except NULL