2016-10-09 10:24:24 +00:00
|
|
|
from libc.stdint cimport int64_t
|
2017-05-28 10:36:27 +00:00
|
|
|
from libcpp.vector cimport vector
|
2017-11-11 00:11:27 +00:00
|
|
|
from libcpp.set cimport set
|
2014-12-19 19:42:01 +00:00
|
|
|
from cymem.cymem cimport Pool
|
|
|
|
from preshed.maps cimport PreshMap
|
2014-12-19 20:41:08 +00:00
|
|
|
from murmurhash.mrmr cimport hash64
|
2015-07-18 20:39:57 +00:00
|
|
|
|
2016-10-09 10:24:24 +00:00
|
|
|
from .typedefs cimport attr_t, hash_t
|
2014-12-19 19:42:01 +00:00
|
|
|
|
2015-01-11 23:26:22 +00:00
|
|
|
|
|
|
|
cpdef hash_t hash_string(unicode string) except 0
|
2017-05-28 10:36:27 +00:00
|
|
|
cdef hash_t hash_utf8(char* utf8_string, int length) nogil
|
|
|
|
|
|
|
|
cdef unicode decode_Utf8Str(const Utf8Str* string)
|
2014-12-19 20:41:08 +00:00
|
|
|
|
|
|
|
|
2015-07-20 10:06:10 +00:00
|
|
|
ctypedef union Utf8Str:
|
|
|
|
unsigned char[8] s
|
|
|
|
unsigned char* p
|
|
|
|
|
|
|
|
|
2014-12-19 19:42:01 +00:00
|
|
|
cdef class StringStore:
|
|
|
|
cdef Pool mem
|
|
|
|
|
2017-05-28 10:36:27 +00:00
|
|
|
cdef vector[hash_t] keys
|
2017-11-11 00:11:27 +00:00
|
|
|
cdef set[hash_t] hits
|
2015-11-05 11:32:19 +00:00
|
|
|
cdef public PreshMap _map
|
2014-12-19 19:42:01 +00:00
|
|
|
|
2016-10-24 12:00:35 +00:00
|
|
|
cdef const Utf8Str* intern_unicode(self, unicode py_string)
|
|
|
|
cdef const Utf8Str* _intern_utf8(self, char* utf8_string, int length)
|