__init__.py
|
enable token match
|
2017-07-26 19:13:14 +07:00 |
_tokenizer_exceptions_list.py
|
updated tokenizer exceptions
|
2017-07-26 19:12:52 +07:00 |
lemmatizer.py
|
added wip lemma dict
|
2017-07-26 21:39:54 +07:00 |
lex_attrs.py
|
added lex_attrs
|
2017-07-23 22:55:22 +07:00 |
norm_exceptions.py
|
added known currencies
|
2017-07-23 22:56:48 +07:00 |
punctuation.py
|
removed -el from suffix rules
|
2017-07-26 19:28:38 +07:00 |
stop_words.py
|
added stopwords
|
2017-07-23 20:52:37 +07:00 |
tokenizer_exceptions.py
|
added hyphen-suffix rules
|
2017-07-26 19:28:57 +07:00 |