2014-09-25 16:29:42 +00:00
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
|
|
|
from spacy.en import *
|
2014-10-09 21:11:31 +00:00
|
|
|
from spacy.lexeme import *
|
2014-09-25 16:29:42 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_alpha():
    """Check bit ``IS_ALPHA`` in the ``'flags'`` entry of three lexicon items.

    The bit must be set for ``'the'`` and clear for both ``'1999'`` and
    ``'hello1'``.
    """
    # Letters only: the flag is expected to be on.
    article = EN.lexicon['the']
    alpha_mask = 1 << IS_ALPHA
    assert article['flags'] & alpha_mask

    # Digits only: the flag is expected to be off.
    number = EN.lexicon['1999']
    assert not (number['flags'] & alpha_mask)

    # Letters followed by a digit: the flag is expected to be off.
    alnum = EN.lexicon['hello1']
    assert not (alnum['flags'] & alpha_mask)
|
2014-09-25 16:29:42 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_is_digit():
    """Check bit ``IS_DIGIT`` in the ``'flags'`` entry of three lexicon items.

    The bit must be set for ``'1999'`` and clear for both ``'the'`` and
    ``'hello1'``.
    """
    # Letters only: the flag is expected to be off.
    article = EN.lexicon['the']
    digit_mask = 1 << IS_DIGIT
    assert not (article['flags'] & digit_mask)

    # Digits only: the flag is expected to be on.
    number = EN.lexicon['1999']
    assert number['flags'] & digit_mask

    # Letters followed by a digit: the flag is expected to be off.
    alnum = EN.lexicon['hello1']
    assert not (alnum['flags'] & digit_mask)
|