mirror of https://github.com/explosion/spaCy.git
add dot after some abbrevs
This commit is contained in:
parent
b0b66fbab4
commit
54fcc5bba2
|
@ -4,15 +4,19 @@ from ..tokenizer_exceptions import BASE_EXCEPTIONS
|
||||||
|
|
||||||
_exc = {
|
_exc = {
|
||||||
"St": [{ORTH: "St", NORM: "Saint"}],
|
"St": [{ORTH: "St", NORM: "Saint"}],
|
||||||
|
"St.": [{ORTH: "St.", NORM: "Saint"}],
|
||||||
"Ste": [{ORTH: "Ste", NORM: "Sainte"}],
|
"Ste": [{ORTH: "Ste", NORM: "Sainte"}],
|
||||||
"Mme": [{ORTH: "Mme", NORM: "Madame"}],
|
"Mme": [{ORTH: "Mme", NORM: "Madame"}],
|
||||||
"Mr": [{ORTH: "Mr", NORM: "Monsieur"}],
|
"Mr": [{ORTH: "Mr", NORM: "Monsieur"}],
|
||||||
|
"Mr.": [{ORTH: "Mr.", NORM: "Monsieur"}],
|
||||||
"M.": [{ORTH: "M.", NORM: "Monsieur"}],
|
"M.": [{ORTH: "M.", NORM: "Monsieur"}],
|
||||||
"Mlle": [{ORTH: "Mlle", NORM: "Mademoiselle"}],
|
"Mlle": [{ORTH: "Mlle", NORM: "Mademoiselle"}],
|
||||||
"Dr": [{ORTH: "Dr", NORM: "Docteur"}],
|
"Dr": [{ORTH: "Dr", NORM: "Docteur"}],
|
||||||
|
"Dr.": [{ORTH: "Dr.", NORM: "Docteur"}],
|
||||||
"Dresse": [{ORTH: "Dresse", NORM: "Doctoresse"}],
|
"Dresse": [{ORTH: "Dresse", NORM: "Doctoresse"}],
|
||||||
"Drsse": [{ORTH: "Drsse", NORM: "Doctoresse"}],
|
"Drsse": [{ORTH: "Drsse", NORM: "Doctoresse"}],
|
||||||
"etc": [{ORTH: "etc", NORM: "etcaetera"}],
|
"etc": [{ORTH: "etc", NORM: "etcaetera"}],
|
||||||
|
"etc.": [{ORTH: "etc.", NORM: "etcaetera"}],
|
||||||
# months
|
# months
|
||||||
"jan.": [{ORTH: "jan.", NORM: "janvier"}],
|
"jan.": [{ORTH: "jan.", NORM: "janvier"}],
|
||||||
"janv.": [{ORTH: "janv.", NORM: "janvier"}],
|
"janv.": [{ORTH: "janv.", NORM: "janvier"}],
|
||||||
|
|
Loading…
Reference in New Issue