Update tokenizer_exceptions.py

See https://github.com/explosion/spaCy/pull/6643
This commit is contained in:
Adam Bittlingmayer 2020-12-29 16:05:11 +04:00 committed by GitHub
parent 5ca57d8221
commit f2fe60bacf
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 7 additions and 2 deletions

View File

@@ -51,6 +51,9 @@ for orth in [
"Dr.", "Dr.",
"Dra.", "Dra.",
"EE.UU.", "EE.UU.",
"Ee.Uu.",
"UU.", # For "EE. UU."
"Uu.", # For "Ee. Uu."
"etc.", "etc.",
"fig.", "fig.",
"Gob.", "Gob.",
@@ -65,9 +68,11 @@ for orth in [
"Prof.", "Prof.",
"Profa.", "Profa.",
"q.e.p.d.", "q.e.p.d.",
"Q.E.P.D." "S.A.", "Q.E.P.D.",
"S.A.",
"S.L.", "S.L.",
"S.R.L." "s.s.s.", "S.R.L.",
"s.s.s.",
"Sr.", "Sr.",
"Sra.", "Sra.",
"Srta.", "Srta.",