From 45ec92243a42381e21988081105a525da81d1821 Mon Sep 17 00:00:00 2001
From: Matthew Honnibal
Date: Sat, 6 Jun 2015 05:56:00 +0200
Subject: [PATCH] * Add hyphenation rule to infix.txt for tokenizer

---
Review note: the lookahead class of the new rule was written as [a-zA-z].
The range A-z also covers the ASCII characters [ \ ] ^ _ and backtick, so a
hyphen followed by any of those was treated as an infix. It is corrected to
[a-zA-Z] below so both sides of the hyphen require an ASCII letter.
NOTE(review): the post-image blob id on the "index" line was computed for
the uncorrected content -- regenerate the patch if it must match exactly.

 lang_data/en/infix.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/lang_data/en/infix.txt b/lang_data/en/infix.txt
index 28169ecbb..b32be4c07 100644
--- a/lang_data/en/infix.txt
+++ b/lang_data/en/infix.txt
@@ -1 +1,2 @@
 (?<=[a-z])\.(?=[A-Z])
+(?<=[a-zA-Z])-(?=[a-zA-Z])