From 9efe5681778ff37188d166b7dee0819875891c2e Mon Sep 17 00:00:00 2001
From: Matthew Honnibal
Date: Wed, 2 Nov 2016 12:31:34 +0100
Subject: [PATCH] Add missing unicode_literals to spacy.util. I think this was messing up the tokenizer regex for non-ascii characters in Python 2. Re Issue #596

---
 spacy/util.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/spacy/util.py b/spacy/util.py
index ee285cf80..cecbcfab6 100644
--- a/spacy/util.py
+++ b/spacy/util.py
@@ -1,3 +1,4 @@
+from __future__ import unicode_literals
 import os
 import io
 import json