From 4ff180db7404e703c49c06c4f155d637985953b0 Mon Sep 17 00:00:00 2001 From: Matthew Honnibal Date: Fri, 30 Jan 2015 12:49:33 +1100 Subject: [PATCH] * Fix off-by-one error in commit 0a7fceb --- spacy/tokenizer.pyx | 2 -- 1 file changed, 2 deletions(-) diff --git a/spacy/tokenizer.pyx b/spacy/tokenizer.pyx index 0f96c058e..1f7228c9b 100644 --- a/spacy/tokenizer.pyx +++ b/spacy/tokenizer.pyx @@ -179,8 +179,6 @@ cdef class Tokenizer: idx = tokens.data[tokens.length - 1].idx # Increment by last length idx += tokens.data[tokens.length - 1].lex.length - # Add 1 for space - idx += 1 else: split = self._find_infix(string.chars, string.n) if split == 0 or split == -1: