From 6bba793df33ee705ba3ea8eb878c8e420befc8cf Mon Sep 17 00:00:00 2001
From: Matthew Honnibal
Date: Sun, 31 May 2015 06:48:43 +0200
Subject: [PATCH] * Disable the Zipf-reweighting thing while investigate effect

---
 spacy/_ml.pyx | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/spacy/_ml.pyx b/spacy/_ml.pyx
index 3a439e2ba..3dffed611 100644
--- a/spacy/_ml.pyx
+++ b/spacy/_ml.pyx
@@ -47,13 +47,15 @@ cdef class Model:
     @cython.cdivision
     @cython.boundscheck(False)
     cdef int regularize(self, Feature* feats, int n, int a=3) except -1:
+        pass
+        # Disable this for now, while we investigate effect.
         # Use the Zipfian corruptions technique from here:
         # http://www.aclweb.org/anthology/N13-1077
         # This seems good for 0.1 - 0.3 % on OOD data.
-        cdef int i
-        cdef long[:] zipfs = numpy.random.zipf(a, n)
-        for i in range(n):
-            feats[i].value *= 1 / zipfs[i]
+        #cdef int i
+        #cdef long[:] zipfs = numpy.random.zipf(a, n)
+        #for i in range(n):
+        #    feats[i].value *= 1 / zipfs[i]
 
     def end_training(self):
         self._model.end_training()