From ca89fd09193ba4814a7a899c708eabdbf1f64695 Mon Sep 17 00:00:00 2001 From: Matthew Honnibal Date: Wed, 19 Oct 2016 19:37:09 +0200 Subject: [PATCH] Update Keras deep learning tutorial --- examples/deep_learning_keras.py | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/examples/deep_learning_keras.py b/examples/deep_learning_keras.py index ede640f71..368126da6 100644 --- a/examples/deep_learning_keras.py +++ b/examples/deep_learning_keras.py @@ -14,7 +14,7 @@ class SentimentAnalyser(object): def __call__(self, doc): X = get_features([doc], self.max_length) - y = self._keras_model.predict(X) + y = self._model.predict(X) self.set_sentiment(doc, y) def pipe(self, docs, batch_size=1000, n_threads=2): @@ -28,6 +28,13 @@ class SentimentAnalyser(object): doc.user_data['sentiment'] = y +def get_features(docs, max_length): + Xs = numpy.zeros(len(docs), max_length, dtype='int32') + for i, doc in enumerate(minibatch): + for j, token in enumerate(doc[:max_length]): + Xs[i, j] = token.rank if token.has_vector else 0 + return Xs + def compile_lstm(embeddings, shape, settings, optimizer): model = Sequential() model.add( @@ -59,14 +66,6 @@ def get_embeddings(vocab): return vectors -def get_features(docs, max_length): - Xs = numpy.zeros(len(docs), max_length, dtype='int32') - for i, doc in enumerate(minibatch): - for j, token in enumerate(doc[:max_length]): - Xs[i, j] = token.rank if token.has_vector else 0 - return Xs - - def train(train_texts, train_labels, dev_texts, dev_labels, lstm_shape, lstm_settings, lstm_optimizer, batch_size=100, nb_epoch=5): nlp = spacy.load('en', parser=False, tagger=False, entity=False)