mirror of https://github.com/explosion/spaCy.git
Bugfix textcat reproducibility on GPU (#6411)
* add seed argument to ParametricAttention layer
* bump thinc to 7.4.3
* set thinc version range

Co-authored-by: Adriane Boyd <adrianeboyd@gmail.com>

parent cdca44ac11
commit 2af31a8c8d
@@ -646,7 +646,7 @@ def build_text_classifier(nr_class, width=64, **cfg):
             SpacyVectors
             >> flatten_add_lengths
             >> with_getitem(0, Affine(width, pretrained_dims))
-            >> ParametricAttention(width)
+            >> ParametricAttention(width, seed=100)
             >> Pooling(sum_pool)
             >> Residual(ReLu(width, width)) ** 2
             >> zero_init(Affine(nr_class, width, drop_factor=0.0))

@@ -688,7 +688,7 @@ def build_text_classifier(nr_class, width=64, **cfg):
     cnn_model = (
         tok2vec
         >> flatten_add_lengths
-        >> ParametricAttention(width)
+        >> ParametricAttention(width, seed=99)
         >> Pooling(sum_pool)
         >> Residual(zero_init(Maxout(width, width)))
         >> zero_init(Affine(nr_class, width, drop_factor=0.0))
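
The two hunks above give each ParametricAttention layer an explicit seed so that building the textcat model is repeatable from run to run, which is what the GPU reproducibility fix needs. A minimal, construction-only sketch of the same pattern follows; it assumes thinc >= 7.4.3 (where ParametricAttention accepts a seed argument) and the thinc v7 import paths used in spacy/_ml.py, and it composes the layers with chain() since the >> operator is only available inside a Model.define_operators block.

# Hedged sketch, not spaCy's own code: the import paths and composition below
# are assumptions based on the thinc v7 module layout used in spacy/_ml.py.
from thinc.t2t import ParametricAttention
from thinc.t2v import Pooling, sum_pool
from thinc.api import chain

width = 64
# Passing an explicit seed makes the layer's initialization repeatable,
# instead of depending on whatever global RNG state exists at build time.
attention_block = chain(
    ParametricAttention(width, seed=100),
    Pooling(sum_pool),
)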

@@ -11,7 +11,6 @@ def test_issue6177():
     # NOTE: no need to transform this code to v3 when 'master' is merged into 'develop'.
     # A similar test exists already for v3: test_issue5551
     # This is just a backport
-
     results = []
     for i in range(3):
         fix_random_seed(0)

@@ -24,9 +23,12 @@ def test_issue6177():
         nlp.add_pipe(textcat)
         for label in set(example[1]["cats"]):
             textcat.add_label(label)
-        nlp.begin_training()
+        # Train
+        optimizer = nlp.begin_training()
+        text, annots = example
+        nlp.update([text], [annots], sgd=optimizer)
         # Store the result of each iteration
-        result = textcat.model.predict([nlp.make_doc(example[0])])
+        result = textcat.model.predict([nlp.make_doc(text)])
         results.append(list(result[0]))

     # All results should be the same because of the fixed seed
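
For reference, the regression check exercised by the test hunks above can be run end to end roughly as follows. This is a hedged, self-contained sketch against the spaCy v2 API: the example text, labels, and the final assertion are illustrative stand-ins rather than the actual contents of the test module, and spacy.require_gpu() can be called first to exercise the GPU code path this fix targets.

import spacy
from spacy.util import fix_random_seed

# Illustrative training example (the real test defines its own text and labels).
example = (
    "This is a text about something.",
    {"cats": {"POSITIVE": 1.0, "NEGATIVE": 0.0}},
)

results = []
for _ in range(3):
    fix_random_seed(0)
    nlp = spacy.blank("en")
    textcat = nlp.create_pipe("textcat")
    nlp.add_pipe(textcat)
    text, annots = example
    for label in annots["cats"]:
        textcat.add_label(label)
    optimizer = nlp.begin_training()
    nlp.update([text], [annots], sgd=optimizer)
    # Score the same doc after one identical update in every iteration
    scores = textcat.model.predict([nlp.make_doc(text)])
    results.append(list(scores[0]))

# With seeded ParametricAttention layers, each run should produce the same scores
assert results[0] == results[1] == results[2]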