Correction of default lemmatizer lookup in English (Issue #4104) #4110

Merged: 6 commits, merged Aug 15, 2019

Changes from 3 commits
5 changes: 3 additions & 2 deletions spacy/lang/en/lemmatizer/lookup.py

@@ -11558,7 +11558,7 @@
     "drunker": "drunk",
     "drunkest": "drunk",
     "drunks": "drunk",
-    "dry": "spin-dry",
+    "dry": "dry",
     "dry-cleaned": "dry-clean",
     "dry-cleaners": "dry-cleaner",
     "dry-cleaning": "dry-clean",
@@ -35294,7 +35294,8 @@
     "spryer": "spry",
     "spryest": "spry",
     "spuds": "spud",
-    "spun": "spin-dry",
+    "spun": "spin",
+    "spun-dry": "spin-dry",
     "spunkier": "spunky",
     "spunkiest": "spunky",
     "spunks": "spunk",
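The corrected entries above illustrate how spaCy's lookup lemmatizer works: the lemma is a plain dictionary lookup keyed on the surface form, so a single wrong entry miscorrects every occurrence of that word. A minimal self-contained sketch (the `LOOKUP` table and `lemmatize` helper here are illustrative, not spaCy's actual API):

```python
# Tiny excerpt mirroring the corrected entries from lookup.py.
LOOKUP = {
    "dry": "dry",            # was "spin-dry" before this fix
    "spun": "spin",          # was "spin-dry" before this fix
    "spun-dry": "spin-dry",  # newly added entry
}


def lemmatize(word):
    # Lookup lemmatization: fall back to the surface form when the
    # word has no entry in the table.
    return LOOKUP.get(word, word)


print([lemmatize(w) for w in ["dry", "spun", "spun-dry"]])
# → ['dry', 'spin', 'spin-dry']
```

Before this fix, the same lookup would have returned "spin-dry" for both "dry" and "spun".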
13 changes: 13 additions & 0 deletions spacy/tests/regression/test_issue4104.py

@@ -0,0 +1,13 @@
+# coding: utf8
+from __future__ import unicode_literals
+
+import pytest
+from ..util import get_doc
+
+@pytest.mark.parametrize('text', ['dry spun spun-dry'])
Member:

Not sure we need to parametrize here, because the expected values are hard-coded into the test anyway, so there's no real motivation to try out different words. Feel free to move the string 'dry spun spun-dry' into the function.

+def test_issue4104(en_tokenizer, en_vocab, text):
+    """Test that English lookup lemmatization of spun & dry are correct"""
+    doc = get_doc(en_vocab, [t for t in text.split(" ")])
+    expected = {'dry': 'dry', 'spun': 'spin', 'spun-dry': 'spin-dry'}
+    assert [token.lemma_ for token in doc] == list(expected.values())
Member:

Thanks for adding the test! Looks like this one failed on Python 3.5 because dicts aren't ordered yet, so values() returns the values in a different order. (Totally not your fault btw, it's not exactly intuitive.) Calling sorted() around both lists should resolve this and make sure the order is always the same.
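The ordering issue the reviewer describes can be shown in isolation. Before Python 3.7, dict iteration order is not guaranteed, so comparing token lemmas positionally against `expected.values()` can fail even when the lemmas themselves are correct; sorting both sides removes the ordering assumption. A small sketch (the `lemmas` list stands in for the lemmas the test's `doc` would produce):

```python
# What the doc would produce (order follows the input text).
lemmas = ["dry", "spin", "spin-dry"]

# Expected lemmas keyed by surface form; on Python < 3.7 the iteration
# order of values() is not guaranteed to match insertion order.
expected = {"dry": "dry", "spun": "spin", "spun-dry": "spin-dry"}

# Order-insensitive comparison, as the reviewer suggests.
assert sorted(lemmas) == sorted(expected.values())
```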

Contributor Author:

Thanks. I went ahead and streamlined the test to not parametrize the string and to compare it directly against a list of expected results.
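The streamlined shape the author describes might look like the sketch below. It is self-contained for illustration: a stub `LOOKUP` table stands in for spaCy's `en_vocab`/`get_doc` test fixtures, and the merged test may differ in detail. The point is the structure: no parametrization, and a direct comparison against a list of expected lemmas, which also sidesteps the dict-ordering problem.

```python
# Stub lookup table standing in for the English lemmatizer fixtures.
LOOKUP = {"dry": "dry", "spun": "spin", "spun-dry": "spin-dry"}


def test_issue4104():
    """English lookup lemmatization of dry, spun, and spun-dry is correct."""
    text = "dry spun spun-dry"
    lemmas = [LOOKUP.get(t, t) for t in text.split(" ")]
    # Direct list comparison: order is fixed by the input text.
    assert lemmas == ["dry", "spin", "spin-dry"]


test_issue4104()
```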