From cd5af72c9af469bd55bcb4bc27a94db61c448919 Mon Sep 17 00:00:00 2001 From: Adriane Boyd Date: Sun, 19 Jul 2020 11:09:49 +0200 Subject: [PATCH] Update pkuseg version (#5774) * Update pkuseg version in Chinese tokenizer warnings * Update pkuseg version in `Makefile` * Remove warning about python3.8 wheels in docs --- Makefile | 4 ++-- spacy/lang/zh/__init__.py | 2 +- website/docs/usage/models.md | 12 ------------ 3 files changed, 3 insertions(+), 15 deletions(-) diff --git a/Makefile b/Makefile index 865bf44c5..6c0a59ba8 100644 --- a/Makefile +++ b/Makefile @@ -5,7 +5,7 @@ VENV := ./env$(PYVER) version := $(shell "bin/get-version.sh") dist/spacy-$(version).pex : wheelhouse/spacy-$(version).stamp - $(VENV)/bin/pex -f ./wheelhouse --no-index --disable-cache -m spacy -o $@ spacy==$(version) jsonschema spacy-lookups-data jieba pkuseg==0.0.22 sudachipy sudachidict_core + $(VENV)/bin/pex -f ./wheelhouse --no-index --disable-cache -m spacy -o $@ spacy==$(version) jsonschema spacy-lookups-data jieba pkuseg==0.0.25 sudachipy sudachidict_core chmod a+rx $@ cp $@ dist/spacy.pex @@ -15,7 +15,7 @@ dist/pytest.pex : wheelhouse/pytest-*.whl wheelhouse/spacy-$(version).stamp : $(VENV)/bin/pex setup.py spacy/*.py* spacy/*/*.py* $(VENV)/bin/pip wheel . -w ./wheelhouse - $(VENV)/bin/pip wheel jsonschema spacy-lookups-data jieba pkuseg==0.0.22 sudachipy sudachidict_core -w ./wheelhouse + $(VENV)/bin/pip wheel jsonschema spacy-lookups-data jieba pkuseg==0.0.25 sudachipy sudachidict_core -w ./wheelhouse touch $@ wheelhouse/pytest-%.whl : $(VENV)/bin/pex diff --git a/spacy/lang/zh/__init__.py b/spacy/lang/zh/__init__.py index 9d1cb71a7..9f8a82c10 100644 --- a/spacy/lang/zh/__init__.py +++ b/spacy/lang/zh/__init__.py @@ -16,7 +16,7 @@ from .tag_map import TAG_MAP from ... import util -_PKUSEG_INSTALL_MSG = "install it with `pip install pkuseg==0.0.22` or from https://github.com/lancopku/pkuseg-python" +_PKUSEG_INSTALL_MSG = "install it with `pip install pkuseg==0.0.25` or from https://github.com/lancopku/pkuseg-python" def try_jieba_import(use_jieba): diff --git a/website/docs/usage/models.md b/website/docs/usage/models.md index b11e6347a..cc65dad68 100644 --- a/website/docs/usage/models.md +++ b/website/docs/usage/models.md @@ -117,18 +117,6 @@ The Chinese language class supports three word segmentation options: better segmentation for Chinese OntoNotes and the new [Chinese models](/models/zh). - - -Note that [`pkuseg`](https://github.com/lancopku/pkuseg-python) doesn't yet ship -with pre-compiled wheels for Python 3.8. If you're running Python 3.8, you can -install it from our fork and compile it locally: - -```bash -$ pip install https://github.com/honnibal/pkuseg-python/archive/master.zip -``` - - - The `meta` argument of the `Chinese` language class supports the following