You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@beam.apache.org by em...@apache.org on 2021/08/31 21:12:51 UTC
[beam] branch master updated: sync nltk, orjson for Python image
This is an automated email from the ASF dual-hosted git repository.
emilyye pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/beam.git
The following commit(s) were added to refs/heads/master by this push:
new 99b5bfa sync nltk, orjson for Python image
new ff70e74 Merge pull request #15326 from emilymye/importsync
99b5bfa is described below
commit 99b5bfa4f3603ff9bd0d4adf374bd4b5adcb436e
Author: Emily Ye <em...@google.com>
AuthorDate: Thu Aug 12 12:01:57 2021 -0700
sync nltk, orjson for Python image
---
sdks/python/container/Dockerfile | 2 ++
sdks/python/container/base_image_requirements.txt | 3 ++-
2 files changed, 4 insertions(+), 1 deletion(-)
diff --git a/sdks/python/container/Dockerfile b/sdks/python/container/Dockerfile
index 359ca2c..f517dc1 100644
--- a/sdks/python/container/Dockerfile
+++ b/sdks/python/container/Dockerfile
@@ -43,6 +43,8 @@ RUN apt-get update && \
COPY target/base_image_requirements.txt /tmp/base_image_requirements.txt
RUN \
pip install -r /tmp/base_image_requirements.txt && \
+ python -c "import nltk; nltk.download('stopwords')" && \
+ rm /root/nltk_data/corpora/stopwords.zip && \
# Check that the fast implementation of protobuf is used.
python -c "from google.protobuf.internal import api_implementation; assert api_implementation._default_implementation_type == 'cpp'; print ('Verified fast protobuf used.')" && \
# Remove pip cache.
diff --git a/sdks/python/container/base_image_requirements.txt b/sdks/python/container/base_image_requirements.txt
index c627b4e..a5ed07d 100644
--- a/sdks/python/container/base_image_requirements.txt
+++ b/sdks/python/container/base_image_requirements.txt
@@ -68,7 +68,7 @@ cachetools == 3.1.1
dataclasses == 0.8 ; python_version=="3.6"
guppy3==3.0.10
mmh3==2.5.1
-orjson==3.5.3
+orjson==3.6.1
python-dateutil == 2.8.1
requests == 2.24.0
freezegun == 0.3.15
@@ -82,6 +82,7 @@ pandas==1.2.4 ; python_version>="3.7"
protorpc==0.12.0
python-gflags==3.1.2
tensorflow==2.5.0
+nltk==3.5.0
# Packages needed for testing.
tenacity>=5.0.2