nlp/Dockerfile

62 lines
1.9 KiB
Docker
Raw Normal View History

2020-10-08 23:17:58 +02:00
# Base image: the slim variant of Debian "buster".
# The python2.7 and python3.7 packages installed further down come from this
# release's apt repositories, so changing the tag also changes what those
# install steps can resolve.
FROM debian:buster-slim
2019-02-06 16:58:17 +01:00
2019-09-11 13:20:07 +02:00
2021-02-25 11:26:11 +01:00
# Image metadata: names and contact addresses of the image authors.
LABEL authors="Patrick Jentsch <p.jentsch@uni-bielefeld.de>, Stephan Porada <porada@posteo.de>"
2019-02-06 16:58:17 +01:00
2019-09-11 13:20:07 +02:00
2019-09-12 11:42:42 +02:00
# Set the locale to C.UTF-8. ENV values apply to every following build step
# and remain set in containers started from the image.
# NOTE(review): presumably needed so the Python tooling defaults to UTF-8 for
# text I/O - confirm against the pipeline scripts.
ENV LANG=C.UTF-8
2021-02-25 11:26:11 +01:00
# Fetch the apt package index. The `apt-get install` calls further down rely
# on the lists downloaded here; they are deleted again at the end of the file.
# NOTE(review): as a separate layer this step can be served from the build
# cache, so later install steps may see an outdated index.
RUN apt-get update
2020-10-08 23:08:49 +02:00
# Install pipeline dependencies #
2020-09-23 15:26:53 +02:00
## Install pyFlow ##
# pyFlow release that is downloaded from the Illumina/pyflow GitHub releases
# and installed with the Python 2.7 interpreter.
ENV PYFLOW_RELEASE=1.1.20
# The release tarball is placed in the current directory of the image.
# NOTE(review): the download is not integrity-checked; once the expected
# digest is known, prefer `ADD --checksum=sha256:...` (BuildKit).
ADD "https://github.com/Illumina/pyflow/releases/download/v${PYFLOW_RELEASE}/pyflow-${PYFLOW_RELEASE}.tar.gz" .
# `apt-get update` runs in the same layer as `apt-get install` so the install
# never depends on a package index cached by an earlier layer.
# The package lists are deliberately kept: a later step in this file still
# calls `apt-get install`, and the lists are removed at the end of the file.
# After installation the unpacked sources and the tarball are deleted.
RUN apt-get update \
    && apt-get install --no-install-recommends --yes \
         python2.7 \
    && tar -xzf "pyflow-${PYFLOW_RELEASE}.tar.gz" \
    && cd "pyflow-${PYFLOW_RELEASE}" \
    && python2.7 setup.py build install \
    && cd .. \
    && rm -r "pyflow-${PYFLOW_RELEASE}" "pyflow-${PYFLOW_RELEASE}.tar.gz"
2020-04-06 09:21:38 +02:00
2020-10-08 23:08:49 +02:00
## Install spaCy ##
# spaCy version installed from PyPI.
ENV SPACY_VERSION=3.0.3
# Installs Python 3.7, pip and zip from apt, then the Python build helpers,
# then upgrades pip itself before installing the pinned spaCy release.
# - `apt-get update` runs in the same layer as `apt-get install` so the
#   install never depends on a package index cached by an earlier layer.
# - `--no-cache-dir` keeps pip's download cache out of the image layer.
# - The apt package lists are deliberately kept: the final cleanup step of
#   this file removes them with a plain `rm -r`, which needs them to exist.
RUN apt-get update \
    && apt-get install --no-install-recommends --yes \
         python3.7 \
         python3-pip \
         zip \
    && pip3 install --no-cache-dir \
         chardet \
         setuptools \
         wheel \
    && pip3 install --no-cache-dir --upgrade pip \
    && pip3 install --no-cache-dir "spacy==${SPACY_VERSION}"
# Version suffix shared by every spaCy model package downloaded below.
ENV SPACY_MODELS_VERSION=3.0.0
# Download the medium-sized model for each supported language, one after the
# other. `set -e` aborts the step on the first failing download.
RUN set -e; \
    for model_name in \
        da_core_news_md \
        de_core_news_md \
        el_core_news_md \
        en_core_web_md \
        es_core_news_md \
        fr_core_news_md \
        it_core_news_md \
        nl_core_news_md \
        pt_core_news_md \
        ru_core_news_md \
        zh_core_web_md \
    ; do \
        python3 -m spacy download "${model_name}-${SPACY_MODELS_VERSION}" --direct; \
    done
2019-02-06 16:58:17 +01:00
2019-09-11 13:34:01 +02:00
2020-10-08 23:08:49 +02:00
## Install Pipeline ##
# Copy the two pipeline executables from the build context into a directory
# of the image that holds locally installed programs.
COPY ["nlp", "spacy-nlp", "/usr/local/bin/"]
2020-09-23 15:26:53 +02:00
2021-02-25 11:26:11 +01:00
# Delete the apt package lists downloaded by `apt-get update`.
# NOTE(review): this runs in its own layer, so the files are hidden in the
# final filesystem but still stored in the earlier layers; the image does not
# get smaller. `rm -r` without `-f` also fails if the directory is empty.
RUN rm -r /var/lib/apt/lists/*
2019-05-20 11:28:51 +02:00
# Start the `nlp` executable (copied to /usr/local/bin/ above) as the
# container's main process. Exec form: no shell is involved.
ENTRYPOINT ["nlp"]
2019-09-11 13:20:07 +02:00
# Default argument handed to the entrypoint when `docker run` is given no
# arguments of its own.
CMD ["--help"]