mirror of
https://gitlab.ub.uni-bielefeld.de/sfb1288inf/nlp.git
synced 2024-12-26 08:04:17 +00:00
55 lines
1.7 KiB
Docker
55 lines
1.7 KiB
Docker
FROM debian:10-slim
|
|
|
|
|
|
LABEL authors="Patrick Jentsch <p.jentsch@uni-bielefeld.de>, Stephan Porada <sporada@uni-bielefeld.de>"
|
|
|
|
|
|
ENV LANG=C.UTF-8
|
|
|
|
|
|
RUN apt-get update
|
|
|
|
|
|
## Install pyFlow ##
|
|
ENV PYFLOW_RELEASE=1.1.20
|
|
ADD "https://github.com/Illumina/pyflow/releases/download/v${PYFLOW_RELEASE}/pyflow-${PYFLOW_RELEASE}.tar.gz" .
|
|
RUN tar -xzf "pyflow-${PYFLOW_RELEASE}.tar.gz" \
|
|
&& cd "pyflow-${PYFLOW_RELEASE}" \
|
|
&& apt-get install -y --no-install-recommends \
|
|
python2.7 \
|
|
&& python2.7 setup.py build install \
|
|
&& cd .. \
|
|
&& rm -r "pyflow-${PYFLOW_RELEASE}" "pyflow-${PYFLOW_RELEASE}.tar.gz"
|
|
|
|
|
|
## Install Pipeline ##
|
|
ENV SPACY_VERSION=2.3.2
|
|
ENV SPACY_MODELS_VERSION=2.3.0
|
|
RUN apt-get install -y --no-install-recommends \
|
|
python3.7 \
|
|
python3-pip \
|
|
zip \
|
|
&& pip3 install \
|
|
chardet \
|
|
setuptools \
|
|
wheel \
|
|
&& pip3 install "spacy==${SPACY_VERSION}" \
|
|
&& python3 -m spacy download "de_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "el_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "en_core_web_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "es_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "fr_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "it_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "nl_core_news_md-${SPACY_MODELS_VERSION}" --direct \
|
|
&& python3 -m spacy download "pt_core_news_md-${SPACY_MODELS_VERSION}" --direct
|
|
COPY nlp /usr/local/bin
|
|
COPY spacy-nlp /usr/local/bin
|
|
|
|
|
|
## Cleanup ##
|
|
RUN rm -r /var/lib/apt/lists/*
|
|
|
|
|
|
ENTRYPOINT ["nlp"]
|
|
CMD ["--help"]
|