From f8b0e77352f4b911626bba07dffac8d2ac1b3371 Mon Sep 17 00:00:00 2001
From: mhabsaoui
Date: Mon, 3 Jun 2019 06:44:49 +0200
Subject: [PATCH] updated TreeTagger with version 3.2.2 and download URLs

---
Reviewer notes (free-form area; git am does not copy it into the commit message):
 * TT_VERSION goes from 3.2.1 to 3.2.2. The tree-tagger tarball URL is built
   from ${TT_VERSION}, so the downloaded archive changes with it.
 * The six parameter files are now fetched as <language>.par.gz instead of
   <language>-par-linux-3.2-utf8.bin.gz.
 * The mv step that renamed <language>-utf8.par to <language>.par is removed,
   and the *-utf8 pattern is dropped from the rm in /opt/treetagger/models/.
 * NOTE(review): blank context lines were placed from the hunk line counts and
   the leading indentation of continuation lines is a guess -- confirm both
   against the target Dockerfile before applying.

 Dockerfile | 22 ++++++++--------------
 1 file changed, 8 insertions(+), 14 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index d86a643..6a7fb15 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -3,7 +3,7 @@ FROM openjdk:8-jre
 LABEL maintainer="Damien Cram "
 
 ENV \
-    TT_VERSION=3.2.1 \
+    TT_VERSION=3.2.2 \
     TERMSUITE_VERSION=3.0.10 \
     TT_URL=http://www.cis.uni-muenchen.de/~schmid/tools/TreeTagger/data
 
@@ -21,12 +21,12 @@ RUN mkdir -p /opt/treetagger/
 WORKDIR /opt/treetagger/
 RUN wget ${TT_URL}/tree-tagger-linux-${TT_VERSION}.tar.gz \
     && wget ${TT_URL}/tagger-scripts.tar.gz \
-    && wget ${TT_URL}/english-par-linux-3.2-utf8.bin.gz \
-    && wget ${TT_URL}/french-par-linux-3.2-utf8.bin.gz \
-    && wget ${TT_URL}/german-par-linux-3.2-utf8.bin.gz \
-    && wget ${TT_URL}/russian-par-linux-3.2-utf8.bin.gz \
-    && wget ${TT_URL}/italian-par-linux-3.2-utf8.bin.gz \
-    && wget ${TT_URL}/spanish-par-linux-3.2-utf8.bin.gz \
+    && wget ${TT_URL}/english.par.gz \
+    && wget ${TT_URL}/french.par.gz \
+    && wget ${TT_URL}/german.par.gz \
+    && wget ${TT_URL}/russian.par.gz \
+    && wget ${TT_URL}/italian.par.gz \
+    && wget ${TT_URL}/spanish.par.gz \
     # && wget http://corpus.leeds.ac.uk/tools/zh/tt-lcmc.tgz \
     && wget ${TT_URL}/install-tagger.sh \
     && sh /opt/treetagger/install-tagger.sh \
@@ -34,13 +34,7 @@ RUN wget ${TT_URL}/tree-tagger-linux-${TT_VERSION}.tar.gz \
     && rm -rf *.gz *.tgz cmd/ doc/
 
 WORKDIR /opt/treetagger/models/
-RUN mv french-utf8.par french.par \
-    && mv english-utf8.par english.par \
-    && mv spanish-utf8.par spanish.par \
-    && mv italian-utf8.par italian.par \
-    && mv russian-utf8.par russian.par \
-    && mv german-utf8.par german.par \
-    && rm *-utf8 *-abbreviations *-mwls *-tokens *.txt \
+RUN rm *-abbreviations *-mwls *-tokens *.txt \
     && chmod a+x /opt/treetagger/models/
 
 WORKDIR /opt/