-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDockerfile
18 lines (14 loc) · 1.26 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
FROM elasticsearch:7.3.1
WORKDIR /usr/share/elasticsearch
RUN elasticsearch-plugin install https://github.com/vhyza/elasticsearch-analysis-lemmagen/releases/download/v7.3.1/elasticsearch-analysis-lemmagen-7.3.1-plugin.zip
RUN mkdir -p config/lemmagen
RUN curl -Lso config/lemmagen/sk.lem https://github.com/vhyza/lemmagen-lexicons/raw/master/free/lexicons/sk.lem
RUN curl -Lso config/lemmagen/cs.lem https://github.com/vhyza/lemmagen-lexicons/raw/master/free/lexicons/cs.lem
RUN curl -Lso config/lemmagen/en.lem https://github.com/vhyza/lemmagen-lexicons/raw/master/free/lexicons/en.lem
# grab sng elasticsearch repository - will make proper directory structure inside config
RUN curl -Ls https://github.com/SlovakNationalGallery/elasticsearch-slovencina/archive/master.tar.gz | tar xz -C config --strip-components=1
# grab extra synonym files and save them inside config/synonyms
RUN curl -Lso config/synonyms/synonyms_cz.txt https://sites.google.com/site/kevinbouge/synonyms-lists/synonyms_cz.txt
RUN curl -Ls http://wordnetcode.princeton.edu/3.0/WNprolog-3.0.tar.gz | tar xz -C config/synonyms --strip-components=1 prolog/wn_s.pl
# grab extra stop-words files
RUN curl -Lso config/stop-words/stop-words-czech2.txt https://sites.google.com/site/kevinbouge/stopwords-lists/stopwords_cz.txt