From cf83b6cc12db38d98e24f8be562b644377a7217a Mon Sep 17 00:00:00 2001
From: Peter Johnson
Date: Tue, 21 May 2024 14:56:58 +0200
Subject: [PATCH] feat(docker): use Senzing model

Download the Senzing v1.1.0 model archives (language classifier,
libpostal data, parser) and unpack them into
/usr/share/libpostal/libpostal/ after removing the language_classifier,
numex, transliteration and address_parser directories.

Downloads use `curl -fsSL` so that an HTTP error is rejected and reported
by curl instead of an error page being piped silently into tar.

---
 Dockerfile | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/Dockerfile b/Dockerfile
index 8120fbf..a576fd6 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -25,6 +25,24 @@ RUN make -j4
 RUN DESTDIR=/libpostal make install
 RUN ldconfig
 
+# Install the Senzing libpostal model (https://github.com/Senzing/libpostal-data).
+# Each step removes existing data directories, then streams a v1.1.0 archive into the data dir.
+
+# language classifier (curl -f: fail on HTTP errors; -S: still print them despite -s)
+RUN rm -rf /usr/share/libpostal/libpostal/language_classifier \
+  && curl -fsSL https://public-read-libpostal-data.s3.amazonaws.com/v1.1.0/language_classifier.tar.gz \
+  | tar zxvf - -C /usr/share/libpostal/libpostal/
+
+# libpostal data (clears numex and transliteration before unpacking)
+RUN rm -rf /usr/share/libpostal/libpostal/numex /usr/share/libpostal/libpostal/transliteration \
+  && curl -fsSL https://public-read-libpostal-data.s3.amazonaws.com/v1.1.0/libpostal_data.tar.gz \
+  | tar zxvf - -C /usr/share/libpostal/libpostal/
+
+# parser (clears address_parser before unpacking)
+RUN rm -rf /usr/share/libpostal/libpostal/address_parser \
+  && curl -fsSL https://public-read-libpostal-data.s3.amazonaws.com/v1.1.0/parser.tar.gz \
+  | tar zxvf - -C /usr/share/libpostal/libpostal/
+
 # main image
 FROM pelias/baseimage
 