Philipp Horstenkamp 066800123d
Created pipeline to run ner sentiment and sql ingest (#314)
Created a data-processing pipeline that enhances the raw mined data with
organisation extraction and sentiment analysis prior to moving the data
to the SQL DB.
The transfer of matched data is done afterwards.

---------

Co-authored-by: SeZett <zeleny.sebastian@fh-swf.de>
2023-11-11 13:28:12 +00:00

50 lines
1.2 KiB
Docker

# Shared base stage: Python runtime, OS-level tools and the core project wheel.
# The later stages in this file build on top of it and add their own extras.
FROM python:3.11-slim AS base
LABEL AUTHOR="AKI Projektseminar 23" \
      PROJECT="Transparenzregister" \
      ORGANISATION="fh-swf.de"
ENV SQLALCHEMY_SILENCE_UBER_WARNING="1"
ARG APP_HOME="transparenzregister"
WORKDIR /${APP_HOME}/
USER root
# Use apt-get rather than apt: apt's command-line interface is meant for
# interactive use and warns when it is driven from a script.
# The package index is removed in the same layer so it never reaches the image.
RUN apt-get update -y && \
    apt-get install -y git sqlite3 && \
    rm -rf /var/lib/apt/lists/*
# The wheel(s) stay in dist/ so that derived stages can install extras from them.
COPY dist/*.whl dist/
RUN pip install --find-links=dist aki-prj23-transparenzregister --no-cache-dir
# GIT_HASH differs for every commit. Declaring it after the package-install
# layers keeps those layers cacheable; the resulting ENV and LABEL are
# unchanged and are still inherited by every stage built FROM base.
ARG GIT_HASH
ENV GIT_HASH=${GIT_HASH}
LABEL GIT_HASH=${GIT_HASH}
# Data-ingestor image: the base stage plus the project's "ingest" extra.
FROM base AS ingest
LABEL PART="DATA_INGESTOR"
# The requirement is quoted so the shell cannot interpret [ingest] as a glob
# pattern. dist/ is removed once the extra is installed; note that the wheel
# copied during the base stage still exists in that earlier layer.
RUN pip install --find-links=dist "aki-prj23-transparenzregister[ingest]" --no-cache-dir && \
    rm -R dist/
# Data-transformation image: the base stage plus the "transformation" extra.
FROM base AS data-transformation
LABEL PART="DATA-TRANSFORMATION"
# The requirement is quoted so the shell cannot interpret [transformation] as
# a glob pattern. dist/ is removed once the extra is installed; note that the
# wheel copied during the base stage still exists in that earlier layer.
RUN pip install --find-links=dist "aki-prj23-transparenzregister[transformation]" --no-cache-dir && \
    rm -R dist/
# Exec form: the process is started directly, without a wrapping shell.
# CMD supplies default arguments that can be replaced at `docker run` time.
ENTRYPOINT ["data-processing", "ENV"]
CMD ["--level", "DEBUG"]
# Web-server image: the base stage plus the "web-server" extra.
FROM base AS web-server
LABEL PART="WEB-SERVER"
# The requirement is quoted so the shell cannot interpret [web-server] as a
# glob pattern. dist/ is removed once the extra is installed; note that the
# wheel copied during the base stage still exists in that earlier layer.
RUN pip install --find-links=dist "aki-prj23-transparenzregister[web-server]" --no-cache-dir && \
    rm -R dist/
ENV DASH_URL_BASE_PATHNAME="/transparenzregister/"
# Exec form: the process is started directly, without a wrapping shell.
# CMD supplies default arguments that can be replaced at `docker run` time.
ENTRYPOINT ["webserver", "ENV"]
CMD ["--level", "DEBUG"]