mirror of
https://github.com/fhswf/aki_prj23_transparenzregister.git
synced 2025-04-24 21:22:34 +02:00
Created a data-processing pipeline that enhances the raw mined data with organisation extraction and sentiment analysis prior to moving the data to the SQL DB. The transfer of matched data is done afterwards. --------- Co-authored-by: SeZett <zeleny.sebastian@fh-swf.de>
50 lines
1.2 KiB
Docker
50 lines
1.2 KiB
Docker
# Shared base stage: OS packages plus the core project wheel.
# Every later stage in this file builds on top of it via `FROM base`.
FROM python:3.11-slim AS base

LABEL AUTHOR="AKI Projektseminar 23" \
      PROJECT="Transparenzregister" \
      ORGANISATION="fh-swf.de"

# Presumably silences SQLAlchemy's 2.0-migration deprecation notice at runtime
# (see the SQLAlchemy 1.4 docs for SQLALCHEMY_SILENCE_UBER_WARNING) - confirm.
ENV SQLALCHEMY_SILENCE_UBER_WARNING="1"

# Name of the application directory; becomes the working directory below.
ARG APP_HOME="transparenzregister"

WORKDIR /${APP_HOME}/

# NOTE(review): every stage derived from this one keeps running as root.
# Consider creating a dedicated non-root user once the writable paths are known.
USER root

# `apt-get` is used instead of `apt` because only the former offers a stable
# command-line interface for scripts. Recommended packages are skipped to keep
# the image small; ca-certificates is listed explicitly so that git over HTTPS
# keeps working without relying on git's recommended packages.
# The package index is removed in the same layer that created it.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        git \
        sqlite3 && \
    rm -rf /var/lib/apt/lists/*

# The wheels are expected to have been built into ./dist before `docker build`.
COPY dist/*.whl dist/

# Install the project without extras; each derived stage adds its own extra.
RUN pip install --no-cache-dir --find-links=dist aki-prj23-transparenzregister

# The commit hash changes on every build, so it is declared as late as possible
# in this stage: the OS-package layer above stays cacheable. Derived stages
# still inherit both the environment variable and the label.
ARG GIT_HASH
ENV GIT_HASH=${GIT_HASH}
LABEL GIT_HASH=${GIT_HASH}
# Data-ingestion image: the base stage plus the project's `ingest` extra.
FROM base AS ingest

LABEL PART="DATA_INGESTOR"

# The requirement is quoted so the shell never treats `[ingest]` as a glob
# pattern. The wheel directory is dropped afterwards so it is not visible in
# the final filesystem.
# NOTE(review): the wheels still occupy space in the inherited layer created by
# the COPY in the base stage; deleting them here does not shrink the image.
RUN pip install --no-cache-dir --find-links=dist "aki-prj23-transparenzregister[ingest]" && \
    rm -rf dist/
# Data-transformation image: the base stage plus the `transformation` extra.
FROM base AS data-transformation

LABEL PART="DATA-TRANSFORMATION"

# The requirement is quoted so the shell never treats `[transformation]` as a
# glob pattern. The wheel directory is dropped afterwards so it is not visible
# in the final filesystem.
# NOTE(review): the wheels still occupy space in the inherited layer created by
# the COPY in the base stage; deleting them here does not shrink the image.
RUN pip install --no-cache-dir --find-links=dist "aki-prj23-transparenzregister[transformation]" && \
    rm -rf dist/

# Runs the `data-processing` command with the fixed argument "ENV"
# (presumably selecting configuration from environment variables - confirm
# against the CLI). CMD supplies default arguments that can be overridden
# at `docker run`.
ENTRYPOINT ["data-processing", "ENV"]
CMD ["--level", "DEBUG"]
# Web-server image: the base stage plus the `web-server` extra.
FROM base AS web-server

LABEL PART="WEB-SERVER"

# The requirement is quoted so the shell never treats `[web-server]` as a glob
# pattern. The wheel directory is dropped afterwards so it is not visible in
# the final filesystem.
# NOTE(review): the wheels still occupy space in the inherited layer created by
# the COPY in the base stage; deleting them here does not shrink the image.
RUN pip install --no-cache-dir --find-links=dist "aki-prj23-transparenzregister[web-server]" && \
    rm -rf dist/

# URL prefix handed to the application through the environment
# (presumably read by Dash as its base pathname - confirm).
ENV DASH_URL_BASE_PATHNAME="/transparenzregister/"

# Runs the `webserver` command with the fixed argument "ENV"; CMD supplies
# default arguments that can be overridden at `docker run`.
ENTRYPOINT ["webserver", "ENV"]
CMD ["--level", "DEBUG"]