mirror of
https://github.com/open-metadata/OpenMetadata.git
synced 2025-07-04 15:45:42 +00:00

* VERSION - Bump ingestion debian to bookworm * MINOR - Fix collate app yaml reader with unwanted dropwizard java props
103 lines
3.5 KiB
Docker
103 lines
3.5 KiB
Docker
FROM python:3.10-bookworm
|
|
|
|
RUN curl -sS https://packages.microsoft.com/keys/microsoft.asc | apt-key add -
|
|
RUN curl -sS https://packages.microsoft.com/config/debian/11/prod.list > /etc/apt/sources.list.d/mssql-release.list
|
|
|
|
# Install Dependencies (listed in alphabetical order)
|
|
RUN apt-get -qq update \
|
|
&& apt-get -qq install -y \
|
|
alien \
|
|
build-essential \
|
|
default-libmysqlclient-dev \
|
|
freetds-bin \
|
|
freetds-dev \
|
|
gcc \
|
|
gnupg \
|
|
libaio1 \
|
|
libevent-dev \
|
|
libffi-dev \
|
|
libpq-dev \
|
|
librdkafka-dev \
|
|
libsasl2-dev \
|
|
libsasl2-2 \
|
|
libsasl2-modules \
|
|
libsasl2-modules-gssapi-mit \
|
|
libssl-dev \
|
|
libxml2 \
|
|
libkrb5-dev \
|
|
default-jdk \
|
|
openssl \
|
|
# To ensure compatibility with unixodbc package
|
|
odbcinst=2.3.11-2+deb12u1 \
|
|
postgresql \
|
|
postgresql-contrib \
|
|
tdsodbc \
|
|
unixodbc=2.3.11-2+deb12u1 \
|
|
unixodbc-dev=2.3.11-2+deb12u1 \
|
|
unzip \
|
|
vim \
|
|
git \
|
|
wget --no-install-recommends \
|
|
# Accept MSSQL ODBC License
|
|
&& ACCEPT_EULA=Y apt-get -qq install -y msodbcsql18 \
|
|
&& rm -rf /var/lib/apt/lists/*
|
|
|
|
# Add updated postgres/redshift dependencies based on libq
|
|
ENV DEBIAN_FRONTEND=noninteractive
|
|
RUN curl -sS https://www.postgresql.org/media/keys/ACCC4CF8.asc | apt-key add -
|
|
RUN echo "deb https://apt.postgresql.org/pub/repos/apt/ bookworm-pgdg main" > /etc/apt/sources.list.d/pgdg.list; \
|
|
apt-get -qq update; \
|
|
apt-get -qq install --no-install-recommends -y libpq-dev postgresql-client postgresql-common postgresql postgresql-contrib; \
|
|
apt-get -qq autoremove -yqq --purge; \
|
|
apt-get -qq clean && rm -rf /var/lib/apt/lists/*
|
|
|
|
RUN if [ $(uname -m) = "arm64" ] | [ $(uname -m) = "aarch64" ]; \
|
|
then \
|
|
wget -q https://download.oracle.com/otn_software/linux/instantclient/191000/instantclient-basic-linux.arm64-19.10.0.0.0dbru.zip -O /oracle-instantclient.zip && \
|
|
unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \
|
|
else \
|
|
wget -q https://download.oracle.com/otn_software/linux/instantclient/1917000/instantclient-basic-linux.x64-19.17.0.0.0dbru.zip -O /oracle-instantclient.zip && \
|
|
unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \
|
|
fi
|
|
|
|
ENV LD_LIBRARY_PATH=/instantclient
|
|
|
|
# Install DB2 iAccess Driver
|
|
RUN if [ $(uname -m) = "x86_64" ]; \
|
|
then \
|
|
curl https://public.dhe.ibm.com/software/ibmi/products/odbc/debs/dists/1.1.0/ibmi-acs-1.1.0.list | tee /etc/apt/sources.list.d/ibmi-acs-1.1.0.list \
|
|
&& apt update \
|
|
&& apt install ibm-iaccess; \
|
|
fi
|
|
|
|
WORKDIR ingestion/
|
|
|
|
# For the dev build, we copy all files
|
|
COPY ingestion/ .
|
|
|
|
# Disable pip cache dir
|
|
# https://pip.pypa.io/en/stable/topics/caching/#avoiding-caching
|
|
ENV PIP_NO_CACHE_DIR=1
|
|
# Make pip silent
|
|
ENV PIP_QUIET=1
|
|
|
|
RUN pip install --upgrade pip setuptools~=70.3.0
|
|
|
|
ARG INGESTION_DEPENDENCY="all"
|
|
RUN pip install ".[airflow]"
|
|
RUN pip install ".[${INGESTION_DEPENDENCY}]"
|
|
|
|
# Temporary workaround for https://github.com/open-metadata/OpenMetadata/issues/9593
|
|
RUN [ $(uname -m) = "x86_64" ] \
|
|
&& pip install ".[db2]" \
|
|
|| echo "DB2 not supported on ARM architectures."
|
|
|
|
# Required for Airflow DockerOperator, as we need to run the workflows from a `python main.py` command in the container.
|
|
COPY ingestion/operators/docker/*.py .
|
|
|
|
# Uninstalling psycopg2-binary and installing psycopg2 instead
|
|
# because the psycopg2-binary generates a architecture specific error
|
|
# while authenticating connection with the airflow, psycopg2 solves this error
|
|
RUN pip uninstall psycopg2-binary -y
|
|
RUN pip install psycopg2 mysqlclient==2.1.1
|