| 
									
										
										
										
											2023-11-13 10:38:06 +01:00
										 |  |  | FROM python:3.10-bullseye
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | RUN curl -sS https://packages.microsoft.com/keys/microsoft.asc | apt-key add -
 | 
					
						
							|  |  |  | RUN curl -sS https://packages.microsoft.com/config/debian/11/prod.list > /etc/apt/sources.list.d/mssql-release.list
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | # Install Dependencies (listed in alphabetical order)
 | 
					
						
							| 
									
										
										
										
											2024-06-05 21:18:37 +02:00
										 |  |  | RUN dpkg --configure -a \
 | 
					
						
							|  |  |  |     && apt-get -qq update \
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |     && apt-get -qq install -y \
 | 
					
						
							|  |  |  |     alien \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     build-essential \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     default-libmysqlclient-dev \
 | 
					
						
							|  |  |  |     freetds-bin \
 | 
					
						
							|  |  |  |     freetds-dev \
 | 
					
						
							|  |  |  |     gcc \
 | 
					
						
							|  |  |  |     gnupg \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     libaio1 \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libevent-dev \
 | 
					
						
							|  |  |  |     libffi-dev \
 | 
					
						
							|  |  |  |     libpq-dev \
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     librdkafka-dev \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libsasl2-dev \
 | 
					
						
							| 
									
										
										
										
											2023-05-16 14:32:48 +02:00
										 |  |  |     libsasl2-2 \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libsasl2-modules \
 | 
					
						
							| 
									
										
										
										
											2023-05-16 14:32:48 +02:00
										 |  |  |     libsasl2-modules-gssapi-mit \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libssl-dev \
 | 
					
						
							|  |  |  |     libxml2 \
 | 
					
						
							| 
									
										
										
										
											2023-04-20 10:56:46 +02:00
										 |  |  |     libkrb5-dev \
 | 
					
						
							| 
									
										
										
										
											2024-06-05 21:18:37 +02:00
										 |  |  |     default-jdk \
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     openssl \
 | 
					
						
							|  |  |  |     postgresql \
 | 
					
						
							|  |  |  |     postgresql-contrib \
 | 
					
						
							|  |  |  |     tdsodbc \
 | 
					
						
							|  |  |  |     unixodbc \
 | 
					
						
							|  |  |  |     unixodbc-dev \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     unzip \
 | 
					
						
							| 
									
										
										
										
											2023-10-06 11:51:07 +07:00
										 |  |  |     git \
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     wget --no-install-recommends \
 | 
					
						
							|  |  |  |     # Accept MSSQL ODBC License
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |     && ACCEPT_EULA=Y apt-get -qq install -y msodbcsql18 \
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     && rm -rf /var/lib/apt/lists/*
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | # Add updated postgres/redshift dependencies based on libq
 | 
					
						
							|  |  |  | RUN curl https://www.postgresql.org/media/keys/ACCC4CF8.asc | apt-key add -
 | 
					
						
							| 
									
										
										
										
											2024-10-04 11:31:01 +05:30
										 |  |  | RUN echo "deb https://apt.postgresql.org/pub/repos/apt/ bullseye-pgdg main" > /etc/apt/sources.list.d/pgdg.list; \
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |     apt-get -qq update; \
 | 
					
						
							|  |  |  |     apt-get -qq install --no-install-recommends -y libpq-dev postgresql-client postgresql-common postgresql postgresql-contrib; \
 | 
					
						
							|  |  |  |     apt-get -qq autoremove -yqq --purge; \
 | 
					
						
							|  |  |  |     apt-get -qq clean && rm -rf /var/lib/apt/lists/*
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-03 23:22:48 +02:00
										 |  |  | RUN if [ $(uname -m) = "arm64" || $(uname -m) = "aarch64" ]; \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |  then \
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |  wget -q https://download.oracle.com/otn_software/linux/instantclient/191000/instantclient-basic-linux.arm64-19.10.0.0.0dbru.zip -O /oracle-instantclient.zip && \
 | 
					
						
							|  |  |  |  unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |  else \
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |  wget -q https://download.oracle.com/otn_software/linux/instantclient/1917000/instantclient-basic-linux.x64-19.17.0.0.0dbru.zip -O /oracle-instantclient.zip && \
 | 
					
						
							|  |  |  |  unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \
 | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |  fi
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ENV LD_LIBRARY_PATH=/instantclient
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-08-20 09:24:38 +02:00
										 |  |  | # Install DB2 iAccess driver
 | 
					
						
							| 
									
										
										
										
											2024-10-03 23:22:48 +02:00
										 |  |  | RUN if [ $(uname -m) = "x86_64" ]; \
 | 
					
						
							| 
									
										
										
										
											2024-08-13 13:16:19 +02:00
										 |  |  |   then \
 | 
					
						
							|  |  |  |   curl https://public.dhe.ibm.com/software/ibmi/products/odbc/debs/dists/1.1.0/ibmi-acs-1.1.0.list | tee /etc/apt/sources.list.d/ibmi-acs-1.1.0.list \
 | 
					
						
							|  |  |  |   && apt update \
 | 
					
						
							|  |  |  |   && apt install ibm-iaccess; \
 | 
					
						
							|  |  |  |   fi
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | WORKDIR ingestion/
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | # Required for Airflow DockerOperator, as we need to run the workflows from a `python main.py` command in the container.
 | 
					
						
							| 
									
										
										
										
											2023-02-26 00:52:14 +01:00
										 |  |  | COPY ingestion/operators/docker/*.py .
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | # Disable pip cache dir
 | 
					
						
							|  |  |  | # https://pip.pypa.io/en/stable/topics/caching/#avoiding-caching
 | 
					
						
							|  |  |  | ENV PIP_NO_CACHE_DIR=1 | 
					
						
							|  |  |  | # Make pip silent
 | 
					
						
							|  |  |  | ENV PIP_QUIET=1 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | RUN pip install --upgrade pip
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ARG INGESTION_DEPENDENCY="all"
 | 
					
						
							| 
									
										
										
										
											2024-10-03 15:01:32 +00:00
										 |  |  | ARG RI_VERSION="1.5.7.0"
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | RUN pip install --upgrade pip
 | 
					
						
							| 
									
										
										
										
											2023-09-13 11:40:28 +02:00
										 |  |  | RUN pip install "openmetadata-ingestion[airflow]~=${RI_VERSION}"
 | 
					
						
							|  |  |  | RUN pip install "openmetadata-ingestion[${INGESTION_DEPENDENCY}]~=${RI_VERSION}"
 | 
					
						
							| 
									
										
										
										
											2023-05-30 07:06:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-08-20 09:24:38 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-05-30 07:06:48 +02:00
										 |  |  | # Temporary workaround for https://github.com/open-metadata/OpenMetadata/issues/9593
 | 
					
						
							| 
									
										
										
										
											2024-10-03 23:22:48 +02:00
										 |  |  | RUN [ $(uname -m) = "x86_64" ] \
 | 
					
						
							|  |  |  |   && pip install "openmetadata-ingestion[db2]~=${RI_VERSION}" \
 | 
					
						
							|  |  |  |   || echo "DB2 not supported on ARM architectures."
 | 
					
						
							| 
									
										
										
										
											2023-05-30 07:06:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | # Uninstalling psycopg2-binary and installing psycopg2 instead
 | 
					
						
							|  |  |  | # because the psycopg2-binary generates a architecture specific error
 | 
					
						
							| 
									
										
										
										
											2023-12-19 11:09:38 +01:00
										 |  |  | # while authenticating connection with the airflow, psycopg2 solves this error
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | RUN pip uninstall psycopg2-binary -y
 | 
					
						
							| 
									
										
										
										
											2023-06-22 15:18:39 +05:30
										 |  |  | RUN pip install psycopg2 mysqlclient==2.1.1
 |