| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | FROM python:3.9-bullseye | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | RUN curl -sS https://packages.microsoft.com/keys/microsoft.asc | apt-key add - | 
					
						
							|  |  |  | RUN curl -sS https://packages.microsoft.com/config/debian/11/prod.list > /etc/apt/sources.list.d/mssql-release.list | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | # Install Dependencies (listed in alphabetical order) | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | RUN apt-get -qq update \ | 
					
						
							|  |  |  |     && apt-get -qq install -y \ | 
					
						
							|  |  |  |     alien \ | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     build-essential \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     default-libmysqlclient-dev \ | 
					
						
							|  |  |  |     freetds-bin \ | 
					
						
							|  |  |  |     freetds-dev \ | 
					
						
							|  |  |  |     gcc \ | 
					
						
							|  |  |  |     gnupg \ | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     libaio1 \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libevent-dev \ | 
					
						
							|  |  |  |     libffi-dev \ | 
					
						
							|  |  |  |     libpq-dev \ | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     librdkafka-dev \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libsasl2-dev \ | 
					
						
							| 
									
										
										
										
											2023-05-16 14:32:48 +02:00
										 |  |  |     libsasl2-2 \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libsasl2-modules \ | 
					
						
							| 
									
										
										
										
											2023-05-16 14:32:48 +02:00
										 |  |  |     libsasl2-modules-gssapi-mit \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     libssl-dev \ | 
					
						
							|  |  |  |     libxml2 \ | 
					
						
							| 
									
										
										
										
											2023-04-20 10:56:46 +02:00
										 |  |  |     libkrb5-dev \ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  |     openjdk-11-jre \ | 
					
						
							|  |  |  |     openssl \ | 
					
						
							|  |  |  |     postgresql \ | 
					
						
							|  |  |  |     postgresql-contrib \ | 
					
						
							|  |  |  |     tdsodbc \ | 
					
						
							|  |  |  |     unixodbc \ | 
					
						
							|  |  |  |     unixodbc-dev \ | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |     unzip \ | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     vim \ | 
					
						
							|  |  |  |     wget --no-install-recommends \ | 
					
						
							|  |  |  |     # Accept MSSQL ODBC License | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |     && ACCEPT_EULA=Y apt-get -qq install -y msodbcsql18 \ | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     && rm -rf /var/lib/apt/lists/* | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | # Add updated postgres/redshift dependencies based on libq | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | RUN curl -sS https://www.postgresql.org/media/keys/ACCC4CF8.asc | apt-key add - | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | RUN echo "deb https://apt.postgresql.org/pub/repos/apt/ buster-pgdg main" > /etc/apt/sources.list.d/pgdg.list; \ | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |     apt-get -qq update; \ | 
					
						
							|  |  |  |     apt-get -qq install --no-install-recommends -y libpq-dev postgresql-client postgresql-common postgresql postgresql-contrib; \ | 
					
						
							|  |  |  |     apt-get -qq autoremove -yqq --purge; \ | 
					
						
							|  |  |  |     apt-get -qq clean && rm -rf /var/lib/apt/lists/* | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | RUN if [[ $(uname -m) == "arm64" || $(uname -m) == "aarch64" ]]; \ | 
					
						
							|  |  |  |  then \ | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |  wget -q https://download.oracle.com/otn_software/linux/instantclient/191000/instantclient-basic-linux.arm64-19.10.0.0.0dbru.zip -O /oracle-instantclient.zip && \ | 
					
						
							|  |  |  |  unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \ | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |  else \ | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  |  wget -q https://download.oracle.com/otn_software/linux/instantclient/1917000/instantclient-basic-linux.x64-19.17.0.0.0dbru.zip -O /oracle-instantclient.zip && \ | 
					
						
							|  |  |  |  unzip -qq -d /instantclient -j /oracle-instantclient.zip && rm -f /oracle-instantclient.zip; \ | 
					
						
							| 
									
										
										
										
											2023-01-19 08:08:56 +01:00
										 |  |  |  fi | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ENV LD_LIBRARY_PATH=/instantclient | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | # Security patches for base image | 
					
						
							|  |  |  | # monitor no fixed version for | 
					
						
							|  |  |  | #    https://security.snyk.io/vuln/SNYK-DEBIAN11-LIBTASN16-3061097 | 
					
						
							|  |  |  | #    https://security.snyk.io/vuln/SNYK-DEBIAN11-MARIADB105-2940589 | 
					
						
							|  |  |  | #    https://security.snyk.io/vuln/SNYK-DEBIAN11-BIND9-3027852 | 
					
						
							|  |  |  | #    https://security.snyk.io/vuln/SNYK-DEBIAN11-EXPAT-3023031 we are already installed the latest | 
					
						
							|  |  |  | RUN echo "deb http://deb.debian.org/debian bullseye-backports main" > /etc/apt/sources.list.d/backports.list | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | RUN apt-get -qq update \ | 
					
						
							|  |  |  |     && apt-get -qq install -t bullseye-backports -y \ | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     curl \ | 
					
						
							|  |  |  |     libpcre2-8-0 \ | 
					
						
							|  |  |  |     postgresql-common \ | 
					
						
							|  |  |  |     expat \ | 
					
						
							|  |  |  |     bind9 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | WORKDIR ingestion/ | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | # For the dev build, we copy all files | 
					
						
							|  |  |  | COPY ingestion/ . | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-02 14:36:27 +02:00
										 |  |  | # Disable pip cache dir | 
					
						
							|  |  |  | # https://pip.pypa.io/en/stable/topics/caching/#avoiding-caching | 
					
						
							|  |  |  | ENV PIP_NO_CACHE_DIR=1 | 
					
						
							|  |  |  | # Make pip silent | 
					
						
							|  |  |  | ENV PIP_QUIET=1 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | RUN pip install --upgrade pip setuptools | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | ARG INGESTION_DEPENDENCY="all" | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | RUN pip install ".[airflow]" | 
					
						
							|  |  |  | RUN pip install ".[${INGESTION_DEPENDENCY}]" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | # Required for Airflow DockerOperator, as we need to run the workflows from a `python main.py` command in the container. | 
					
						
							|  |  |  | COPY ingestion/operators/docker/*.py . | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-05-30 07:06:48 +02:00
										 |  |  | # Temporary workaround for https://github.com/open-metadata/OpenMetadata/issues/9593 | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  | RUN echo "Image built for $(uname -m)" | 
					
						
							| 
									
										
										
										
											2023-06-26 19:04:55 +05:30
										 |  |  | RUN if [[ $(uname -m) == "arm64" ]]; \ | 
					
						
							| 
									
										
										
										
											2023-06-19 12:09:09 +02:00
										 |  |  |     then \ | 
					
						
							|  |  |  |     pip install "ibm-db-sa~=0.4"; \ | 
					
						
							|  |  |  |     fi | 
					
						
							| 
									
										
										
										
											2023-05-30 07:06:48 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-10-11 07:50:49 +02:00
										 |  |  | # Uninstalling psycopg2-binary and installing psycopg2 instead | 
					
						
							|  |  |  | # because the psycopg2-binary generates a architecture specific error | 
					
						
							|  |  |  | # while authrenticating connection with the airflow, psycopg2 solves this error | 
					
						
							|  |  |  | RUN pip uninstall psycopg2-binary -y | 
					
						
							| 
									
										
										
										
											2023-06-22 15:18:39 +05:30
										 |  |  | RUN pip install psycopg2 mysqlclient==2.1.1 |