mirror of
https://github.com/Azure-Samples/graphrag-accelerator.git
synced 2025-07-03 23:26:56 +00:00
31 lines
1.2 KiB
Plaintext
31 lines
1.2 KiB
Plaintext
# Copyright (c) Microsoft Corporation.
|
|
# Licensed under the MIT License.
|
|
|
|
FROM python:3.10
|
|
|
|
# default graphrag version will be 0.0.0 unless overridden by --build-arg
|
|
ARG GRAPHRAG_VERSION=0.0.0
|
|
ENV GRAPHRAG_VERSION=v${GRAPHRAG_VERSION}
|
|
ENV PIP_ROOT_USER_ACTION=ignore
|
|
ENV PIP_DISABLE_PIP_VERSION_CHECK=1
|
|
ENV SETUPTOOLS_USE_DISTUTILS=stdlib
|
|
ENV PYTHONPATH=/backend
|
|
|
|
COPY poetry.lock pyproject.toml /
|
|
COPY backend /backend
|
|
RUN pip install poetry \
|
|
&& poetry config virtualenvs.create false \
|
|
&& poetry install --without frontend
|
|
|
|
# download all nltk data that graphrag requires
|
|
RUN python -m nltk.downloader punkt averaged_perceptron_tagger maxent_ne_chunker words wordnet
|
|
|
|
# Note: we temporarily patch the adlfs library to enable use of managed identity. A PR has been submitted to the adlfs library.
|
|
# See https://github.com/fsspec/adlfs/pull/480
|
|
# TODO: remove this once PR has been merged and a new version released
|
|
RUN sed -i '/self.credential = credential/a\ \ \ \ \ \ \ \ if kwargs.get("account_host"): self.account_host = kwargs.get("account_host")' /usr/local/lib/python3.10/site-packages/adlfs/spec.py
|
|
|
|
WORKDIR /backend
|
|
EXPOSE 80
|
|
CMD ["uvicorn", "src.main:app", "--host", "0.0.0.0", "--port", "80"]
|