# Declarative package metadata (setuptools-style configuration).
# Multi-line values must be indented so the parser treats them as
# continuations of the key above.
[metadata]
name = farm-haystack
# Version string is read from the VERSION.txt file.
version = file: VERSION.txt
url = https://github.com/deepset-ai/haystack
project_urls =
    Docs: RTD = https://haystack.deepset.ai/overview/intro
    CI: GitHub = https://github.com/deepset-ai/haystack/actions
    GitHub: issues = https://github.com/deepset-ai/haystack/issues
    GitHub: repo = https://github.com/deepset-ai/haystack
description = Neural Question Answering & Semantic Search at Scale. Use modern transformer based models like BERT to find answers in large document collections
# Long description is taken verbatim from README.md (Markdown).
long_description = file: README.md
long_description_content_type = text/markdown
keywords =
    QA
    Question-Answering
    Reader
    Retriever
    semantic-search
    search
    BERT
    roberta
    albert
    squad
    mrc
    transfer-learning
    language-model
    transformer
author = deepset.ai
author_email = malte.pietsch@deepset.ai
license = Apache License 2.0
license_file = LICENSE
platforms = any
classifiers =
    Development Status :: 5 - Production/Stable
    Intended Audience :: Science/Research
    License :: Freely Distributable
    License :: OSI Approved :: Apache Software License
    Topic :: Scientific/Engineering :: Artificial Intelligence
    Operating System :: OS Independent
    Programming Language :: Python
    Programming Language :: Python :: 3
    Programming Language :: Python :: 3.7
    Programming Language :: Python :: 3.8
    Programming Language :: Python :: 3.9
    Programming Language :: Python :: 3.10

# Build options and runtime dependencies.
# Requirement lines use PEP 508 syntax: version operators (==, >=, <=)
# must be written without internal spaces.
[options]
# NOTE(review): [metadata] also sets "version = file: VERSION.txt";
# confirm which of the two version sources is intended to win.
use_scm_version = True
python_requires = >=3.7, <4
packages = find:
setup_requires =
    setuptools
    wheel
install_requires =
    importlib-metadata; python_version < '3.8'
    torch>1.9,<1.11
    requests
    pydantic
    transformers==4.13.0
    nltk
    pandas
    # Utils
    dill  # pickle extension for (de-)serialization
    tqdm  # progress bars in model download and training scripts
    networkx  # graphs library
    mmh3  # fast hashing function (murmurhash3)
    quantulum3  # quantities extraction from text
    azure-ai-formrecognizer==3.2.0b2  # forms reader
    # Preprocessing
    more_itertools  # for windowing
    python-docx
    langdetect  # for PDF conversions
    tika  # Apache Tika (text & metadata extractor)
    # See haystack/nodes/retriever/_embedding_encoder.py, _SentenceTransformersEmbeddingEncoder
    sentence-transformers>=0.4.0
    # for stats in run_classifier
    scipy>=1.3.2
    scikit-learn>=1.0.0
    # Metrics and logging
    seqeval
    mlflow<=1.13.1
    # Elasticsearch
    elasticsearch>=7.7,<=7.10
    elastic-apm
    # Not found in repo, to review:
    #uvloop==0.14; sys_platform != 'win32' and sys_platform != 'cygwin'

# Package discovery: glob patterns listed under "exclude" are left out of
# the packages collected by "packages = find:".
[options.packages.find]
exclude =
    rest_api*
    test*
    tutorials*
    ui*

# Optional dependency groups ("extras").
# Groups prefixed with "only-" list just the third-party package; the
# unprefixed group of the same name re-exports it together with "sql" via a
# self-reference to farm-haystack[...].
[options.extras_require]
sql =
    sqlalchemy>=1.4.2,<2
    sqlalchemy_utils
    psycopg2-binary; sys_platform != 'win32' and sys_platform != 'cygwin'
only-faiss =
    faiss-cpu>=1.6.3,<2
faiss =
    farm-haystack[sql,only-faiss]
only-faiss-gpu =
    faiss-gpu>=1.6.3,<2
faiss-gpu =
    farm-haystack[sql,only-faiss-gpu]
only-milvus1 =
    pymilvus<2.0.0  # Refer milvus version support matrix at https://github.com/milvus-io/pymilvus#install-pymilvus
milvus1 =
    farm-haystack[sql,only-milvus1]
only-milvus =
    pymilvus>=2.0.0,<3  # Refer milvus version support matrix at https://github.com/milvus-io/pymilvus#install-pymilvus
milvus =
    farm-haystack[sql,only-milvus]
weaviate =
    weaviate-client==2.5.0
graphdb =
    SPARQLWrapper
# Aggregate groups. Both pull in "milvus1" (pymilvus<2.0.0), not "milvus".
docstores =
    farm-haystack[faiss,milvus1,weaviate,graphdb]
docstores-gpu =
    farm-haystack[faiss-gpu,milvus1,weaviate,graphdb]
crawler =
    selenium
    webdriver-manager
preprocessing =
    beautifulsoup4
    markdown
ocr =
    pytesseract==0.3.7
    pillow
    pdf2image==1.14.0
onnx =
    onnxruntime
    onnxruntime_tools
onnx-gpu =
    onnxruntime-gpu
    onnxruntime_tools
ray =
    ray>=1.9.1,<2
    aiorwlock>=1.3.0,<2
colab =
    grpcio==1.43.0
dev =
    # Type check
    mypy
    typing_extensions; python_version < '3.8'
    # Test
    pytest
    responses
    tox
    coverage
    python-multipart
    psutil
    # Linting
    pylint
    # Code formatting
    black[jupyter]
    # Documentation
    pydoc-markdown>=4,<5
    mkdocs
    jupytercontrib
    watchdog  #==1.0.2
# Umbrella groups: "test" omits the ONNX runtime, "all" adds the CPU build
# of it, "all-gpu" swaps in the GPU variants of docstores and ONNX.
test =
    farm-haystack[docstores,crawler,preprocessing,ocr,ray,dev]
all =
    farm-haystack[docstores,crawler,preprocessing,ocr,ray,dev,onnx]
all-gpu =
    farm-haystack[docstores-gpu,crawler,preprocessing,ocr,ray,dev,onnx-gpu]

# pytest settings: directories to collect from, the test-file name pattern,
# and extra command-line options.
[tool:pytest]
testpaths =
    test
    rest_api/test
    ui/test
python_files =
    test_*.py
addopts =
    -vv

# Static type-checking configuration for mypy.
[mypy]
# Imports that mypy cannot resolve are not reported.
ignore_missing_imports = true
# Load the mypy plugin shipped with pydantic.
plugins = pydantic.mypy
# The "returning Any" warning is switched off.
warn_return_any = false
# The "unused config section" warning is switched on.
warn_unused_configs = true

# tox bootstrap settings.
[tox]
# Packages tox itself needs before creating environments.
requires =
    tox-venv
    setuptools>=30.0.0
# py36 was removed: [options] declares python_requires = >=3.7, so the
# package cannot be installed into a Python 3.6 environment.
envlist = py37

# Default tox test environment: runs pytest under coverage from the test/
# directory and writes all reports beneath test-reports/.
[testenv]
changedir = test
deps =
    coverage
    pytest
    pandas
setenv =
    COVERAGE_FILE = test-reports/.coverage
    PYTEST_ADDOPTS = --junitxml=test-reports/{envname}/junit.xml -vv
# Data files are written in parallel mode, so they are combined before the
# terminal, HTML and XML reports are produced.
commands =
    coverage run --source haystack --parallel-mode -m pytest {posargs}
    coverage combine
    coverage report -m
    coverage html -d test-reports/coverage-html
    coverage xml -o test-reports/coverage.xml