# Top-level settings for this pipeline configuration.
# NOTE(review): `ignore` presumably tells the loader to skip its version
# compatibility check - confirm against the consuming loader.
version: ignore
# NOTE(review): presumably selects the Ray-backed pipeline implementation
# (the pipeline nodes in this file carry `serve_deployment_kwargs`) - confirm.
extras: ray

# Node definitions. Each entry gives the node a `name`, the `type` it is built
# from, and the `params` passed to it. Other entries (and the pipeline nodes)
# refer to a component by its `name`.
# NOTE(review): in the visible part of this file only ESRetriever1,
# ESRetriever2, JoinDocuments and Reader are wired into a pipeline; the
# converter, preprocessor and classifier entries are defined but unused here.
components:
  - name: DocumentStore
    type: ElasticsearchDocumentStore
    params:
      index: haystack_test
      label_index: haystack_test_label
  - name: ESRetriever1
    type: BM25Retriever
    params:
      document_store: DocumentStore
  - name: ESRetriever2
    # TfidfRetriever cannot be used here until
    # https://github.com/deepset-ai/haystack/pull/2984 is merged.
    # type: TfidfRetriever
    type: BM25Retriever
    params:
      document_store: DocumentStore
  - name: Reader
    type: FARMReader
    params:
      no_ans_boost: -10
      model_name_or_path: deepset/roberta-base-squad2
      num_processes: 0
  - name: PDFConverter
    type: PDFToTextConverter
    params:
      remove_numeric_tables: false
  - name: Preprocessor
    type: PreProcessor
    params:
      clean_whitespace: true
  - name: IndexTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      batch_size: 16
      use_gpu: false
  - name: QueryTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      use_gpu: false
  - name: JoinDocuments
    type: JoinDocuments
    # No constructor arguments; explicit empty mapping rather than a bare key.
    params: {}

# Pipeline graph: both retrievers receive the query, their results are merged
# by JoinDocuments, and the merged documents are handed to the Reader.
pipelines:
  - name: ray_query_pipeline
    nodes:
      - name: ESRetriever1
        inputs: [Query]
        # NOTE(review): nesting reconstructed from key semantics.
        # `max_concurrent_queries` is placed next to `num_replicas` because
        # Ray Serve takes it as a deployment option, while `ray_actor_options`
        # holds per-actor resources such as `num_cpus` - confirm.
        serve_deployment_kwargs:
          num_replicas: 2
          version: Twenty
          ray_actor_options:
            # num_gpus: 0.25  # we have no GPU to test this
            num_cpus: 0.25
          max_concurrent_queries: 17
      - name: ESRetriever2
        inputs: [Query]
        # Same deployment settings as ESRetriever1 except for the
        # concurrency limit (15 here, 17 there).
        serve_deployment_kwargs:
          num_replicas: 2
          version: Twenty
          ray_actor_options:
            # num_gpus: 0.25  # we have no GPU to test this
            num_cpus: 0.25
          max_concurrent_queries: 15
      - name: JoinDocuments
        inputs:
          - ESRetriever1
          - ESRetriever2
      - name: Reader
        inputs: [JoinDocuments]