# Pipeline configuration: declares reusable components and the pipelines
# that wire them together by name.
# NOTE(review): indentation was reconstructed from key order — confirm
# against the upstream file before relying on it.
version: ignore

# Each component has a unique `name`, a `type`, and optional `params`.
components:
  - name: Reader
    type: FARMReader
    params:
      no_ans_boost: -10
      model_name_or_path: deepset/roberta-base-squad2
      num_processes: 0
  - name: ESRetriever
    type: BM25Retriever
    params:
      # Refers to the component named `DocumentStore` declared below.
      document_store: DocumentStore
  - name: DocumentStore
    type: ElasticsearchDocumentStore
    params:
      index: haystack_test
      label_index: haystack_test_label
  - name: PDFConverter
    type: PDFToTextConverter
    params:
      remove_numeric_tables: false
  - name: TextConverter
    type: TextConverter
  - name: Preprocessor
    type: PreProcessor
    params:
      clean_whitespace: true
  - name: IndexTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      batch_size: 16
      use_gpu: false
  - name: QueryTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      use_gpu: false

# Each pipeline lists its nodes in order; a node's `inputs` names the
# node(s) feeding it (`Query` / `File` are the entry points used here).
pipelines:
  - name: query_pipeline
    nodes:
      - name: ESRetriever
        inputs: [Query]
      - name: Reader
        inputs: [ESRetriever]

  - name: query_pipeline_with_document_classifier
    nodes:
      - name: ESRetriever
        inputs: [Query]
      - name: QueryTimeDocumentClassifier
        inputs: [ESRetriever]
      - name: Reader
        inputs: [QueryTimeDocumentClassifier]

  - name: indexing_pipeline
    nodes:
      - name: PDFConverter
        inputs: [File]
      - name: Preprocessor
        inputs: [PDFConverter]
      - name: ESRetriever
        inputs: [Preprocessor]
      - name: DocumentStore
        inputs: [ESRetriever]

  - name: indexing_text_pipeline
    nodes:
      - name: TextConverter
        inputs: [File]
      - name: Preprocessor
        inputs: [TextConverter]
      - name: ESRetriever
        inputs: [Preprocessor]
      - name: DocumentStore
        inputs: [ESRetriever]

  - name: indexing_pipeline_with_classifier
    nodes:
      - name: PDFConverter
        inputs: [File]
      - name: Preprocessor
        inputs: [PDFConverter]
      - name: IndexTimeDocumentClassifier
        inputs: [Preprocessor]
      - name: ESRetriever
        inputs: [IndexTimeDocumentClassifier]
      - name: DocumentStore
        inputs: [ESRetriever]