mirror of
https://github.com/deepset-ai/haystack.git
synced 2025-07-29 03:39:58 +00:00

* Refactoring the `RayPipeline.run` method - merging it with `Pipeline.run`. This is to fix #2968 * Bug: variable `i` was already in use * Removing unused imports * Removing unused import * [EMPTY] Re-trigger CI * Addressing concerns raised pre-review - Removing the attempt to make it work without the need for `JoinDocuments` - it is okay to fail without `JoinDocuments` for certain pipelines. * Refactoring based on reviews
53 lines
1.2 KiB
YAML
53 lines
1.2 KiB
YAML
# Top-level settings for this pipeline configuration.
# NOTE(review): `ignore` presumably disables the config/library version
# compatibility check - confirm against the Haystack documentation.
version: ignore
# NOTE(review): presumably selects the Ray-backed pipeline implementation -
# confirm against the loader that consumes this file.
extras: ray

# Node definitions. Each entry declares a `name`, a `type`, and the `params`
# for that type. The pipeline section of this file refers to entries by `name`.
components:
  - name: DocumentStore
    type: ElasticsearchDocumentStore
    params:
      index: haystack_test
      label_index: haystack_test_label
  - name: ESRetriever
    type: BM25Retriever
    params:
      # Refers to the `DocumentStore` component declared above.
      document_store: DocumentStore
  - name: Reader
    type: FARMReader
    params:
      no_ans_boost: -10
      model_name_or_path: deepset/roberta-base-squad2
      num_processes: 0
  # The remaining components are declared but are not used as nodes by
  # `ray_query_pipeline` in this file.
  - name: PDFConverter
    type: PDFToTextConverter
    params:
      remove_numeric_tables: false
  - name: Preprocessor
    type: PreProcessor
    params:
      clean_whitespace: true
  - name: IndexTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      batch_size: 16
      use_gpu: false
  - name: QueryTimeDocumentClassifier
    type: TransformersDocumentClassifier
    params:
      use_gpu: false


# Pipeline graph: Query -> ESRetriever -> Reader.
pipelines:
  - name: ray_query_pipeline
    nodes:
      - name: ESRetriever
        inputs: [Query]
        # NOTE(review): presumably forwarded to the Ray Serve deployment that
        # hosts this node - confirm. The nesting below was reconstructed from
        # a flattened copy; verify that `max_concurrent_queries` belongs at
        # this level rather than under `ray_actor_options`.
        serve_deployment_kwargs:
          num_replicas: 2
          version: Twenty
          ray_actor_options:
            # num_gpus: 0.25  # we have no GPU to test this
            num_cpus: 0.5
          max_concurrent_queries: 17
      - name: Reader
        inputs: [ESRetriever]