# API-docs generation config for the preprocessors components.
# The loader and renderer classes come from haystack_pydoc_tools (see the
# `type` keys below).

loaders:
  - type: haystack_pydoc_tools.loaders.CustomPythonLoader
    # NOTE(review): relative path; presumably resolved from this config's
    # directory -- confirm against how the docs tool is invoked.
    search_path: [../../../haystack/components/preprocessors]
    # One module per line so additions and removals diff cleanly.
    modules:
      - "csv_document_cleaner"
      - "csv_document_splitter"
      - "document_cleaner"
      - "document_preprocessor"
      - "document_splitter"
      - "hierarchical_document_splitter"
      - "recursive_splitter"
      - "text_cleaner"
    ignore_when_discovered: ["__init__"]

processors:
  - type: filter
    # No filter expression is set; explicit null loads the same as a bare key.
    expression: null
    documented_only: true
    do_not_filter_modules: false
    skip_empty_modules: true
  - type: smart
  - type: crossref

renderer:
  type: haystack_pydoc_tools.renderers.ReadmeCoreRenderer
  excerpt: Preprocess your Documents and texts. Clean, split, and more.
  category_slug: haystack-api
  title: PreProcessors
  slug: preprocessors-api
  order: 100
  markdown:
    descriptive_class_title: false
    classdef_code_block: false
    descriptive_module_title: true
    add_method_class_prefix: true
    add_member_class_prefix: false
    filename: preprocessors_api.md