# Loaders: the Python sources to read API documentation from.
# NOTE(review): nesting was reconstructed from key order because the original
# indentation was lost; confirm against the consuming tool's schema.
loaders:
  - type: python
    # Relative path; presumably resolved against this file's directory (TODO confirm).
    search_path: [../../../../haystack/nodes/file_converter]
    modules: ['base', 'docx', 'image', 'markdown', 'pdf', 'parsr', 'azure', 'tika', 'txt']
    ignore_when_discovered: ['__init__']
# Processor entries: filter, smart, crossref.
# NOTE(review): nesting was reconstructed from key order because the original
# indentation was lost; confirm against the consuming tool's schema.
processors:
  - type: filter
    # Explicit null instead of a bare `expression:`; the parsed value is the same.
    expression: null
    documented_only: true
    do_not_filter_modules: false
    skip_empty_modules: true
  - type: smart
  - type: crossref
# Renderer: output settings for the generated API page.
# NOTE(review): nesting was reconstructed from key order because the original
# indentation was lost; confirm that the last five keys belong under `markdown`.
renderer:
  type: renderers.ReadmeRenderer
  excerpt: Extracts text from files in different formats and casts it into the unified Document format.
  # Quoted so the hex-like identifier is always read as a string.
  category: '6310ca73c622850ddd3875a2'
  title: File Converters API
  slug: file-converters-api
  order: 70
  markdown:
    descriptive_class_title: false
    descriptive_module_title: true
    add_method_class_prefix: true
    add_member_class_prefix: false
    filename: file_converters_api.md