haystack/docs/pydoc/config_docusaurus/extractors_api.yml
Sebastian Husch Lee b9b1652fd4
feat: Add LLMDocumentContentExtractor (#9637)
* Add LLMDocumentContentExtractor

* Remove file

* Remove from slow
2025-07-23 11:16:37 +02:00

28 lines
946 B
YAML

# pydoc-markdown configuration that builds the "Extractors" API reference page.
# Three stages: `loaders` reads the Python modules, `processors` filters and
# post-processes what was loaded, `renderer` writes the Markdown output.

loaders:
  - type: haystack_pydoc_tools.loaders.CustomPythonLoader
    # Path is relative; presumably resolved from this config's directory —
    # TODO confirm against how the docs build invokes pydoc-markdown.
    search_path: [../../../haystack/components/extractors]
    # Modules to document, given relative to `search_path`.
    modules:
      - "named_entity_extractor"
      - "llm_metadata_extractor"
      - "image/llm_document_content_extractor"
    ignore_when_discovered: ["__init__"]

processors:
  # First filter: flag-based filtering only, no custom expression.
  - type: filter
    # Explicit null instead of a bare `expression:` key (same parsed value).
    expression: null
    documented_only: true
    do_not_filter_modules: false
    skip_empty_modules: true
  # Second filter: drop the private NER backend helper classes by name.
  - type: filter
    expression: "name not in ['_BackendEnumMeta', '_NerBackend', '_HfBackend', '_SpacyBackend']"
  - type: smart
  - type: crossref

renderer:
  type: haystack_pydoc_tools.renderers.DocusaurusRenderer
  # NOTE(review): this description only mentions entity extraction, while
  # `modules` above also lists the LLM metadata and document content
  # extractors — confirm whether the page description should be broadened.
  description: Extracts predefined entities out of a piece of text.
  title: Extractors
  id: extractors-api
  markdown:
    descriptive_class_title: false
    classdef_code_block: false
    descriptive_module_title: true
    add_method_class_prefix: true
    add_member_class_prefix: false
    # NOTE(review): `filename` is nested under `markdown` based on its position
    # after the other markdown options — confirm against the renderer's schema.
    filename: extractors_api.md