"""
Example of directly using modal processors

This example demonstrates how to use LightRAG's modal processors directly
without going through MinerU.
"""
import argparse
import asyncio

from lightrag import LightRAG
from lightrag.kg.shared_storage import initialize_pipeline_status
from lightrag.llm.openai import openai_complete_if_cache, openai_embed

from raganything.modalprocessors import (
    ImageModalProcessor,
    TableModalProcessor,
    EquationModalProcessor,
)
# Directory where LightRAG persists its storage; may be overridden via --working-dir.
WORKING_DIR = "./rag_storage"
def get_llm_model_func(api_key: str, base_url: str = None):
    """Build a text-completion callable bound to the given OpenAI credentials.

    Args:
        api_key: OpenAI API key.
        base_url: Optional custom API endpoint (e.g. a proxy or Azure gateway).

    Returns:
        A callable with the signature LightRAG expects:
        ``(prompt, system_prompt=None, history_messages=None, **kwargs)``.
        Invoking it returns the (awaitable) result of
        ``openai_complete_if_cache`` against ``gpt-4o-mini``.
    """

    def llm_model_func(prompt, system_prompt=None, history_messages=None, **kwargs):
        # None sentinel instead of a mutable default argument; a fresh list is
        # created per call so callers can never share (or mutate) one default.
        return openai_complete_if_cache(
            "gpt-4o-mini",
            prompt,
            system_prompt=system_prompt,
            history_messages=history_messages if history_messages is not None else [],
            api_key=api_key,
            base_url=base_url,
            **kwargs,
        )

    return llm_model_func
def get_vision_model_func(api_key: str, base_url: str = None):
    """Build a vision-capable completion callable for modal caption generation.

    Args:
        api_key: OpenAI API key.
        base_url: Optional custom API endpoint.

    Returns:
        A callable with the signature
        ``(prompt, system_prompt=None, history_messages=None, image_data=None,
        **kwargs)``. When ``image_data`` (base64-encoded JPEG) is provided, a
        multimodal ``messages`` payload is sent to ``gpt-4o``; otherwise it
        falls back to a plain text completion on ``gpt-4o-mini``.
    """

    def vision_model_func(
        prompt, system_prompt=None, history_messages=None, image_data=None, **kwargs
    ):
        # None sentinel instead of a mutable default argument.
        history = history_messages if history_messages is not None else []

        if not image_data:
            # No image supplied: plain text completion path.
            return openai_complete_if_cache(
                "gpt-4o-mini",
                prompt,
                system_prompt=system_prompt,
                history_messages=history,
                api_key=api_key,
                base_url=base_url,
                **kwargs,
            )

        # Build the multimodal message list explicitly. The original code used
        # `{...} if system_prompt else None` inside the list literal, which left
        # a literal None element in `messages` whenever no system prompt was
        # given — an invalid payload. Only append the system message when set.
        messages = []
        if system_prompt:
            messages.append({"role": "system", "content": system_prompt})
        messages.append(
            {
                "role": "user",
                "content": [
                    {"type": "text", "text": prompt},
                    {
                        "type": "image_url",
                        "image_url": {"url": f"data:image/jpeg;base64,{image_data}"},
                    },
                ],
            }
        )

        # system_prompt/history are carried inside `messages` for the vision
        # path, so the top-level kwargs are intentionally empty here.
        return openai_complete_if_cache(
            "gpt-4o",
            "",
            system_prompt=None,
            history_messages=[],
            messages=messages,
            api_key=api_key,
            base_url=base_url,
            **kwargs,
        )

    return vision_model_func
async def process_image_example(lightrag: LightRAG, vision_model_func):
    """Example of processing an image"""
    # Build the processor; captions are generated through the vision model.
    processor = ImageModalProcessor(
        lightrag=lightrag, modal_caption_func=vision_model_func
    )

    # Minimal image payload: path plus optional caption/footnote lists.
    content = {
        "img_path": "image.jpg",
        "img_caption": ["Example image caption"],
        "img_footnote": ["Example image footnote"],
    }

    # Run the processor and collect its description + extracted entity info.
    description, entity_info = await processor.process_multimodal_content(
        modal_content=content,
        content_type="image",
        file_path="image_example.jpg",
        entity_name="Example Image",
    )

    print("Image Processing Results:")
    print(f"Description: {description}")
    print(f"Entity Info: {entity_info}")
async def process_table_example(lightrag: LightRAG, llm_model_func):
    """Example of processing a table"""
    # Build the processor; table summaries come from the plain LLM.
    processor = TableModalProcessor(
        lightrag=lightrag, modal_caption_func=llm_model_func
    )

    # Table payload: markdown body plus optional caption/footnote lists.
    content = {
        "table_body": """
    | Name | Age | Occupation |
    |------|-----|------------|
    | John | 25  | Engineer   |
    | Mary | 30  | Designer   |
    """,
        "table_caption": ["Employee Information Table"],
        "table_footnote": ["Data updated as of 2024"],
    }

    # Run the processor and collect its description + extracted entity info.
    description, entity_info = await processor.process_multimodal_content(
        modal_content=content,
        content_type="table",
        file_path="table_example.md",
        entity_name="Employee Table",
    )

    print("\nTable Processing Results:")
    print(f"Description: {description}")
    print(f"Entity Info: {entity_info}")
async def process_equation_example(lightrag: LightRAG, llm_model_func):
    """Example of processing a mathematical equation"""
    # Build the processor; equation explanations come from the plain LLM.
    processor = EquationModalProcessor(
        lightrag=lightrag, modal_caption_func=llm_model_func
    )

    # Equation payload: raw text plus its markup format.
    content = {"text": "E = mc^2", "text_format": "LaTeX"}

    # Run the processor and collect its description + extracted entity info.
    description, entity_info = await processor.process_multimodal_content(
        modal_content=content,
        content_type="equation",
        file_path="equation_example.txt",
        entity_name="Mass-Energy Equivalence",
    )

    print("\nEquation Processing Results:")
    print(f"Description: {description}")
    print(f"Entity Info: {entity_info}")
async def initialize_rag(api_key: str, base_url: str = None):
    """Create and initialize a LightRAG instance bound to OpenAI models.

    Args:
        api_key: OpenAI API key used for both embeddings and completions.
        base_url: Optional custom API endpoint.

    Returns:
        A ready-to-use LightRAG instance (storages and pipeline status
        initialized). Reads the module-level ``WORKING_DIR`` at call time.
    """

    def embedding_func(texts):
        # Embeddings via OpenAI's large embedding model.
        return openai_embed(
            texts,
            model="text-embedding-3-large",
            api_key=api_key,
            base_url=base_url,
        )

    def llm_model_func(prompt, system_prompt=None, history_messages=None, **kwargs):
        # None sentinel instead of a mutable default argument ([] shared
        # across calls in the original lambda).
        return openai_complete_if_cache(
            "gpt-4o-mini",
            prompt,
            system_prompt=system_prompt,
            history_messages=history_messages if history_messages is not None else [],
            api_key=api_key,
            base_url=base_url,
            **kwargs,
        )

    rag = LightRAG(
        working_dir=WORKING_DIR,
        embedding_func=embedding_func,
        llm_model_func=llm_model_func,
    )

    # Both initialization steps are required before the instance can ingest
    # or query content.
    await rag.initialize_storages()
    await initialize_pipeline_status()

    return rag
def main():
|
|
|
|
"""Main function to run the example"""
|
2025-06-05 17:37:11 +08:00
|
|
|
parser = argparse.ArgumentParser(description="Modal Processors Example")
|
|
|
|
parser.add_argument("--api-key", required=True, help="OpenAI API key")
|
|
|
|
parser.add_argument("--base-url", help="Optional base URL for API")
|
|
|
|
parser.add_argument(
|
|
|
|
"--working-dir", "-w", default=WORKING_DIR, help="Working directory path"
|
|
|
|
)
|
2025-06-05 17:36:05 +08:00
|
|
|
|
|
|
|
args = parser.parse_args()
|
|
|
|
|
|
|
|
# Run examples
|
|
|
|
asyncio.run(main_async(args.api_key, args.base_url))
|
|
|
|
|
2025-06-05 17:37:11 +08:00
|
|
|
|
2025-06-05 17:36:05 +08:00
|
|
|
async def main_async(api_key: str, base_url: str = None):
    """Initialize LightRAG and run every modal-processor example against it."""
    rag = await initialize_rag(api_key, base_url)

    # Bind model callables to the supplied credentials.
    llm_func = get_llm_model_func(api_key, base_url)
    vision_func = get_vision_model_func(api_key, base_url)

    # Exercise each processor in turn: image, table, then equation.
    await process_image_example(rag, vision_func)
    await process_table_example(rag, llm_func)
    await process_equation_example(rag, llm_func)
# Script entry point: parse CLI args and run the async examples.
if __name__ == "__main__":
    main()