mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-31 01:54:25 +00:00 
			
		
		
		
	 d7f4c24e21
			
		
	
	
		d7f4c24e21
		
			
		
	
	
	
	
		
			
			To test: cd docs && make HTML changelogs: point main readme to the correct connector html page point chroma docs to correct sample code --------- Co-authored-by: potter-potter <david.potter@gmail.com>
		
			
				
	
	
		
			56 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			56 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| from unstructured.ingest.connector.chroma import (
 | |
|     ChromaAccessConfig,
 | |
|     ChromaWriteConfig,
 | |
|     SimpleChromaConfig,
 | |
| )
 | |
| from unstructured.ingest.connector.local import SimpleLocalConfig
 | |
| from unstructured.ingest.interfaces import (
 | |
|     ChunkingConfig,
 | |
|     EmbeddingConfig,
 | |
|     PartitionConfig,
 | |
|     ProcessorConfig,
 | |
|     ReadConfig,
 | |
| )
 | |
| from unstructured.ingest.runner import LocalRunner
 | |
| from unstructured.ingest.runner.writers.base_writer import Writer
 | |
| from unstructured.ingest.runner.writers.chroma import (
 | |
|     ChromaWriter,
 | |
| )
 | |
| 
 | |
| 
 | |
def get_writer() -> Writer:
    """Build the Chroma destination writer used by this example.

    The connector is configured with host "localhost", port 8000, the
    "elements" collection, and the "default_tenant" / "default_database"
    tenant and database names. Access and write settings are constructed
    with no arguments.

    Returns:
        A ChromaWriter wired up with the connector and write configs above.
    """
    chroma_connection = SimpleChromaConfig(
        access_config=ChromaAccessConfig(),
        host="localhost",
        port=8000,
        collection_name="elements",
        tenant="default_tenant",
        database="default_database",
    )
    chroma_write_options = ChromaWriteConfig()

    return ChromaWriter(
        connector_config=chroma_connection,
        write_config=chroma_write_options,
    )
 | |
| 
 | |
| 
 | |
if __name__ == "__main__":
    # Destination: the Chroma writer defined by get_writer().
    writer = get_writer()

    # Processing options passed to the runner.
    processing_options = ProcessorConfig(
        verbose=True,
        output_dir="local-output-to-chroma",
        num_processes=2,
    )

    # Source: a single local example document.
    local_source = SimpleLocalConfig(
        input_path="example-docs/book-war-and-peace-1225p.txt",
    )

    # Read and partition configs are constructed with no arguments.
    read_options = ReadConfig()
    partition_options = PartitionConfig()

    # Chunk the partitioned elements, then embed them with the
    # "langchain-huggingface" provider.
    chunking_options = ChunkingConfig(chunk_elements=True)
    embedding_options = EmbeddingConfig(
        provider="langchain-huggingface",
    )

    runner = LocalRunner(
        processor_config=processing_options,
        connector_config=local_source,
        read_config=read_options,
        partition_config=partition_options,
        chunking_config=chunking_options,
        embedding_config=embedding_options,
        writer=writer,
        writer_kwargs={},
    )
    runner.run()
 |