mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-24 22:41:05 +00:00 
			
		
		
		
	 bd8a74d686
			
		
	
	
		bd8a74d686
		
			
		
	
	
	
	
		
			
			Given the tendency for shell scripts to quickly reach several levels of indentation and long line lengths, update the default indentation to 2 spaces.
		
			
				
	
	
		
			17 lines
		
	
	
		
			484 B
		
	
	
	
		
			Bash
		
	
	
	
	
	
			
		
		
	
	
			17 lines
		
	
	
		
			484 B
		
	
	
	
		
			Bash
		
	
	
	
	
	
#!/usr/bin/env bash
#
# Example: run unstructured-ingest against a local text file, chunk and embed
# the extracted elements, and write the results to a Box destination.
#
# Environment:
#   EMBEDDING_PROVIDER   Embedding provider name handed to --embedding-provider.
#                        Defaults to "langchain-huggingface" when unset or empty.
#   BOX_APP_CONFIG_PATH  Value handed to --box_app_config. Required.
#
# Before running, replace the --remote-url placeholder below with a real
# destination, e.g. 'box://unstructured/war-and-peace-output'.

# Abort on command failure, on use of an unset variable, and on pipeline errors.
set -euo pipefail

EMBEDDING_PROVIDER=${EMBEDDING_PROVIDER:-"langchain-huggingface"}

# Fail fast with a clear message instead of passing an empty string to the CLI.
: "${BOX_APP_CONFIG_PATH:?BOX_APP_CONFIG_PATH must be set}"

# NOTE(review): --box_app_config uses an underscore while every other flag uses
# hyphens -- confirm the spelling against the installed unstructured-ingest CLI.
unstructured-ingest \
  local \
  --input-path example-docs/book-war-and-peace-1225p.txt \
  --output-dir local-output-to-box \
  --strategy fast \
  --chunk-elements \
  --embedding-provider "$EMBEDDING_PROVIDER" \
  --num-processes 2 \
  --verbose \
  box \
  --box_app_config "$BOX_APP_CONFIG_PATH" \
  --remote-url "<your destination path here, ie 'box://unstructured/war-and-peace-output'>"