mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-31 18:14:51 +00:00 
			
		
		
		
	 bd8a74d686
			
		
	
	
		bd8a74d686
		
			
		
	
	
	
	
		
			
			Given the tendency for shell scripts to easily enter into a few levels of indentation and long line lengths, update the default to 2 spaces.
		
			
				
	
	
		
			25 lines
		
	
	
		
			740 B
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			25 lines
		
	
	
		
			740 B
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
#!/usr/bin/env bash

# Ingests Slack text channels through the Unstructured ingest CLI
# (unstructured/ingest/main.py, `slack` subcommand).
#
# Downloads are written to slack-ingest-download/ and structured outputs are
# stored in slack-ingest-output/, both relative to the directory three levels
# above this script (the working directory the command is launched from).
#
# --channels is a comma separated list of channel IDs.
# Bot user must be in the channels for them to be ingested.
# --start-date / --end-date bound the ingested time range; they are presumably
# optional (an earlier revision of this header called them "oldest, latest"
# and described them as optional) -- TODO confirm against the CLI.
#
# NOTE(review): the --channels and --token values below look like
# placeholders; substitute real values before running.

# Resolve the directory holding this script. Abort if that fails: an empty
# SCRIPT_DIR would make the following cd resolve to "/../../.." (i.e. "/")
# and the ingest command would then run from the wrong place.
SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &>/dev/null && pwd) || exit 1
cd "$SCRIPT_DIR"/../../.. || exit 1

# PYTHONPATH=. lets main.py import the package from the current directory.
PYTHONPATH=. ./unstructured/ingest/main.py \
  slack \
  --channels 12345678 \
  --token 12345678 \
  --download-dir slack-ingest-download \
  --output-dir slack-ingest-output \
  --start-date 2023-04-01T01:00:00-08:00 \
  --end-date 2023-04-02