mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-07-03 15:11:30 +00:00
27 lines
758 B
Bash
27 lines
758 B
Bash
![]() |
#!/bin/bash

# Runs scripts/html/elements_json_to_html.py over the
# "expected-structured-output" directory that sits next to this script.
#
# Usage: <this script> [OUTPUT_DIR]
#   OUTPUT_DIR  directory handed to the Python script via --outdir;
#               defaults to "structured-output-html" next to this script.

# Define the input and output top directories
# Resolve the script path in its own step: inside a nested
# $(dirname "$(realpath ...)") a realpath failure is masked, because
# `dirname ""` succeeds and prints ".", silently making every path below
# relative to the current working directory.
script_path=$(realpath "$0") || {
  printf 'error: cannot resolve the path of %s\n' "$0" >&2
  exit 1
}
SCRIPT_DIR=$(dirname "$script_path")
OUTPUT_DIR=${1:-"$SCRIPT_DIR/structured-output-html"}
INPUT_DIR="$SCRIPT_DIR/expected-structured-output"
PYTHON_SCRIPT="$SCRIPT_DIR/../scripts/html/elements_json_to_html.py"

# Flag toggles: a value of 1 adds the matching option to the Python call.
EXCLUDE_IMG=0 # 1 => --exclude-img
NO_GROUP=1    # 1 => --no-group

#######################################
# Run "$PYTHON_SCRIPT" once with "$INPUT_DIR" as its positional argument.
# Globals:
#   PYTHON_SCRIPT (read) - path of the Python script to execute
#   INPUT_DIR     (read) - directory passed as the positional argument
#   OUTPUT_DIR    (read) - directory passed via --outdir
#   EXCLUDE_IMG   (read) - when 1, --exclude-img is appended
#   NO_GROUP      (read) - when 1, --no-group is appended
#   PYTHONPATH    (read) - forwarded to python; "." when unset or empty
# Arguments:
#   None
# Returns:
#   Exit status of the python invocation.
#######################################
process_json_files() {
  # Keep the argv in an array rather than a string that is later eval'd:
  # eval re-parses the paths as shell code, so "$", backticks, or double
  # quotes inside a directory name would be expanded or break the command.
  local -a converter_args=(
    "$PYTHON_SCRIPT"
    "$INPUT_DIR"
    --outdir "$OUTPUT_DIR"
  )

  # Add flags based on the variables (an unset toggle counts as 0)
  if [ "${EXCLUDE_IMG:-0}" -eq 1 ]; then
    converter_args+=(--exclude-img)
  fi
  if [ "${NO_GROUP:-0}" -eq 1 ]; then
    converter_args+=(--no-group)
  fi

  # The assignment prefix scopes PYTHONPATH to this single command.
  PYTHONPATH="${PYTHONPATH:-.}" python "${converter_args[@]}"
}

# Start processing from the input directory. This is the last command, so
# the script exits with whatever status process_json_files returns.
process_json_files