2023-10-30 16:09:49 -04:00
|
|
|
#!/usr/bin/env bash
|
|
|
|
#TODO currently box api/sdk does not work to create folders and check for content similar to other fsspec ingest tests
|
|
|
|
|
|
|
|
#
|
|
|
|
#set -e
|
|
|
|
#
|
2023-11-01 15:23:44 -04:00
|
|
|
#DEST_PATH=$(dirname "$(realpath "$0")")
|
|
|
|
#SCRIPT_DIR=$(dirname "$DEST_PATH")
|
2023-10-30 16:09:49 -04:00
|
|
|
#cd "$SCRIPT_DIR"/.. || exit 1
|
|
|
|
#OUTPUT_FOLDER_NAME=box-dest
|
2023-11-02 16:41:56 -05:00
|
|
|
#OUTPUT_DIR=$OUTPUT_ROOT/structured-output/$OUTPUT_FOLDER_NAME
|
|
|
|
#WORK_DIR=$OUTPUT_ROOT/workdir/$OUTPUT_FOLDER_NAME
|
2023-10-30 16:09:49 -04:00
|
|
|
#max_processes=${MAX_PROCESSES:=$(python3 -c "import os; print(os.cpu_count())")}
|
2023-11-07 15:14:01 -08:00
|
|
|
#DESTINATION_BOX="box://utic-dev-tech-fixtures/utic-ingest-test-fixtures-output/$(uuidgen)/"
|
2023-10-30 16:09:49 -04:00
|
|
|
#
|
|
|
|
#CI=${CI:-"false"}
|
|
|
|
#
|
|
|
|
#if [ -z "$BOX_APP_CONFIG" ] && [ -z "$BOX_APP_CONFIG_PATH" ]; then
|
|
|
|
# echo "Skipping Box ingest test because neither BOX_APP_CONFIG nor BOX_APP_CONFIG_PATH env vars are set."
|
|
|
|
# exit 0
|
|
|
|
#fi
|
|
|
|
#
|
|
|
|
#if [ -z "$BOX_APP_CONFIG_PATH" ]; then
|
|
|
|
# # Create temporary service key file
|
|
|
|
# BOX_APP_CONFIG_PATH=$(mktemp)
|
|
|
|
# echo "$BOX_APP_CONFIG" >"$BOX_APP_CONFIG_PATH"
|
|
|
|
#fi
|
|
|
|
#
|
|
|
|
## shellcheck disable=SC1091
|
|
|
|
#source "$SCRIPT_DIR"/cleanup.sh
|
|
|
|
#function cleanup() {
|
|
|
|
# cleanup_dir "$OUTPUT_DIR"
|
|
|
|
# cleanup_dir "$WORK_DIR"
|
|
|
|
# if [ "$CI" == "true" ]; then
|
|
|
|
# cleanup_dir "$DOWNLOAD_DIR"
|
|
|
|
# fi
|
|
|
|
#}
|
|
|
|
#trap cleanup EXIT
|
|
|
|
#
|
2023-11-02 16:41:56 -05:00
|
|
|
#RUN_SCRIPT=${RUN_SCRIPT:-./unstructured/ingest/main.py}
|
|
|
|
#PYTHONPATH=${PYTHONPATH:-.} "$RUN_SCRIPT" \
|
2023-10-30 16:09:49 -04:00
|
|
|
# local \
|
|
|
|
# --num-processes "$max_processes" \
|
|
|
|
# --output-dir "$OUTPUT_DIR" \
|
|
|
|
# --strategy fast \
|
|
|
|
# --verbose \
|
|
|
|
# --reprocess \
|
|
|
|
# --input-path example-docs/fake-memo.pdf \
|
|
|
|
# --work-dir "$WORK_DIR" \
|
|
|
|
# box \
|
|
|
|
# --box-app-config "$BOX_APP_CONFIG_PATH" \
|
|
|
|
# --remote-url "$DESTINATION_BOX" \
|
|
|
|
#
|
|
|
|
## Simply check the number of files uploaded
|
|
|
|
#expected_num_files=1
|