mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-07-03 23:20:35 +00:00

Adds MongoDB as a source (we already had it as a destination connector).

---------

Co-authored-by: potter-potter <david.potter@gmail.com>
11 lines
309 B
Bash
11 lines
309 B
Bash
#!/usr/bin/env bash

# Example invocation of the `unstructured-ingest` CLI using its `mongodb`
# subcommand (MongoDB as the source of documents).
#
# Before running, replace the three quoted <...> placeholders below with a
# real connection URI, database name, and collection name. They must stay
# quoted so the shell passes each one as a single literal argument instead of
# interpreting `<` and `>` as redirections.
#
# The output directory is given as the relative path `mongodb-ingest-output`,
# so it is resolved against the directory the script is run from.
#
# The whole command is one logical line: every line except the last ends in a
# backslash continuation, and nothing may follow that backslash.

unstructured-ingest \
  mongodb \
  --metadata-exclude filename,file_directory,metadata.data_source.date_processed \
  --uri "<MongoDB uri>" \
  --database "<MongoDB Database Name>" \
  --collection "<MongoDB Collection name>" \
  --output-dir mongodb-ingest-output \
  --num-processes 2