kotaemon/scripts/download_pdfjs.sh
kan_cin d3fd75297f
feat: add multi-stages docker and support platform arm (#274)
* feat: add multi-stages docker and support platform arm

* refactor: pre-commit

* fix: raise ImportError (fastembed) instead of auto install

* feat: add dependencies for local llm

* feat: free disk

* feat: update README

* feat: update README

* chore: fix typo

---------

Co-authored-by: cin-niko <niko@cinnamon.is>
2024-09-12 20:25:03 +07:00

54 lines
1.3 KiB
Bash

#!/bin/bash
# Download a prebuilt PDF.js distribution and unpack it into a directory.
#
# Usage: <script> <pdfjs_version_dist>
#   <pdfjs_version_dist>  directory that receives the unpacked PDF.js files
#                         (it is passed to download_and_unzip as the
#                         destination directory further down).
set -eo pipefail

# The destination argument is mandatory. "${1:-}" keeps this check well-defined
# even if nounset (set -u) is ever enabled for this script.
if [[ -z "${1:-}" ]]; then
  # A usage error is a diagnostic, so it belongs on stderr, not stdout.
  echo "Usage: $0 <pdfjs_version_dist>" >&2
  exit 1
fi
pdfjs_version_dist=$1
#######################################
# Abort when the current working directory contains whitespace.
# Globals:   PWD (read)
# Arguments: none
# Outputs:   an error message on stderr when whitespace is found
# Returns:   0 when PWD has no whitespace; otherwise exits the shell with 1
#######################################
function check_path_for_spaces() {
  # [[:space:]] also catches tabs and newlines, so the check matches what the
  # message promises ("whitespace") instead of only a literal space.
  local whitespace_re='[[:space:]]'
  if [[ $PWD =~ $whitespace_re ]]; then
    echo "The current workdir has whitespace which can lead to unintended behaviour. Please modify your path and continue later." >&2
    exit 1
  fi
}
#######################################
# Download a zip archive and extract it into a directory.
# If the destination directory already exists the download is skipped.
# On any failure the freshly created destination directory is removed again,
# so a later run retries instead of skipping on a half-populated directory.
# Arguments: $1 - URL of the zip archive
#            $2 - destination directory (created if missing)
# Outputs:   progress messages on stdout, error messages on stderr
# Returns:   0 on success or skip, 2 on missing arguments, 1 on any failure
#######################################
function download_and_unzip() {
  local url=${1:-}
  local dest_dir=${2:-}
  local zip_file

  if [[ -z "$url" || -z "$dest_dir" ]]; then
    echo "download_and_unzip: expected <url> <dest_dir>" >&2
    return 2
  fi

  if [ -d "$dest_dir" ]; then
    echo "Destination directory $dest_dir already exists. Skipping download."
    return 0
  fi

  mkdir -p -- "$dest_dir" || return 1
  zip_file="${dest_dir}/downloaded.zip"

  echo "Downloading $url to $zip_file"
  # -f makes curl fail on HTTP errors instead of saving the error page as the zip.
  if ! curl -fL -o "$zip_file" "$url"; then
    echo "Failed to download $url" >&2
    # The directory was created above; remove it so the next run retries.
    rm -rf -- "$dest_dir"
    return 1
  fi

  echo "Unzipping $zip_file to $dest_dir"
  if ! unzip -o "$zip_file" -d "$dest_dir"; then
    echo "Failed to unzip $zip_file" >&2
    rm -rf -- "$dest_dir"
    return 1
  fi

  rm -f -- "$zip_file"
  echo "Download and unzip completed successfully."
}
# Main script execution

# Validate the working directory first (see check_path_for_spaces); nothing
# below needs to run if that check aborts.
check_path_for_spaces

# Pinned PDF.js release; the archive name and its GitHub release URL are
# derived from this version string.
pdf_js_version="4.0.379"
pdf_js_dist_name="pdfjs-${pdf_js_version}-dist"
printf -v pdf_js_dist_url \
  'https://github.com/mozilla/pdf.js/releases/download/v%s/%s.zip' \
  "${pdf_js_version}" "${pdf_js_dist_name}"

# Fetch the archive and unpack it into the directory given on the command line.
printf '%s\n' "Downloading and unzipping PDF.js"
download_and_unzip "${pdf_js_dist_url}" "${pdfjs_version_dist}"
printf 'PDF.js has been set up in %s\n' "${pdfjs_version_dist}"