2022-04-20 12:27:53 +02:00
|
|
|
# shellcheck shell=bash disable=SC2154
|
|
|
|
|
2022-10-06 13:28:47 +02:00
|
|
|
# check if stdin is present if selected
|
|
|
|
if [[ ${args[file]} == '-' ]] || [[ ${args[file]} == '"-"' ]] && [ -t 0 ]; then
|
|
|
|
orcli_batch_usage
|
|
|
|
exit 1
|
|
|
|
fi
|
|
|
|
|
2022-04-20 12:27:53 +02:00
|
|
|
# locate orcli and OpenRefine
|
|
|
|
if command -v orcli &>/dev/null; then
|
|
|
|
orcli="orcli"
|
|
|
|
elif [[ -x "orcli" ]]; then
|
|
|
|
orcli="./orcli"
|
|
|
|
else
|
|
|
|
error "orcli is not executable!" "Try: chmod + ./orcli"
|
|
|
|
fi
|
|
|
|
if [[ -x "refine" ]]; then
|
|
|
|
openrefine="./refine"
|
|
|
|
else
|
|
|
|
error "OpenRefine's startup script (refine) not found!" "Did you put orcli in your OpenRefine app dir?"
|
|
|
|
fi
|
|
|
|
|
|
|
|
# create tmp directory
|
|
|
|
tmpdir="$(mktemp -d)"
|
|
|
|
trap '{ rm -rf "$tmpdir"; }' 0 2 3 15
|
|
|
|
|
|
|
|
# update OPENREFINE_URL env
|
|
|
|
OPENREFINE_URL="http://localhost:${args[--port]}"
|
|
|
|
|
2022-10-06 13:28:47 +02:00
|
|
|
# catch args, convert the space delimited string to an array
|
|
|
|
files=()
|
|
|
|
eval "files=(${args[file]})"
|
|
|
|
# read pipes if name starts with /dev/fd
|
|
|
|
for i in "${!files[@]}"; do
|
|
|
|
if [[ ${files[$i]} == "/dev/fd"* ]]; then
|
|
|
|
if ! cat "${files[$i]}" >"${tmpdir}/${files[$i]//[^A-Za-z0-9._-]/_}"; then
|
|
|
|
error "reading of ${files[$i]} failed!"
|
|
|
|
fi
|
|
|
|
files[$i]="${tmpdir}/${files[$i]//[^A-Za-z0-9._-]/_}"
|
|
|
|
fi
|
|
|
|
done
|
|
|
|
|
2022-04-20 12:27:53 +02:00
|
|
|
# check if OpenRefine is already running
|
|
|
|
if curl -fs "${OPENREFINE_URL}" &>/dev/null; then
|
|
|
|
error "OpenRefine is already running on port ${args[--port]}." "Hint: Stop the other process or use another port."
|
|
|
|
fi
|
|
|
|
|
|
|
|
# start OpenRefine with tmp workspace and autosave period 25 hours
|
2022-04-20 12:51:51 +02:00
|
|
|
REFINE_AUTOSAVE_PERIOD=1440 $openrefine -d "$tmpdir" -m "${args[--memory]}" -p "${args[--port]}" -x refine.headless=true -v warn &>"$tmpdir/openrefine.log" &
|
2022-04-20 12:27:53 +02:00
|
|
|
openrefine_pid="$!"
|
|
|
|
|
|
|
|
# update trap to kill OpenRefine on error or exit
|
|
|
|
trap '{ rm -rf "$tmpdir"; kill -9 "$openrefine_pid"; }' 0 2 3 15
|
|
|
|
|
|
|
|
# wait until OpenRefine is running (timeout 20s)
|
|
|
|
if ! curl -fs --retry 20 --retry-connrefused --retry-delay 1 "${OPENREFINE_URL}/command/core/get-version" &>/dev/null; then
|
|
|
|
error "starting OpenRefine server failed!"
|
|
|
|
else
|
|
|
|
log "started OpenRefine" "port: ${args[--port]}" "memory: ${args[--memory]}" "tmpdir: ${tmpdir}" "pid: ${openrefine_pid}"
|
|
|
|
fi
|
|
|
|
|
2022-10-06 13:28:47 +02:00
|
|
|
# execute shell script
|
|
|
|
export orcli tmpdir OPENREFINE_URL openrefine_pid
|
|
|
|
bash -e "${files[@]}"
|