2023-05-01 22:57:48 +02:00
|
|
|
#!/bin/bash
|
|
|
|
|
|
|
|
# Seed the tessdata volume directory from the pristine copy kept under
# tessdata-original. -n means files already present in the volume are kept.
echo "Copying original files without overwriting existing files"
tessdata_dir=/usr/share/tessdata
mkdir -p "$tessdata_dir"
cp -rn /usr/share/tessdata-original/* "$tessdata_dir"

# For each tesseract-ocr version directory that exists, copy its tessdata
# files on top (these copies DO overwrite). A failed copy is deliberately
# ignored so that startup continues.
for tess_version in 4.00 5; do
  version_dir="/usr/share/tesseract-ocr/${tess_version}/tessdata"
  [ -d "$version_dir" ] || continue
  cp -r "$version_dir"/* "$tessdata_dir" || true
done
|
|
|
|
|
2024-03-08 21:49:19 +01:00
|
|
|
|
|
|
|
# Align the service account with the IDs requested through the environment.
#   PUID  - desired numeric UID for stirlingpdfuser (optional)
#   PGID  - desired numeric GID for stirlingpdfgroup (optional)
#   UMASK - file-creation mask to apply to this shell (optional)
# usermod/groupmod are only invoked when the requested ID differs from the
# current one; -o permits an ID that is already in use by another account.
if [[ -n "${PUID:-}" && "$PUID" != "$(id -u stirlingpdfuser)" ]]; then
  usermod -o -u "$PUID" stirlingpdfuser
fi

# `id -g NAME` resolves a *user* name, so it cannot look up stirlingpdfgroup
# and would always report a mismatch. Read the group's GID (third field of
# its group database entry) instead.
if [[ -n "${PGID:-}" && "$PGID" != "$(getent group stirlingpdfgroup | cut -d: -f3)" ]]; then
  groupmod -o -g "$PGID" stirlingpdfgroup
fi

# Only change the mask when one was supplied; `umask ""` is an error.
if [[ -n "${UMASK:-}" ]]; then
  umask "$UMASK"
fi
|
|
|
|
|
2024-03-04 21:51:49 +01:00
|
|
|
# Give stirlingpdfuser:stirlingpdfgroup ownership of the listed directories
# and set mode 755 on them, both recursively.
echo "Setting permissions and ownership for necessary directories..."
app_paths=(
  /logs
  /scripts
  /usr/share/fonts/opentype/noto
  /usr/share/tessdata
  /configs
  /customFiles
)
chown -R stirlingpdfuser:stirlingpdfgroup "${app_paths[@]}"
chmod -R 755 "${app_paths[@]}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2023-07-29 14:53:30 +02:00
|
|
|
# Install extra Tesseract language packs requested via TESSERACT_LANGS, a
# comma-separated list of language codes (for example "deu,fra").
if [[ -n "${TESSERACT_LANGS:-}" ]]; then
  # Turn commas into spaces, then split on whitespace into an array. Reading
  # into an array (instead of expanding the value unquoted) keeps glob
  # characters in the value from being expanded against the filesystem.
  # With -d '' read consumes the whole value and returns non-zero at end of
  # input; that status is expected, hence the `|| true`.
  read -r -d '' -a tess_langs <<< "${TESSERACT_LANGS//,/ }" || true

  # Only codes shaped like "eng" or "chi_sim" are handed to apk.
  pattern='^[a-zA-Z]{2,4}(_[a-zA-Z]{2,4})?$'

  # Install each language pack. The loop variable must not be called LANG:
  # that is the locale variable, and overwriting it would change the locale
  # seen by every command run after this loop.
  for tess_lang in "${tess_langs[@]}"; do
    if [[ $tess_lang =~ $pattern ]]; then
      apk add --no-cache "tesseract-ocr-data-$tess_lang"
    else
      echo "Skipping invalid language code"
    fi
  done
fi
|
|
|
|
|
2024-03-04 21:51:49 +01:00
|
|
|
# Optional feature: when INSTALL_BOOK_AND_ADVANCED_HTML_OPS is exactly "true",
# install calibre from the repository tagged @testing. Any other value
# (including unset) installs nothing.
case "$INSTALL_BOOK_AND_ADVANCED_HTML_OPS" in
  true)
    apk add --no-cache calibre@testing
    ;;
esac
|
|
|
|
|
|
|
|
|
|
|
|
|
2023-12-18 15:52:18 +01:00
|
|
|
# Run the security-jar helper script first.
# NOTE(review): what it downloads and where is defined in that script, not here.
/scripts/download-security-jar.sh

# Replace this shell with the requested command, run as stirlingpdfuser via
# su-exec; the script's own arguments are forwarded unchanged.
service_account=stirlingpdfuser
exec su-exec "$service_account" "$@"
|