diff --git a/OCRmyPDF.sh b/OCRmyPDF.sh index a6f29956..756572fc 100644 --- a/OCRmyPDF.sh +++ b/OCRmyPDF.sh @@ -70,6 +70,7 @@ LOG_ERR="0" # 0=only error messages LOG_INFO="1" # 1=error messages and some infos LOG_DEBUG="2" # 2=debug level logging JHOVE="./jhove/bin/JhoveApp.jar" # java SW for validating the final PDF/A +JHOVE_CFG="./jhove/conf/jhove.conf" # location of the jhove config file # Initialization the configuration parameters with default values VERBOSITY="$LOG_ERR" # default verbosity level @@ -135,7 +136,7 @@ cd "`dirname $0`" ! command -v pdftk > /dev/null && echo "Please install pdftk. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY [ $PREPROCESS_CLEAN -eq 1 ] && ! command -v unpaper > /dev/null && echo "Please install unpaper. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY ! command -v tesseract > /dev/null && echo "Please install tesseract and tesseract-data. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY -! command -v python > /dev/null && echo "Please install python, as well as the following python libraries: reportlab, lxml. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY +! command -v python > /dev/null && echo "Please install python, and the python libraries: reportlab, lxml. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY ! command -v gs > /dev/null && echo "Please install ghostcript. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY ! command -v java > /dev/null && echo "Please install java. Exiting..." >&2 && exit $EXIT_MISSING_DEPENDENCY @@ -309,7 +310,7 @@ done < "$FILE_SIZE_PAGES" # validate generated pdf file (compliance to PDF/A) [ $VERBOSITY -ge $LOG_DEBUG ] && echo "Output file: Checking compliance to PDF/A standard" -java -jar "$JHOVE" -m PDF-hul "$FILE_OUTPUT_PDFA" > "$FILE_VALIDATION_LOG" +java -jar "$JHOVE" -c "$JHOVE_CFG" -m PDF-hul "$FILE_OUTPUT_PDFA" > "$FILE_VALIDATION_LOG" grep -i "Status|Message" "$FILE_VALIDATION_LOG" # summary of the validation [ $VERBOSITY -ge $LOG_DEBUG ] && cat "$FILE_VALIDATION_LOG" # check the validation results diff --git a/jhove/conf/jhove.conf b/jhove/conf/jhove.conf index 8a1ebe9c..bf50f3bf 100644 --- a/jhove/conf/jhove.conf +++ b/jhove/conf/jhove.conf @@ -4,7 +4,7 @@ xmlns="http://hul.harvard.edu/ois/xml/ns/jhove/jhoveConfig" xsi:schemaLocation="http://hul.harvard.edu/ois/xml/ns/jhove/jhoveConfig http://hul.harvard.edu/ois/xml/xsd/jhove/1.4/jhoveConfig.xsd"> - /root/jhove-1_9/jhove/ + /root/OCRmyPDF/jhove/ utf-8 /var/tmp 131072