From 4db4df5c727a112b32d37dac4259c1c19c06cbef Mon Sep 17 00:00:00 2001
From: Olivier Scherler
Date: Wed, 25 May 2022 12:05:07 +0200
Subject: [PATCH] Log a warning instead of failing on images with a corrupt ICC profile.

---
 src/ocrmypdf/pdfinfo/info.py | 20 +++++++++++++-------
 1 file changed, 13 insertions(+), 7 deletions(-)

diff --git a/src/ocrmypdf/pdfinfo/info.py b/src/ocrmypdf/pdfinfo/info.py
index c63bfa03..67781e14 100644
--- a/src/ocrmypdf/pdfinfo/info.py
+++ b/src/ocrmypdf/pdfinfo/info.py
@@ -38,6 +38,7 @@ from pikepdf import (
     PdfInlineImage,
     PdfMatrix,
     parse_content_stream,
+    UnsupportedImageTypeError,
 )
 
 from ocrmypdf._concurrent import Executor, SerialExecutor
@@ -350,13 +351,18 @@ class ImageInfo:
 
         if self._color == Colorspace.icc:
             # Check the ICC profile to determine actual colorspace
-            pim_icc = pim.icc
-            if pim_icc.profile.xcolor_space == 'GRAY':
-                self._comp = 1
-            elif pim_icc.profile.xcolor_space == 'CMYK':
-                self._comp = 4
-            else:
-                self._comp = 3
+            try:
+                pim_icc = pim.icc
+                if pim_icc.profile.xcolor_space == 'GRAY':
+                    self._comp = 1
+                elif pim_icc.profile.xcolor_space == 'CMYK':
+                    self._comp = 4
+                else:
+                    self._comp = 3
+            except UnsupportedImageTypeError as ex:
+                logger.warn('Unreadable image: {}. {}'.format(ex, self))
+                self._comp = None
+
         else:
             if isinstance(self._color, Colorspace):
                 self._comp = FRIENDLY_COMP.get(self._color)