diff --git a/src/ocrmypdf/pdfinfo.py b/src/ocrmypdf/pdfinfo.py index 98e62c2e..e53ecc86 100644 --- a/src/ocrmypdf/pdfinfo.py +++ b/src/ocrmypdf/pdfinfo.py @@ -164,8 +164,7 @@ def _interpret_contents(contentstream, initial_shorthand=UNIT_SQUARE): xobject_settings = [] inline_images = [] found_text = False - text_operators = tuple( - pikepdf.Operator(op) for op in ('Tj', 'TJ', '"', "'")) + text_operators = set(['Tj', 'TJ', '"', "'"]) operator_whitelist = """q Q Do cm TJ Tj " ' BI ID EI""" for n, op in enumerate(_normalize_stack(