BUG: fix image look-up table in EncodedStreamObject

closes py-pdf#2124, closes py-pdf#2110
pubpub-zz · Aug 28, 2023 · 9188157 · 9188157
1 parent 0ab320c
commit 9188157
Show file tree

Hide file tree

Showing 2 changed files with 11 additions and 1 deletion.
diff --git a/pypdf/filters.py b/pypdf/filters.py
@@ -58,6 +58,7 @@
     ArrayObject,
     DecodedStreamObject,
     DictionaryObject,
+    EncodedStreamObject,
     IndirectObject,
     NullObject,
 )
@@ -860,7 +861,7 @@ def bits2byte(data: bytes, size: Tuple[int, int], bits: int) -> bytes:
         if color_space == "/Indexed":
             from .generic import TextStringObject
 
-            if isinstance(lookup, DecodedStreamObject):
+            if isinstance(lookup, (EncodedStreamObject, DecodedStreamObject)):
                 lookup = lookup.get_data()
             if isinstance(lookup, TextStringObject):
                 lookup = lookup.original_bytes

diff --git a/tests/test_filters.py b/tests/test_filters.py
@@ -585,3 +585,12 @@ def test_jpx_no_spacecode():
     with pytest.raises(PdfReadError) as exc:
         reader.pages[0].images[0]
     assert exc.value.args[0].startswith("ColorSpace field not found")
+
+
+@pytest.mark.enable_socket()
+def test_encodedstream_lookup():
+    """From #2124: fetch the issue's sample PDF and extract the first image of page index 12."""
+    url = "https://github.com/py-pdf/pypdf/files/12455580/10.pdf"
+    name = "iss2124.pdf"
+    reader = PdfReader(BytesIO(get_data_from_url(url, name=name)))
+    reader.pages[12].images[0]  # no assert: the test passes as long as this access does not raise