py-pdf · MartinThoma · Dec 9, 2022 · Nov 30, 2022 · Nov 30, 2022 · Dec 7, 2022
diff --git a/PyPDF2/filters.py b/PyPDF2/filters.py
@@ -602,10 +602,12 @@ def _xobj_to_image(x_object_obj: Dict[str, Any]) -> Tuple[Optional[str], bytes]:
                 from .generic import ByteStringObject
 
                 if isinstance(lookup, ByteStringObject):
+                    if base == ColorSpaces.DEVICE_GRAY and len(lookup) == hival + 1:
+                        lookup = b"".join([lookup[i:i + 1] * 3 for i in range(len(lookup))])
                     img.putpalette(lookup)
                 else:
                     img.putpalette(lookup.get_data())
-                img = img.convert("RGB")
+                img = img.convert("L" if base == ColorSpaces.DEVICE_GRAY else "RGB")
             if G.S_MASK in x_object_obj:  # add alpha channel
                 alpha = Image.frombytes("L", size, x_object_obj[G.S_MASK].get_data())
                 img.putalpha(alpha)

diff --git a/resources/grayscale.pdf b/resources/grayscale.pdf
diff --git a/tests/test_reader.py b/tests/test_reader.py
@@ -185,6 +185,7 @@ def test_get_outline(src, outline_elements):
             marks=pytest.mark.xfail(reason="broken image extraction"),
         ),
         ("imagemagick-CCITTFaxDecode.pdf", ["Im0.tiff"]),
+        ("grayscale.pdf", ["X0.png"]),
     ],
 )
 def test_get_images(src, expected_images):