py-pdf · MartinThoma · Apr 24, 2022 · Mar 6, 2021 · Apr 9, 2022 · Apr 24, 2022
diff --git a/PyPDF2/pdf.py b/PyPDF2/pdf.py
@@ -2205,7 +2205,13 @@ def _authenticateUserPassword(self, password):
         rev = encrypt['/R'].getObject()
         owner_entry = encrypt['/O'].getObject()
         p_entry = encrypt['/P'].getObject()
-        id_entry = self.trailer[TK.ID].getObject()
+        if TK.ID in self.trailer:
+            id_entry = self.trailer[TK.ID].getObject()
+        else:
+            # Some documents have no /ID entry in the trailer; fall back
+            # to two empty byte strings in that case. Fixes
+            # https://github.com/mstamy2/PyPDF2/issues/608
+            id_entry = ArrayObject([ByteStringObject(b''), ByteStringObject(b'')])
         id1_entry = id_entry[0].getObject()
         real_U = encrypt['/U'].getObject().original_bytes
         if rev == 2:

diff --git a/Resources/encrypted_doc_no_id.pdf b/Resources/encrypted_doc_no_id.pdf
diff --git a/Tests/test_reader.py b/Tests/test_reader.py
@@ -486,3 +486,18 @@ def test_do_not_get_stuck_on_large_files_without_start_xref():
     # parsing is expected take less than a second on a modern cpu, but include a large
     # tolerance to account for busy or slow systems
     assert parse_duration < 60
+
+
+def test_PdfReaderDecryptWhenNoID():
+    """
+    Decrypt, with an empty password, an encrypted file that is missing the
+    'ID' value in its trailer, then check the document info read back.
+    Regression test for https://github.com/mstamy2/PyPDF2/issues/608
+    """
+
+    with open(
+        os.path.join(RESOURCE_ROOT, "encrypted_doc_no_id.pdf"), "rb"
+    ) as inputfile:
+        ipdf = PdfFileReader(inputfile)
+        ipdf.decrypt("")
+        assert ipdf.getDocumentInfo() == {"/Producer": "European Patent Office"}