From e86d1ff6d4e5b66a91b242966028a0022408e050 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Diego=20Elio=20Petten=C3=B2?= Date: Mon, 31 Aug 2020 11:46:37 +0100 Subject: [PATCH] Fix out-of-bound access on some PDFs. MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Replace the non-emptiness check with a minimum length check — you can't get the second-to-last item in a list of fewer than two items. --- pdfminer/pdfdocument.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pdfminer/pdfdocument.py b/pdfminer/pdfdocument.py index 19187aee..108d3487 100644 --- a/pdfminer/pdfdocument.py +++ b/pdfminer/pdfdocument.py @@ -669,7 +669,7 @@ def _getobj_parse(self, pos, objid): while kwd is not self.KEYWORD_OBJ: (_, kwd) = self._parser.nexttoken() x.append(kwd) - if x: + if len(x) >= 2: objid1 = x[-2] # #### end hack around malformed pdf files if objid1 != objid: