Skip to content

Commit a9fe98d

Browse files
authored
ROB: Accept '/annn' charset as ASCII code (#1316)
Closes #1312
1 parent 475bd68 commit a9fe98d

File tree

2 files changed

+18
-0
lines changed

2 files changed

+18
-0
lines changed

PyPDF2/_codecs/adobe_glyphs.py

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13425,3 +13425,13 @@
1342513425
"/zukatakana": "\u30BA",
1342613426
"/zwarakay": "\u0659",
1342713427
}
13428+
13429+
13430+
def _complete() -> None:
    """Add code-based glyph names to ``adobe_glyphs``.

    Registers ``/a0`` through ``/a255``, each mapped to the character whose
    code point is that number, and maps ``/.notdef`` to ``□``. Any existing
    entries under those keys are overwritten.
    """
    # The module-level dict is mutated in place (never rebound), so a plain
    # global lookup is sufficient here.
    adobe_glyphs.update((f"/a{code}", chr(code)) for code in range(256))
    adobe_glyphs["/.notdef"] = "□"
13435+
13436+
13437+
# Run once at import time so the extra glyph entries are present in the table.
_complete()

tests/test_cmap.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,3 +46,11 @@ def test_get_font_width_from_default(): # L40
4646
reader = PdfReader(BytesIO(get_pdf_from_url(url, name=name)))
4747
for page in reader.pages:
4848
page.extract_text()
49+
50+
51+
def test_ascii_charset():
    """Regression test for issue #1312.

    Extracted text of the first page must not contain a raw ``/a`` glyph-name
    fragment.
    """
    pdf_bytes = get_pdf_from_url(
        "https://github.com/py-pdf/PyPDF2/files/9472500/main.pdf",
        name="ascii charset.pdf",
    )
    first_page = PdfReader(BytesIO(pdf_bytes)).pages[0]
    extracted = first_page.extract_text()
    assert "/a" not in extracted

0 commit comments

Comments
 (0)