Skip to content

Commit 40c5710

Browse files
Decode name objects as UTF-8 with a cp949 fallback, replacing chardet-based encoding detection.
1 parent c785211 commit 40c5710

2 files changed

Lines changed: 7 additions & 6 deletions

File tree

PyPDF2/generic.py

Lines changed: 7 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,6 @@
4444
import decimal
4545
import codecs
4646
import sys
47-
import chardet
4847
#import debugging
4948

5049
ObjectPrefix = b_('/<[tf(n%')
@@ -478,12 +477,16 @@ def readFromStream(stream, pdf):
478477
name = stream.read(1)
479478
if name != NameObject.surfix:
480479
raise utils.PdfReadError("name read error")
481-
name += utils.readUntilRegex(stream, NameObject.delimiterPattern, ignore_eof=True)
480+
name += utils.readUntilRegex(stream, NameObject.delimiterPattern,
481+
ignore_eof=True)
482482
if debug: print(name)
483483
try:
484-
encoding = chardet.detect(name)['encoding']
485-
return NameObject(name.decode(encoding if encoding else 'utf-8'))
484+
return NameObject(name.decode('utf-8'))
486485
except (UnicodeEncodeError, UnicodeDecodeError) as e:
486+
try:
487+
return NameObject(name.decode('cp949'))
488+
except (UnicodeEncodeError, UnicodeDecodeError) as e:
489+
pass
487490
# Name objects should represent irregular characters
488491
# with a '#' followed by the symbol's hex number
489492
if not pdf.strict:

requirements.txt

Lines changed: 0 additions & 2 deletions
This file was deleted.

0 commit comments

Comments
 (0)