From 9f78915ea6353b041b36f7f9c53ab98d4d91ab93 Mon Sep 17 00:00:00 2001 From: "yusuke.shinyama.dummy" Date: Tue, 23 Nov 2010 10:53:19 +0000 Subject: [PATCH] show cid for unknown characters git-svn-id: https://pdfminer.googlecode.com/svn/trunk/pdfminer@275 1aa58f4a-7d42-0410-adbc-911cccaed67c --- pdfminer/converter.py | 2 +- pdfminer/pdffont.py | 4 +++- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/pdfminer/converter.py b/pdfminer/converter.py index a5476e6..8fcf7f1 100644 --- a/pdfminer/converter.py +++ b/pdfminer/converter.py @@ -105,7 +105,7 @@ class PDFLayoutAnalyzer(PDFTextDevice): def handle_undefined_char(self, font, cid): if self.debug: print >>sys.stderr, 'undefined: %r, %r' % (font, cid) - return '?' + return '(cid:%d)' % cid def receive_layout(self, ltpage): return diff --git a/pdfminer/pdffont.py b/pdfminer/pdffont.py index a8da08e..1d7c5ed 100644 --- a/pdfminer/pdffont.py +++ b/pdfminer/pdffont.py @@ -399,6 +399,8 @@ class TrueTypeFont(object): else: for c in xrange(sc, ec+1): char2gid[c] = (c + idd) & 0xffff + else: + assert 0 # create unicode map unicode_map = FileUnicodeMap() for (char,gid) in char2gid.iteritems(): @@ -668,7 +670,7 @@ class PDFCIDFont(PDFFont): def main(argv): for fname in argv[1:]: fp = file(fname, 'rb') - CFFFont(fp) + font = TrueTypeFont(fname, fp) fp.close() return