From c4c0a36e4f18bbb782ab87e07528fbc81ce6ddeb Mon Sep 17 00:00:00 2001 From: Andrew Baumann Date: Mon, 25 Feb 2019 13:08:04 -0800 Subject: [PATCH 1/5] name2unicode(): handle hexadecimal constants for unicode glyphs fixes #183, #229 --- pdfminer/encodingdb.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/pdfminer/encodingdb.py b/pdfminer/encodingdb.py index 870bd28..468b3db 100644 --- a/pdfminer/encodingdb.py +++ b/pdfminer/encodingdb.py @@ -6,7 +6,7 @@ from .latin_enc import ENCODING import six # Python 2+3 compatibility -STRIP_NAME = re.compile(r'[0-9]+') +STRIP_NAME = re.compile(r'[0-9A-Fa-f]+') ## name2unicode @@ -18,7 +18,7 @@ def name2unicode(name): m = STRIP_NAME.search(name) if not m: raise KeyError(name) - return six.unichr(int(m.group(0))) + return six.unichr(int(m.group(0), base=16)) ## EncodingDB From bfbb8b8f0bbbac88539d28905839388b867e03af Mon Sep 17 00:00:00 2001 From: Kaushik Acharya Date: Thu, 15 Aug 2019 11:59:29 +0530 Subject: [PATCH 2/5] Adding Denis's article name. --- docs/programming.html | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/programming.html b/docs/programming.html index b01eef9..c72ab48 100644 --- a/docs/programming.html +++ b/docs/programming.html @@ -182,7 +182,7 @@ Could be used for framing another pictures or figures.

-Also, check out a more complete example by Denis Papathanasiou. +Also, check out a more complete example by Denis Papathanasiou(Extracting Text & Images from PDF Files).

Obtaining Table of Contents

From 963a227b2e3fc7c7327b7e49dbdad9a7656e66aa Mon Sep 17 00:00:00 2001 From: Kaushik Acharya Date: Mon, 19 Aug 2019 20:16:34 +0530 Subject: [PATCH 3/5] Updated URL for the article --- docs/programming.html | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/programming.html b/docs/programming.html index c72ab48..dc4c186 100644 --- a/docs/programming.html +++ b/docs/programming.html @@ -182,7 +182,7 @@ Could be used for framing another pictures or figures.

-Also, check out a more complete example by Denis Papathanasiou(Extracting Text & Images from PDF Files). +Also, check out a more complete example by Denis Papathanasiou(Extracting Text & Images from PDF Files).

Obtaining Table of Contents

From 2156efe64fae5715de4a8cbe3dba7f020b313c03 Mon Sep 17 00:00:00 2001 From: Tony Tong Date: Thu, 22 Aug 2019 10:24:51 -0400 Subject: [PATCH 4/5] fix stroke color and non-stroke color in PDFGraphicState --- pdfminer/pdfinterp.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/pdfminer/pdfinterp.py b/pdfminer/pdfinterp.py index a14f64a..de54835 100644 --- a/pdfminer/pdfinterp.py +++ b/pdfminer/pdfinterp.py @@ -598,25 +598,25 @@ class PDFPageInterpreter(object): # setrgb-stroking def do_RG(self, r, g, b): - self.graphicstate.color = (r, g, b) + self.graphicstate.scolor = (r, g, b) #self.do_CS(LITERAL_DEVICE_RGB) return # setrgb-non-stroking def do_rg(self, r, g, b): - self.graphicstate.color = (r, g, b) + self.graphicstate.ncolor = (r, g, b) #self.do_cs(LITERAL_DEVICE_RGB) return # setcmyk-stroking def do_K(self, c, m, y, k): - self.graphicstate.color = (c, m, y, k) + self.graphicstate.scolor = (c, m, y, k) #self.do_CS(LITERAL_DEVICE_CMYK) return # setcmyk-non-stroking def do_k(self, c, m, y, k): - self.graphicstate.color = (c, m, y, k) + self.graphicstate.ncolor = (c, m, y, k) #self.do_cs(LITERAL_DEVICE_CMYK) return From cc310d3d74a47c6c4d0d1c7ef961461dd7ea1f7b Mon Sep 17 00:00:00 2001 From: Tata Ganesh Date: Sat, 12 Oct 2019 21:19:36 +0530 Subject: [PATCH 5/5] Revert "Fix stroke color and non-stroke color in PDFGraphicState" --- pdfminer/pdfinterp.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/pdfminer/pdfinterp.py b/pdfminer/pdfinterp.py index de54835..a14f64a 100644 --- a/pdfminer/pdfinterp.py +++ b/pdfminer/pdfinterp.py @@ -598,25 +598,25 @@ class PDFPageInterpreter(object): # setrgb-stroking def do_RG(self, r, g, b): - self.graphicstate.scolor = (r, g, b) + self.graphicstate.color = (r, g, b) #self.do_CS(LITERAL_DEVICE_RGB) return # setrgb-non-stroking def do_rg(self, r, g, b): - self.graphicstate.ncolor = (r, g, b) + self.graphicstate.color = (r, g, b) #self.do_cs(LITERAL_DEVICE_RGB) return # 
setcmyk-stroking def do_K(self, c, m, y, k): - self.graphicstate.scolor = (c, m, y, k) + self.graphicstate.color = (c, m, y, k) #self.do_CS(LITERAL_DEVICE_CMYK) return # setcmyk-non-stroking def do_k(self, c, m, y, k): - self.graphicstate.ncolor = (c, m, y, k) + self.graphicstate.color = (c, m, y, k) #self.do_cs(LITERAL_DEVICE_CMYK) return