From cd412308bd81c1a570c4d0334d6dc53f16a7b1b4 Mon Sep 17 00:00:00 2001 From: Yusuke Shinyama Date: Mon, 14 Feb 2011 22:32:55 +0900 Subject: [PATCH] text flow detection bug fix (thanks to fujimoto-san) --- pdfminer/layout.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/pdfminer/layout.py b/pdfminer/layout.py index 08bfc9e..89535c8 100644 --- a/pdfminer/layout.py +++ b/pdfminer/layout.py @@ -402,7 +402,7 @@ class LTTextGroupLRTB(LTTextGroup): def analyze(self, laparams): # reorder the objects from top-left to bottom-right. self._objs = csort(self._objs, key=lambda obj: - (1-laparams.boxes_flow)*(obj.x0+obj.x1) - + (1-laparams.boxes_flow)*(obj.x0) - (1+laparams.boxes_flow)*(obj.y0+obj.y1)) return LTTextGroup.analyze(self, laparams) @@ -412,7 +412,7 @@ class LTTextGroupTBRL(LTTextGroup): # reorder the objects from top-right to bottom-left. self._objs = csort(self._objs, key=lambda obj: -(1+laparams.boxes_flow)*(obj.x0+obj.x1) - -(1-laparams.boxes_flow)*(obj.y0+obj.y1)) + -(1-laparams.boxes_flow)*(obj.y1)) return LTTextGroup.analyze(self, laparams)