fix pychecker warning

git-svn-id: https://pdfminerr.googlecode.com/svn/trunk/pdfminer@104 1aa58f4a-7d42-0410-adbc-911cccaed67c
pull/1/head
yusuke.shinyama.dummy 2009-05-16 06:38:44 +00:00
parent 3e12268bf6
commit 759e21e606
10 changed files with 52 additions and 72 deletions

View File

@ -1,12 +1,12 @@
# Makefile for pdfminer # Makefile for pdfminer
PACKAGE=pdfminer PACKAGE=pdfminer
VERSION=20090330
GNUTAR=tar
SVN=svn
PYTHON=python
WORKDIR=/tmp SVN=svn
GNUTAR=tar
PYTHON=python
TMPDIR=/tmp
VERSION=`$(PYTHON) $(PACKAGE)/__init__.py`
DISTNAME=$(PACKAGE)-dist-$(VERSION) DISTNAME=$(PACKAGE)-dist-$(VERSION)
DISTFILE=$(DISTNAME).tar.gz DISTFILE=$(DISTNAME).tar.gz
@ -14,34 +14,33 @@ CONV_CMAP=$(PYTHON) -m tools.conv_cmap
all: all:
clean:
-rm -rf build
-cd $(PACKAGE) && make clean
-cd tools && make clean
-cd samples && make clean
test:
cd samples && make test
cdbcmap: CMap cdbcmap: CMap
-mkdir CDBCMap -mkdir CDBCMap
$(CONV_CMAP) CMap/* $(CONV_CMAP) CMap/*
test:
cd samples && make
clean:
-cd pdflib && make clean
-cd tools && make clean
-cd samples && make clean
-rm -rf build
# Maintainance: # Maintainance:
pack: clean
$(SVN) cleanup
$(SVN) export . $(WORKDIR)/$(DISTNAME)
$(GNUTAR) c -z -C$(WORKDIR) -f $(WORKDIR)/$(DISTFILE) $(DISTNAME) --dereference --numeric-owner
-rm -rf $(WORKDIR)/$(DISTNAME)
check:
-pychecker --limit=0 *.py
commit: clean commit: clean
$(SVN) commit $(SVN) commit
check:
cd $(PACKAGE) && make check
dist: clean
$(SVN) cleanup
$(SVN) export . $(TMPDIR)/$(DISTNAME)
$(GNUTAR) c -z -C$(TMPDIR) -f $(TMPDIR)/$(DISTFILE) $(DISTNAME) --dereference --numeric-owner
-rm -rf $(TMPDIR)/$(DISTNAME)
WEBDIR=$$HOME/Site/unixuser.org/python/pdfminer WEBDIR=$$HOME/Site/unixuser.org/python/pdfminer
publish: pack publish: dist
cp $(WORKDIR)/$(DISTFILE) $(WEBDIR) cp $(TMPDIR)/$(DISTFILE) $(WEBDIR)
cp README.html $(WEBDIR)/index.html cp README.html $(WEBDIR)/index.html

View File

@ -1,32 +1,11 @@
# Makefile for pdfminer # Makefile for pdfminer
DESTDIR=/usr/local/src/pdflib PYCHECKER=pychecker --limit=0
PDFLIB = ${DESTDIR}/__init__.py \ all:
${DESTDIR}/arcfour.py \
${DESTDIR}/ascii85.py \
${DESTDIR}/cmap.py \
${DESTDIR}/fontmetrics.py \
${DESTDIR}/glyphlist.py \
${DESTDIR}/latin_enc.py \
${DESTDIR}/lzw.py \
${DESTDIR}/pdf2txt.py \
${DESTDIR}/pdfcolor.py \
${DESTDIR}/pdfdevice.py \
${DESTDIR}/pdffont.py \
${DESTDIR}/pdfinterp.py \
${DESTDIR}/pdfparser.py \
${DESTDIR}/pdftypes.py \
${DESTDIR}/psparser.py \
${DESTDIR}/pycdb.py \
${DESTDIR}/rijndael.py \
${DESTDIR}/utils.py \
${DESTDIR}/%: %
cp $? $@
chmod 755 $@
all: ${PDFLIB}
clean: clean:
-rm *.pyc *.pyo -rm *.pyc *.pyo
check:
$(PYCHECKER) *.py

View File

@ -0,0 +1,4 @@
#!/usr/bin/env python
__version__ = '20090330'
if __name__ == '__main__': print __version__

View File

@ -45,7 +45,7 @@ class PDFPageAggregator(PDFDevice):
def handle_undefined_char(self, cidcoding, cid): def handle_undefined_char(self, cidcoding, cid):
if self.debug: if self.debug:
print >>stderr, 'undefined: %r, %r' % (cidcoding, cid) print >>sys.stderr, 'undefined: %r, %r' % (cidcoding, cid)
return self.undefined_char return self.undefined_char
def paint_path(self, gstate, stroke, fill, evenodd, path): def paint_path(self, gstate, stroke, fill, evenodd, path):
@ -149,7 +149,7 @@ class TagExtractor(PDFDevice):
text += char text += char
except PDFUnicodeNotDefined: except PDFUnicodeNotDefined:
pass pass
self.write(text) self.outfp.write(enc(text, self.codec))
return return
def begin_page(self, page): def begin_page(self, page):
@ -306,18 +306,17 @@ class TextConverter(PDFConverter):
def end_page(self, page): def end_page(self, page):
def render(item): def render(item):
if isinstance(item, LTText): if isinstance(item, LTText):
self.outfp.write(obj.text.encode(self.codec, 'replace')) self.write(item.text+'\n')
self.outfp.write('\n')
elif isinstance(item, LTTextBox): elif isinstance(item, LTTextBox):
for line in item.get_lines(self.word_margin): for line in item.get_lines(self.word_margin):
self.outfp.write(line.encode(self.codec, 'replace')+'\n') self.write(line+'\n')
self.outfp.write('\n') self.write('\n')
elif isinstance(item, LayoutContainer): elif isinstance(item, LayoutContainer):
for child in item: for child in item:
render(child) render(child)
page = PDFConverter.end_page(self, page) page = PDFConverter.end_page(self, page)
if self.showpageno: if self.showpageno:
self.outfp.write('Page %d\n' % page.id) self.write('Page %d\n' % page.id)
render(page) render(page)
self.outfp.write('\f') self.write('\f')
return return

View File

@ -362,7 +362,7 @@ class LTFigure(LayoutContainer):
return return
def __repr__(self): def __repr__(self):
return ('<figure id=%r bbox=%s ctm=%r>' % (self.id, self.get_bbox(), self.ctm)) return ('<figure id=%r bbox=%s matrix=%r>' % (self.id, self.get_bbox(), self.matrix))
## LTTextBox ## LTTextBox

View File

@ -86,12 +86,12 @@ class LZWDecoder(object):
def main(argv): def main(argv):
import StringIO import StringIO
input = '\x80\x0b\x60\x50\x22\x0c\x0c\x85\x01' data = '\x80\x0b\x60\x50\x22\x0c\x0c\x85\x01'
fp = StringIO.StringIO(input) fp = StringIO.StringIO(data)
expected = '\x2d\x2d\x2d\x2d\x2d\x41\x2d\x2d\x2d\x42' expected = '\x2d\x2d\x2d\x2d\x2d\x41\x2d\x2d\x2d\x42'
LZWDecoder.debug = 1 LZWDecoder.debug = 1
output = ''.join(LZWDecoder(fp).run()) output = ''.join(LZWDecoder(fp).run())
print (input, expected, output) print (data, expected, output)
print output == expected print output == expected
return 0 return 0

View File

@ -243,7 +243,7 @@ class TrueTypeFont(object):
self.tables = {} self.tables = {}
fonttype = fp.read(4) fonttype = fp.read(4)
(ntables, _1, _2, _3) = unpack('>HHHH', fp.read(8)) (ntables, _1, _2, _3) = unpack('>HHHH', fp.read(8))
for i in xrange(ntables): for _ in xrange(ntables):
(name, tsum, offset, length) = unpack('>4sLLL', fp.read(16)) (name, tsum, offset, length) = unpack('>4sLLL', fp.read(16))
self.tables[name] = (offset, length) self.tables[name] = (offset, length)
return return

View File

@ -152,7 +152,7 @@ class PDFResourceManager(object):
else: else:
if STRICT: if STRICT:
raise PDFFontError('Invalid Font spec: %r' % spec) raise PDFFontError('Invalid Font spec: %r' % spec)
font = PDFType1Font(spec) # this is so wrong! font = PDFType1Font(self, spec) # this is so wrong!
if objid: if objid:
self.fonts[objid] = font self.fonts[objid] = font
return font return font

View File

@ -55,7 +55,6 @@ class XRefObjRange(object):
class PDFBaseXRef(object): class PDFBaseXRef(object):
def __init__(self): def __init__(self):
self.objid_ranges = None self.objid_ranges = None
self.objid_list = None
return return
def objids(self): def objids(self):
@ -63,11 +62,9 @@ class PDFBaseXRef(object):
for objid_range in self.objid_ranges: for objid_range in self.objid_ranges:
for objid in xrange(objid_range.get_start_id(), objid_range.get_end_id() + 1): for objid in xrange(objid_range.get_start_id(), objid_range.get_end_id() + 1):
yield objid yield objid
else:
for objid in self.offsets:
yield objid
return return
## PDFXRef ## PDFXRef
## ##
class PDFXRef(PDFBaseXRef): class PDFXRef(PDFBaseXRef):
@ -154,7 +151,7 @@ class PDFXRefStream(PDFBaseXRef):
return return
def __repr__(self): def __repr__(self):
return '<PDFXRef: objid=%d-%d>' % (self.objid_first, self.objid_last) return '<PDFXRefStream: fields=%d,%d,%d>' % (self.fl1, self.fl2, self.fl3)
def load(self, parser, debug=0): def load(self, parser, debug=0):
(_,objid) = parser.nexttoken() # ignored (_,objid) = parser.nexttoken() # ignored

View File

@ -16,11 +16,13 @@ HTMLS= \
naacl06-shinyama.html \ naacl06-shinyama.html \
nlp2004slides.html nlp2004slides.html
all: $(HTMLS) all:
clean: clean:
-rm $(HTMLS) -rm $(HTMLS)
test: $(HTMLS)
.SUFFIXES: .pdf .html .sgml .txt .SUFFIXES: .pdf .html .sgml .txt
.pdf.html: .pdf.html:
$(PDF2TXT) -t html -o $@ $< $(PDF2TXT) -t html -o $@ $<