fix pychecker warning
git-svn-id: https://pdfminerr.googlecode.com/svn/trunk/pdfminer@104 1aa58f4a-7d42-0410-adbc-911cccaed67c
pull/1/head
parent
3e12268bf6
commit
759e21e606
51
Makefile
51
Makefile
|
@ -1,12 +1,12 @@
|
||||||
# Makefile for pdfminer
|
# Makefile for pdfminer
|
||||||
|
|
||||||
PACKAGE=pdfminer
|
PACKAGE=pdfminer
|
||||||
VERSION=20090330
|
|
||||||
GNUTAR=tar
|
|
||||||
SVN=svn
|
|
||||||
PYTHON=python
|
|
||||||
|
|
||||||
WORKDIR=/tmp
|
SVN=svn
|
||||||
|
GNUTAR=tar
|
||||||
|
PYTHON=python
|
||||||
|
TMPDIR=/tmp
|
||||||
|
VERSION=`$(PYTHON) $(PACKAGE)/__init__.py`
|
||||||
DISTNAME=$(PACKAGE)-dist-$(VERSION)
|
DISTNAME=$(PACKAGE)-dist-$(VERSION)
|
||||||
DISTFILE=$(DISTNAME).tar.gz
|
DISTFILE=$(DISTNAME).tar.gz
|
||||||
|
|
||||||
|
@ -14,34 +14,33 @@ CONV_CMAP=$(PYTHON) -m tools.conv_cmap
|
||||||
|
|
||||||
all:
|
all:
|
||||||
|
|
||||||
|
clean:
|
||||||
|
-rm -rf build
|
||||||
|
-cd $(PACKAGE) && make clean
|
||||||
|
-cd tools && make clean
|
||||||
|
-cd samples && make clean
|
||||||
|
|
||||||
|
test:
|
||||||
|
cd samples && make test
|
||||||
|
|
||||||
cdbcmap: CMap
|
cdbcmap: CMap
|
||||||
-mkdir CDBCMap
|
-mkdir CDBCMap
|
||||||
$(CONV_CMAP) CMap/*
|
$(CONV_CMAP) CMap/*
|
||||||
|
|
||||||
test:
|
|
||||||
cd samples && make
|
|
||||||
|
|
||||||
clean:
|
|
||||||
-cd pdflib && make clean
|
|
||||||
-cd tools && make clean
|
|
||||||
-cd samples && make clean
|
|
||||||
-rm -rf build
|
|
||||||
|
|
||||||
# Maintainance:
|
# Maintainance:
|
||||||
|
|
||||||
pack: clean
|
|
||||||
$(SVN) cleanup
|
|
||||||
$(SVN) export . $(WORKDIR)/$(DISTNAME)
|
|
||||||
$(GNUTAR) c -z -C$(WORKDIR) -f $(WORKDIR)/$(DISTFILE) $(DISTNAME) --dereference --numeric-owner
|
|
||||||
-rm -rf $(WORKDIR)/$(DISTNAME)
|
|
||||||
|
|
||||||
check:
|
|
||||||
-pychecker --limit=0 *.py
|
|
||||||
|
|
||||||
commit: clean
|
commit: clean
|
||||||
$(SVN) commit
|
$(SVN) commit
|
||||||
|
|
||||||
|
check:
|
||||||
|
cd $(PACKAGE) && make check
|
||||||
|
|
||||||
|
dist: clean
|
||||||
|
$(SVN) cleanup
|
||||||
|
$(SVN) export . $(TMPDIR)/$(DISTNAME)
|
||||||
|
$(GNUTAR) c -z -C$(TMPDIR) -f $(TMPDIR)/$(DISTFILE) $(DISTNAME) --dereference --numeric-owner
|
||||||
|
-rm -rf $(TMPDIR)/$(DISTNAME)
|
||||||
|
|
||||||
WEBDIR=$$HOME/Site/unixuser.org/python/pdfminer
|
WEBDIR=$$HOME/Site/unixuser.org/python/pdfminer
|
||||||
publish: pack
|
publish: dist
|
||||||
cp $(WORKDIR)/$(DISTFILE) $(WEBDIR)
|
cp $(TMPDIR)/$(DISTFILE) $(WEBDIR)
|
||||||
cp README.html $(WEBDIR)/index.html
|
cp README.html $(WEBDIR)/index.html
|
||||||
|
|
|
@ -1,32 +1,11 @@
|
||||||
# Makefile for pdfminer
|
# Makefile for pdfminer
|
||||||
|
|
||||||
DESTDIR=/usr/local/src/pdflib
|
PYCHECKER=pychecker --limit=0
|
||||||
|
|
||||||
PDFLIB = ${DESTDIR}/__init__.py \
|
all:
|
||||||
${DESTDIR}/arcfour.py \
|
|
||||||
${DESTDIR}/ascii85.py \
|
|
||||||
${DESTDIR}/cmap.py \
|
|
||||||
${DESTDIR}/fontmetrics.py \
|
|
||||||
${DESTDIR}/glyphlist.py \
|
|
||||||
${DESTDIR}/latin_enc.py \
|
|
||||||
${DESTDIR}/lzw.py \
|
|
||||||
${DESTDIR}/pdf2txt.py \
|
|
||||||
${DESTDIR}/pdfcolor.py \
|
|
||||||
${DESTDIR}/pdfdevice.py \
|
|
||||||
${DESTDIR}/pdffont.py \
|
|
||||||
${DESTDIR}/pdfinterp.py \
|
|
||||||
${DESTDIR}/pdfparser.py \
|
|
||||||
${DESTDIR}/pdftypes.py \
|
|
||||||
${DESTDIR}/psparser.py \
|
|
||||||
${DESTDIR}/pycdb.py \
|
|
||||||
${DESTDIR}/rijndael.py \
|
|
||||||
${DESTDIR}/utils.py \
|
|
||||||
|
|
||||||
${DESTDIR}/%: %
|
|
||||||
cp $? $@
|
|
||||||
chmod 755 $@
|
|
||||||
|
|
||||||
all: ${PDFLIB}
|
|
||||||
|
|
||||||
clean:
|
clean:
|
||||||
-rm *.pyc *.pyo
|
-rm *.pyc *.pyo
|
||||||
|
|
||||||
|
check:
|
||||||
|
$(PYCHECKER) *.py
|
||||||
|
|
|
@ -0,0 +1,4 @@
|
||||||
|
#!/usr/bin/env python
|
||||||
|
__version__ = '20090330'
|
||||||
|
|
||||||
|
if __name__ == '__main__': print __version__
|
|
@ -45,7 +45,7 @@ class PDFPageAggregator(PDFDevice):
|
||||||
|
|
||||||
def handle_undefined_char(self, cidcoding, cid):
|
def handle_undefined_char(self, cidcoding, cid):
|
||||||
if self.debug:
|
if self.debug:
|
||||||
print >>stderr, 'undefined: %r, %r' % (cidcoding, cid)
|
print >>sys.stderr, 'undefined: %r, %r' % (cidcoding, cid)
|
||||||
return self.undefined_char
|
return self.undefined_char
|
||||||
|
|
||||||
def paint_path(self, gstate, stroke, fill, evenodd, path):
|
def paint_path(self, gstate, stroke, fill, evenodd, path):
|
||||||
|
@ -149,7 +149,7 @@ class TagExtractor(PDFDevice):
|
||||||
text += char
|
text += char
|
||||||
except PDFUnicodeNotDefined:
|
except PDFUnicodeNotDefined:
|
||||||
pass
|
pass
|
||||||
self.write(text)
|
self.outfp.write(enc(text, self.codec))
|
||||||
return
|
return
|
||||||
|
|
||||||
def begin_page(self, page):
|
def begin_page(self, page):
|
||||||
|
@ -306,18 +306,17 @@ class TextConverter(PDFConverter):
|
||||||
def end_page(self, page):
|
def end_page(self, page):
|
||||||
def render(item):
|
def render(item):
|
||||||
if isinstance(item, LTText):
|
if isinstance(item, LTText):
|
||||||
self.outfp.write(obj.text.encode(self.codec, 'replace'))
|
self.write(item.text+'\n')
|
||||||
self.outfp.write('\n')
|
|
||||||
elif isinstance(item, LTTextBox):
|
elif isinstance(item, LTTextBox):
|
||||||
for line in item.get_lines(self.word_margin):
|
for line in item.get_lines(self.word_margin):
|
||||||
self.outfp.write(line.encode(self.codec, 'replace')+'\n')
|
self.write(line+'\n')
|
||||||
self.outfp.write('\n')
|
self.write('\n')
|
||||||
elif isinstance(item, LayoutContainer):
|
elif isinstance(item, LayoutContainer):
|
||||||
for child in item:
|
for child in item:
|
||||||
render(child)
|
render(child)
|
||||||
page = PDFConverter.end_page(self, page)
|
page = PDFConverter.end_page(self, page)
|
||||||
if self.showpageno:
|
if self.showpageno:
|
||||||
self.outfp.write('Page %d\n' % page.id)
|
self.write('Page %d\n' % page.id)
|
||||||
render(page)
|
render(page)
|
||||||
self.outfp.write('\f')
|
self.write('\f')
|
||||||
return
|
return
|
||||||
|
|
|
@ -362,7 +362,7 @@ class LTFigure(LayoutContainer):
|
||||||
return
|
return
|
||||||
|
|
||||||
def __repr__(self):
|
def __repr__(self):
|
||||||
return ('<figure id=%r bbox=%s ctm=%r>' % (self.id, self.get_bbox(), self.ctm))
|
return ('<figure id=%r bbox=%s matrix=%r>' % (self.id, self.get_bbox(), self.matrix))
|
||||||
|
|
||||||
|
|
||||||
## LTTextBox
|
## LTTextBox
|
||||||
|
|
|
@ -86,12 +86,12 @@ class LZWDecoder(object):
|
||||||
|
|
||||||
def main(argv):
|
def main(argv):
|
||||||
import StringIO
|
import StringIO
|
||||||
input = '\x80\x0b\x60\x50\x22\x0c\x0c\x85\x01'
|
data = '\x80\x0b\x60\x50\x22\x0c\x0c\x85\x01'
|
||||||
fp = StringIO.StringIO(input)
|
fp = StringIO.StringIO(data)
|
||||||
expected = '\x2d\x2d\x2d\x2d\x2d\x41\x2d\x2d\x2d\x42'
|
expected = '\x2d\x2d\x2d\x2d\x2d\x41\x2d\x2d\x2d\x42'
|
||||||
LZWDecoder.debug = 1
|
LZWDecoder.debug = 1
|
||||||
output = ''.join(LZWDecoder(fp).run())
|
output = ''.join(LZWDecoder(fp).run())
|
||||||
print (input, expected, output)
|
print (data, expected, output)
|
||||||
print output == expected
|
print output == expected
|
||||||
return 0
|
return 0
|
||||||
|
|
||||||
|
|
|
@ -243,7 +243,7 @@ class TrueTypeFont(object):
|
||||||
self.tables = {}
|
self.tables = {}
|
||||||
fonttype = fp.read(4)
|
fonttype = fp.read(4)
|
||||||
(ntables, _1, _2, _3) = unpack('>HHHH', fp.read(8))
|
(ntables, _1, _2, _3) = unpack('>HHHH', fp.read(8))
|
||||||
for i in xrange(ntables):
|
for _ in xrange(ntables):
|
||||||
(name, tsum, offset, length) = unpack('>4sLLL', fp.read(16))
|
(name, tsum, offset, length) = unpack('>4sLLL', fp.read(16))
|
||||||
self.tables[name] = (offset, length)
|
self.tables[name] = (offset, length)
|
||||||
return
|
return
|
||||||
|
|
|
@ -152,7 +152,7 @@ class PDFResourceManager(object):
|
||||||
else:
|
else:
|
||||||
if STRICT:
|
if STRICT:
|
||||||
raise PDFFontError('Invalid Font spec: %r' % spec)
|
raise PDFFontError('Invalid Font spec: %r' % spec)
|
||||||
font = PDFType1Font(spec) # this is so wrong!
|
font = PDFType1Font(self, spec) # this is so wrong!
|
||||||
if objid:
|
if objid:
|
||||||
self.fonts[objid] = font
|
self.fonts[objid] = font
|
||||||
return font
|
return font
|
||||||
|
|
|
@ -55,7 +55,6 @@ class XRefObjRange(object):
|
||||||
class PDFBaseXRef(object):
|
class PDFBaseXRef(object):
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
self.objid_ranges = None
|
self.objid_ranges = None
|
||||||
self.objid_list = None
|
|
||||||
return
|
return
|
||||||
|
|
||||||
def objids(self):
|
def objids(self):
|
||||||
|
@ -63,11 +62,9 @@ class PDFBaseXRef(object):
|
||||||
for objid_range in self.objid_ranges:
|
for objid_range in self.objid_ranges:
|
||||||
for objid in xrange(objid_range.get_start_id(), objid_range.get_end_id() + 1):
|
for objid in xrange(objid_range.get_start_id(), objid_range.get_end_id() + 1):
|
||||||
yield objid
|
yield objid
|
||||||
else:
|
|
||||||
for objid in self.offsets:
|
|
||||||
yield objid
|
|
||||||
return
|
return
|
||||||
|
|
||||||
|
|
||||||
## PDFXRef
|
## PDFXRef
|
||||||
##
|
##
|
||||||
class PDFXRef(PDFBaseXRef):
|
class PDFXRef(PDFBaseXRef):
|
||||||
|
@ -154,7 +151,7 @@ class PDFXRefStream(PDFBaseXRef):
|
||||||
return
|
return
|
||||||
|
|
||||||
def __repr__(self):
|
def __repr__(self):
|
||||||
return '<PDFXRef: objid=%d-%d>' % (self.objid_first, self.objid_last)
|
return '<PDFXRefStream: fields=%d,%d,%d>' % (self.fl1, self.fl2, self.fl3)
|
||||||
|
|
||||||
def load(self, parser, debug=0):
|
def load(self, parser, debug=0):
|
||||||
(_,objid) = parser.nexttoken() # ignored
|
(_,objid) = parser.nexttoken() # ignored
|
||||||
|
|
|
@ -16,11 +16,13 @@ HTMLS= \
|
||||||
naacl06-shinyama.html \
|
naacl06-shinyama.html \
|
||||||
nlp2004slides.html
|
nlp2004slides.html
|
||||||
|
|
||||||
all: $(HTMLS)
|
all:
|
||||||
|
|
||||||
clean:
|
clean:
|
||||||
-rm $(HTMLS)
|
-rm $(HTMLS)
|
||||||
|
|
||||||
|
test: $(HTMLS)
|
||||||
|
|
||||||
.SUFFIXES: .pdf .html .sgml .txt
|
.SUFFIXES: .pdf .html .sgml .txt
|
||||||
.pdf.html:
|
.pdf.html:
|
||||||
$(PDF2TXT) -t html -o $@ $<
|
$(PDF2TXT) -t html -o $@ $<
|
||||||
|
|
Loading…
Reference in New Issue