source code tidy up
git-svn-id: https://pdfminerr.googlecode.com/svn/trunk/pdfminer@147 1aa58f4a-7d42-0410-adbc-911cccaed67c
pull/1/head
parent
78f7866554
commit
3dd4f1668b
5
Makefile
5
Makefile
|
@ -9,9 +9,6 @@ PYTHON=python
|
||||||
RM=rm -f
|
RM=rm -f
|
||||||
CP=cp -f
|
CP=cp -f
|
||||||
|
|
||||||
VERSION=`$(PYTHON) $(PACKAGE)/__init__.py`
|
|
||||||
DISTFILE=$(PACKAGE)-$(VERSION).tar.gz
|
|
||||||
|
|
||||||
all:
|
all:
|
||||||
|
|
||||||
install:
|
install:
|
||||||
|
@ -39,6 +36,8 @@ sdist: clean
|
||||||
register: clean
|
register: clean
|
||||||
$(PYTHON) setup.py sdist upload register
|
$(PYTHON) setup.py sdist upload register
|
||||||
|
|
||||||
|
VERSION=`$(PYTHON) $(PACKAGE)/__init__.py`
|
||||||
|
DISTFILE=$(PACKAGE)-$(VERSION).tar.gz
|
||||||
WEBDIR=$$HOME/Site/unixuser.org/python/$(PACKAGE)
|
WEBDIR=$$HOME/Site/unixuser.org/python/$(PACKAGE)
|
||||||
publish: sdist
|
publish: sdist
|
||||||
$(CP) dist/$(DISTFILE) $(WEBDIR)
|
$(CP) dist/$(DISTFILE) $(WEBDIR)
|
||||||
|
|
|
@ -1,14 +1,25 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys, re, os, os.path
|
import sys
|
||||||
stderr = sys.stderr
|
import re
|
||||||
from struct import pack, unpack
|
import os
|
||||||
from pdfminer.utils import choplist, nunpack
|
import os.path
|
||||||
from pdfminer.fontmetrics import FONT_METRICS
|
from sys import stderr
|
||||||
from pdfminer.latin_enc import ENCODING
|
from struct import pack
|
||||||
from pdfminer.glyphlist import charname2unicode
|
from struct import unpack
|
||||||
from pdfminer.psparser import PSException, PSSyntaxError, PSTypeError, PSEOF, \
|
from fontmetrics import FONT_METRICS
|
||||||
PSLiteral, PSKeyword, literal_name, keyword_name, \
|
from latin_enc import ENCODING
|
||||||
PSStackParser
|
from glyphlist import charname2unicode
|
||||||
|
from psparser import PSException
|
||||||
|
from psparser import PSSyntaxError
|
||||||
|
from psparser import PSTypeError
|
||||||
|
from psparser import PSEOF
|
||||||
|
from psparser import PSLiteral
|
||||||
|
from psparser import PSKeyword
|
||||||
|
from psparser import literal_name
|
||||||
|
from psparser import keyword_name
|
||||||
|
from psparser import PSStackParser
|
||||||
|
from utils import choplist
|
||||||
|
from utils import nunpack
|
||||||
try:
|
try:
|
||||||
import cdb
|
import cdb
|
||||||
except ImportError:
|
except ImportError:
|
||||||
|
|
|
@ -1,9 +1,20 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys
|
import sys
|
||||||
from pdfminer.pdfdevice import PDFDevice, PDFTextDevice
|
from pdfdevice import PDFDevice
|
||||||
from pdfminer.pdffont import PDFUnicodeNotDefined
|
from pdfdevice import PDFTextDevice
|
||||||
from pdfminer.layout import LayoutContainer, LTPage, LTText, LTLine, LTRect, LTFigure, LTTextItem, LTTextBox, LTTextLine
|
from pdffont import PDFUnicodeNotDefined
|
||||||
from pdfminer.utils import apply_matrix_pt, mult_matrix, enc
|
from layout import LayoutContainer
|
||||||
|
from layout import LTPage
|
||||||
|
from layout import LTText
|
||||||
|
from layout import LTLine
|
||||||
|
from layout import LTRect
|
||||||
|
from layout import LTFigure
|
||||||
|
from layout import LTTextItem
|
||||||
|
from layout import LTTextBox
|
||||||
|
from layout import LTTextLine
|
||||||
|
from utils import apply_matrix_pt
|
||||||
|
from utils import mult_matrix
|
||||||
|
from utils import enc
|
||||||
|
|
||||||
|
|
||||||
## TagExtractor
|
## TagExtractor
|
||||||
|
|
|
@ -1,7 +1,9 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys
|
import sys
|
||||||
from pdfminer.utils import apply_matrix_norm, apply_matrix_pt, bsearch
|
from sys import maxint as INF
|
||||||
INF = sys.maxint
|
from utils import apply_matrix_norm
|
||||||
|
from utils import apply_matrix_pt
|
||||||
|
from utils import bsearch
|
||||||
|
|
||||||
|
|
||||||
## LAParams
|
## LAParams
|
||||||
|
|
|
@ -1,6 +1,6 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys
|
import sys
|
||||||
stderr = sys.stderr
|
from sys import stderr
|
||||||
|
|
||||||
|
|
||||||
## LZWDecoder
|
## LZWDecoder
|
||||||
|
|
|
@ -1,6 +1,5 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys
|
from psparser import PSLiteralTable
|
||||||
from pdfminer.psparser import PSLiteralTable
|
|
||||||
|
|
||||||
|
|
||||||
## PDFColorSpace
|
## PDFColorSpace
|
||||||
|
|
|
@ -1,8 +1,8 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
|
||||||
import sys
|
import sys
|
||||||
from pdfminer.utils import mult_matrix, translate_matrix
|
from utils import mult_matrix
|
||||||
from pdfminer.pdffont import PDFUnicodeNotDefined
|
from utils import translate_matrix
|
||||||
|
from pdffont import PDFUnicodeNotDefined
|
||||||
|
|
||||||
|
|
||||||
## PDFDevice
|
## PDFDevice
|
||||||
|
|
|
@ -1,17 +1,33 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys
|
import sys
|
||||||
from struct import pack, unpack
|
from cmap import CMap
|
||||||
|
from cmap import CMapDB
|
||||||
|
from cmap import CMapParser
|
||||||
|
from cmap import FontMetricsDB
|
||||||
|
from cmap import EncodingDB
|
||||||
|
from struct import pack
|
||||||
|
from struct import unpack
|
||||||
|
from psparser import PSLiteralTable
|
||||||
|
from psparser import PSKeywordTable
|
||||||
|
from psparser import PSLiteral
|
||||||
|
from psparser import literal_name
|
||||||
|
from psparser import keyword_name
|
||||||
|
from psparser import STRICT
|
||||||
|
from pdftypes import PDFException
|
||||||
|
from pdftypes import resolve1
|
||||||
|
from pdftypes import int_value
|
||||||
|
from pdftypes import float_value
|
||||||
|
from pdftypes import num_value
|
||||||
|
from pdftypes import str_value
|
||||||
|
from pdftypes import list_value
|
||||||
|
from pdftypes import dict_value
|
||||||
|
from pdftypes import stream_value
|
||||||
|
from utils import apply_matrix_norm
|
||||||
|
from utils import nunpack
|
||||||
try:
|
try:
|
||||||
from cStringIO import StringIO
|
from cStringIO import StringIO
|
||||||
except ImportError:
|
except ImportError:
|
||||||
from StringIO import StringIO
|
from StringIO import StringIO
|
||||||
from pdfminer.psparser import PSLiteralTable, PSKeywordTable, PSLiteral, \
|
|
||||||
literal_name, keyword_name, STRICT
|
|
||||||
from pdfminer.pdftypes import PDFException, \
|
|
||||||
resolve1, int_value, float_value, num_value, \
|
|
||||||
str_value, list_value, dict_value, stream_value
|
|
||||||
from pdfminer.cmap import CMap, CMapDB, CMapParser, FontMetricsDB, EncodingDB
|
|
||||||
from pdfminer.utils import apply_matrix_norm, nunpack
|
|
||||||
|
|
||||||
|
|
||||||
## CFFFont
|
## CFFFont
|
||||||
|
@ -574,4 +590,5 @@ def main(argv):
|
||||||
CFFFont(fp)
|
CFFFont(fp)
|
||||||
fp.close()
|
fp.close()
|
||||||
return
|
return
|
||||||
|
|
||||||
if __name__ == '__main__': sys.exit(main(sys.argv))
|
if __name__ == '__main__': sys.exit(main(sys.argv))
|
||||||
|
|
|
@ -1,23 +1,49 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys, re
|
import re
|
||||||
stderr = sys.stderr
|
from sys import stderr
|
||||||
from struct import pack, unpack
|
from struct import pack, unpack
|
||||||
try:
|
try:
|
||||||
from cStringIO import StringIO
|
from cStringIO import StringIO
|
||||||
except ImportError:
|
except ImportError:
|
||||||
from StringIO import StringIO
|
from StringIO import StringIO
|
||||||
from pdfminer.psparser import PSException, PSTypeError, PSEOF, \
|
from cmap import CMapDB
|
||||||
PSLiteralTable, PSKeywordTable, literal_name, keyword_name, \
|
from psparser import PSException
|
||||||
PSStackParser, PSKeyword, STRICT
|
from psparser import PSTypeError
|
||||||
from pdfminer.pdftypes import PDFException, PDFStream, PDFObjRef, \
|
from psparser import PSEOF
|
||||||
resolve1, int_value, float_value, num_value, \
|
from psparser import PSLiteralTable
|
||||||
str_value, list_value, dict_value, stream_value
|
from psparser import PSKeywordTable
|
||||||
from pdfminer.utils import choplist, mult_matrix, MATRIX_IDENTITY
|
from psparser import literal_name
|
||||||
from pdfminer.pdffont import PDFFontError, PDFType1Font, PDFTrueTypeFont, PDFType3Font, PDFCIDFont
|
from psparser import keyword_name
|
||||||
from pdfminer.pdfparser import PDFDocument, PDFParser, PDFPasswordIncorrect
|
from psparser import PSStackParser
|
||||||
from pdfminer.pdfcolor import PDFColorSpace, PREDEFINED_COLORSPACE, \
|
from psparser import PSKeyword
|
||||||
LITERAL_DEVICE_GRAY, LITERAL_DEVICE_RGB, LITERAL_DEVICE_CMYK
|
from psparser import STRICT
|
||||||
from pdfminer.cmap import CMapDB
|
from pdftypes import PDFException
|
||||||
|
from pdftypes import PDFStream
|
||||||
|
from pdftypes import PDFObjRef
|
||||||
|
from pdftypes import resolve1
|
||||||
|
from pdftypes import int_value
|
||||||
|
from pdftypes import float_value
|
||||||
|
from pdftypes import num_value
|
||||||
|
from pdftypes import str_value
|
||||||
|
from pdftypes import list_value
|
||||||
|
from pdftypes import dict_value
|
||||||
|
from pdftypes import stream_value
|
||||||
|
from pdffont import PDFFontError
|
||||||
|
from pdffont import PDFType1Font
|
||||||
|
from pdffont import PDFTrueTypeFont
|
||||||
|
from pdffont import PDFType3Font
|
||||||
|
from pdffont import PDFCIDFont
|
||||||
|
from pdfparser import PDFDocument
|
||||||
|
from pdfparser import PDFParser
|
||||||
|
from pdfparser import PDFPasswordIncorrect
|
||||||
|
from pdfcolor import PDFColorSpace
|
||||||
|
from pdfcolor import PREDEFINED_COLORSPACE
|
||||||
|
from pdfcolor import LITERAL_DEVICE_GRAY
|
||||||
|
from pdfcolor import LITERAL_DEVICE_RGB
|
||||||
|
from pdfcolor import LITERAL_DEVICE_CMYK
|
||||||
|
from utils import choplist
|
||||||
|
from utils import mult_matrix
|
||||||
|
from utils import MATRIX_IDENTITY
|
||||||
|
|
||||||
|
|
||||||
## Exceptions
|
## Exceptions
|
||||||
|
|
|
@ -1,19 +1,35 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
import sys
|
||||||
# pdfparser.py, Yusuke Shinyama
|
import re
|
||||||
# ver 0.1, Dec 24 2004-
|
import md5
|
||||||
# ver 0.2, Dec 24 2007
|
import struct
|
||||||
|
from sys import stderr
|
||||||
import sys, re
|
from utils import choplist
|
||||||
import md5, struct
|
from utils import nunpack
|
||||||
stderr = sys.stderr
|
from utils import decode_text
|
||||||
from pdfminer.utils import choplist, nunpack, decode_text
|
from arcfour import Arcfour
|
||||||
from pdfminer.arcfour import Arcfour
|
from psparser import PSStackParser
|
||||||
from pdfminer.psparser import PSStackParser, PSSyntaxError, PSEOF, \
|
from psparser import PSSyntaxError
|
||||||
PSLiteralTable, PSKeywordTable, literal_name, keyword_name, STRICT
|
from psparser import PSEOF
|
||||||
from pdfminer.pdftypes import PDFException, PDFTypeError, PDFNotImplementedError, \
|
from psparser import PSLiteralTable
|
||||||
PDFStream, PDFObjRef, resolve1, decipher_all, \
|
from psparser import PSKeywordTable
|
||||||
int_value, float_value, num_value, str_value, list_value, dict_value, stream_value
|
from psparser import literal_name
|
||||||
|
from psparser import keyword_name
|
||||||
|
from psparser import STRICT
|
||||||
|
from pdftypes import PDFException
|
||||||
|
from pdftypes import PDFTypeError
|
||||||
|
from pdftypes import PDFNotImplementedError
|
||||||
|
from pdftypes import PDFStream
|
||||||
|
from pdftypes import PDFObjRef
|
||||||
|
from pdftypes import resolve1
|
||||||
|
from pdftypes import decipher_all
|
||||||
|
from pdftypes import int_value
|
||||||
|
from pdftypes import float_value
|
||||||
|
from pdftypes import num_value
|
||||||
|
from pdftypes import str_value
|
||||||
|
from pdftypes import list_value
|
||||||
|
from pdftypes import dict_value
|
||||||
|
from pdftypes import stream_value
|
||||||
|
|
||||||
|
|
||||||
## Exceptions
|
## Exceptions
|
||||||
|
|
|
@ -1,9 +1,16 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys, zlib
|
import sys
|
||||||
from pdfminer.lzw import LZWDecoder
|
import zlib
|
||||||
from pdfminer.psparser import PSException, PSObject, \
|
from lzw import LZWDecoder
|
||||||
PSLiteral, PSKeyword, PSLiteralTable, PSKeywordTable, \
|
from psparser import PSException
|
||||||
literal_name, keyword_name, STRICT
|
from psparser import PSObject
|
||||||
|
from psparser import PSLiteral
|
||||||
|
from psparser import PSKeyword
|
||||||
|
from psparser import PSLiteralTable
|
||||||
|
from psparser import PSKeywordTable
|
||||||
|
from psparser import literal_name
|
||||||
|
from psparser import keyword_name
|
||||||
|
from psparser import STRICT
|
||||||
|
|
||||||
LITERAL_CRYPT = PSLiteralTable.intern('Crypt')
|
LITERAL_CRYPT = PSLiteralTable.intern('Crypt')
|
||||||
LITERALS_FLATE_DECODE = (PSLiteralTable.intern('FlateDecode'), PSLiteralTable.intern('Fl'))
|
LITERALS_FLATE_DECODE = (PSLiteralTable.intern('FlateDecode'), PSLiteralTable.intern('Fl'))
|
||||||
|
|
|
@ -1,7 +1,8 @@
|
||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
import sys, re
|
import sys
|
||||||
stderr = sys.stderr
|
import re
|
||||||
from pdfminer.utils import choplist
|
from sys import stderr
|
||||||
|
from utils import choplist
|
||||||
|
|
||||||
STRICT = 0
|
STRICT = 0
|
||||||
|
|
||||||
|
|
|
@ -6,8 +6,10 @@
|
||||||
# * public domain *
|
# * public domain *
|
||||||
#
|
#
|
||||||
|
|
||||||
import sys, os
|
import sys
|
||||||
from struct import pack, unpack
|
import os
|
||||||
|
from struct import pack
|
||||||
|
from struct import unpack
|
||||||
from array import array
|
from array import array
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -7,7 +7,8 @@
|
||||||
## http://www.efgh.com/software/rijndael.htm
|
## http://www.efgh.com/software/rijndael.htm
|
||||||
##
|
##
|
||||||
import sys
|
import sys
|
||||||
from struct import pack, unpack
|
from struct import pack
|
||||||
|
from struct import unpack
|
||||||
|
|
||||||
def KEYLENGTH(keybits): return (keybits)/8
|
def KEYLENGTH(keybits): return (keybits)/8
|
||||||
def RKLENGTH(keybits): return (keybits)/8+28
|
def RKLENGTH(keybits): return (keybits)/8+28
|
||||||
|
|
Loading…
Reference in New Issue