pdfminer.six/tests/test_tools_pdf2txt.py

50 lines
1.1 KiB
Python

#!/usr/bin/env python
# -*- coding: utf-8 -*-
import nose, logging, os
import tools.pdf2txt as pdf2txt
# Absolute directory of this test module, always ending in '/', so that
# relative sample locations can be appended by plain string concatenation.
path = '%s/' % os.path.dirname(os.path.abspath(__file__))
def run(datapath, filename, options=None):
    """Convert one sample PDF to text by calling ``pdf2txt.main`` in-process.

    The input file is ``path + datapath + filename + '.pdf'``; the output is
    written to ``path + filename + '.txt'``, i.e. next to this test module.

    :param datapath: location of the sample relative to ``path``, including
        the trailing slash (e.g. ``'../samples/'``).
    :param filename: base name of the sample, without the ``.pdf`` extension.
    :param options: optional string of extra pdf2txt command-line options,
        separated by whitespace; inserted between ``-o`` and the input file.
    """
    infile = path + datapath + filename + '.pdf'
    outfile = path + filename + '.txt'
    # Build the argument list directly rather than formatting a command line
    # and splitting it on ' ': the split tore paths containing spaces into
    # several arguments and turned doubled spaces into empty arguments.
    args = ['-o' + outfile]
    if options:
        args.extend(options.split())
    args.append(infile)
    pdf2txt.main(args)
class TestDumpPDF():
    """Smoke tests that convert the sample PDFs to text through ``run``.

    NOTE: despite the class name, every test here exercises pdf2txt.
    The tests make no assertions on the produced text; each one passes as
    long as the conversion does not raise.
    """

    def test_1(self):
        """Convert the free samples."""
        for name in ('jo', 'simple1', 'simple2', 'simple3'):
            run('../samples/', name)

    def test_2(self):
        """Convert the nonfree 'dmca' sample."""
        run('../samples/nonfree/', 'dmca')

    def test_3(self):
        """Skipped: converting nonfree 'f1040nr' takes too much time."""
        # The exception has to be raised; merely instantiating it and
        # returning made the runner report this test as passed.
        raise nose.SkipTest('nonfree/f1040nr takes too much time')

    def test_4(self):
        """Skipped: converting nonfree 'i1040nr' takes too much time."""
        # Raised, not just constructed, so the runner records a skip.
        raise nose.SkipTest('nonfree/i1040nr takes too much time')

    def test_5(self):
        """Convert the nonfree 'kampo' sample."""
        run('../samples/nonfree/', 'kampo')

    def test_6(self):
        """Convert the nonfree 'naacl06-shinyama' sample."""
        run('../samples/nonfree/', 'naacl06-shinyama')
# When executed directly as a script, let nose collect and run this module.
if __name__ == "__main__":
    nose.runmodule()