git-svn-id: https://pdfminer.googlecode.com/svn/trunk/pdfminer@199 1aa58f4a-7d42-0410-adbc-911cccaed67c

2010-04-04 12:18:57 +00:00 · 2010-04-04 12:18:57 +00:00 · 434720f767
parent 71defb2272
commit 434720f767
2 changed files with 8 additions and 3 deletions
--- a/docs/index.html
+++ b/docs/index.html
@@ -19,7 +19,7 @@ Python PDF parser and analyzer

 <div align=right class=lastmod>
 <!-- hhmts start -->
-Last Modified: Fri Mar 26 11:14:17 UTC 2010
+Last Modified: Sun Mar 28 07:21:28 UTC 2010
 <!-- hhmts end -->
 </div>

@@ -63,6 +63,9 @@ PDF parser that can be used for other purposes instead of text analysis.
 <li> Tagged contents extraction.
 <li> Reconstruct the original layout by grouping text chunks.
 </ul>
+<p>
+On the performance, PDFMiner is about 20 times slower than 
+other C/C++-based software such as XPdf.

 <a name="source"></a>
 <p>
--- a/setup.py
+++ b/setup.py
@@ -7,11 +7,12 @@ setup(
    version=__version__,
    description='PDF parser and analyzer',
    long_description='''PDFMiner is a suite of programs that help
-extracting and analyzing text data of PDF documents.
+extracting and analyzing text data from PDF documents.
 Unlike other PDF-related tools, it allows to obtain
 the exact location of texts in a page, as well as 
 other extra information such as font information or ruled lines.
-It includes a PDF converter that can transform PDF files
+It can also infer its text flow and reconstruct the original layout.
+PDFMiner includes a PDF converter that can transform PDF files
 into other text formats (such as HTML). It has an extensible
 PDF parser that can be used for other purposes instead of text analysis.''',
    license='MIT/X',
@@ -33,5 +34,6 @@ PDF parser that can be used for other purposes instead of text analysis.''',
    'Intended Audience :: Developers',
    'Intended Audience :: Science/Research',
    'License :: OSI Approved :: MIT License',
+    'Topic :: Text Processing',
    ],
    )