From 696f060d47b52d30d6bb7e8ff20593d7b2cf5e09 Mon Sep 17 00:00:00 2001 From: Sunpoet Po-Chuan Hsieh Date: Fri, 29 Nov 2013 20:02:05 +0000 Subject: [PATCH] - Add py-pdfminer - While I'm here, update to 20131113 PDFMiner is a tool for extracting information from PDF documents. Unlike other PDF-related tools, it focuses entirely on getting and analyzing text data. PDFMiner allows to obtain the exact location of texts in a page, as well as other information such as fonts or lines. It includes a PDF converter that can transform PDF files into other text formats (such as HTML). It has an extensible PDF parser that can be used for other purposes instead of text analysis. WWW: http://www.unixuser.org/~euske/python/pdfminer/index.html PR: ports/181992 Submitted by: Kozlov Sergey --- textproc/Makefile | 1 + textproc/py-pdfminer/Makefile | 18 ++++++++ textproc/py-pdfminer/distinfo | 2 + textproc/py-pdfminer/pkg-descr | 9 ++++ textproc/py-pdfminer/pkg-plist | 79 ++++++++++++++++++++++++++++++++++ 5 files changed, 109 insertions(+) create mode 100644 textproc/py-pdfminer/Makefile create mode 100644 textproc/py-pdfminer/distinfo create mode 100644 textproc/py-pdfminer/pkg-descr create mode 100644 textproc/py-pdfminer/pkg-plist diff --git a/textproc/Makefile b/textproc/Makefile index 42b5be093776..a7e669bc5d88 100644 --- a/textproc/Makefile +++ b/textproc/Makefile @@ -1175,6 +1175,7 @@ SUBDIR += py-markdown2 SUBDIR += py-openpyxl SUBDIR += py-paragrep + SUBDIR += py-pdfminer SUBDIR += py-pss SUBDIR += py-pyctpp2 SUBDIR += py-pyelasticsearch diff --git a/textproc/py-pdfminer/Makefile b/textproc/py-pdfminer/Makefile new file mode 100644 index 000000000000..f512456bfd4f --- /dev/null +++ b/textproc/py-pdfminer/Makefile @@ -0,0 +1,18 @@ +# Created by: Kozlov Sergey +# $FreeBSD$ + +PORTNAME= pdfminer +PORTVERSION= 20131113 +CATEGORIES= textproc python +MASTER_SITES= CHEESESHOP +PKGNAMEPREFIX= ${PYTHON_PKGNAMEPREFIX} + +MAINTAINER= kozlov.sergey.404@gmail.com +COMMENT= PDF parser and 
analyzer + +LICENSE= MIT + +USE_PYTHON= -2.7 +USE_PYDISTUTILS=yes + +.include <bsd.port.mk> diff --git a/textproc/py-pdfminer/distinfo b/textproc/py-pdfminer/distinfo new file mode 100644 index 000000000000..74045709911c --- /dev/null +++ b/textproc/py-pdfminer/distinfo @@ -0,0 +1,2 @@ +SHA256 (pdfminer-20131113.tar.gz) = 1016246265f9d48645229164ef44483e9b9a1b3e6902783782f9ae4e1024ea19 +SIZE (pdfminer-20131113.tar.gz) = 4080763 diff --git a/textproc/py-pdfminer/pkg-descr b/textproc/py-pdfminer/pkg-descr new file mode 100644 index 000000000000..e34f13a09cb7 --- /dev/null +++ b/textproc/py-pdfminer/pkg-descr @@ -0,0 +1,9 @@ +PDFMiner is a tool for extracting information from PDF documents. Unlike other +PDF-related tools, it focuses entirely on getting and analyzing text data. +PDFMiner allows to obtain the exact location of texts in a page, as well as +other information such as fonts or lines. It includes a PDF converter that can +transform PDF files into other text formats (such as HTML). +It has an extensible PDF parser that can be used for other purposes instead +of text analysis. 
+ +WWW: http://www.unixuser.org/~euske/python/pdfminer/index.html diff --git a/textproc/py-pdfminer/pkg-plist b/textproc/py-pdfminer/pkg-plist new file mode 100644 index 000000000000..3505d1805fb8 --- /dev/null +++ b/textproc/py-pdfminer/pkg-plist @@ -0,0 +1,79 @@ +bin/dumppdf.py +bin/latin2ascii.py +bin/pdf2txt.py +%%PYTHON_SITELIBDIR%%/pdfminer/__init__.py +%%PYTHON_SITELIBDIR%%/pdfminer/__init__.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/__init__.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/arcfour.py +%%PYTHON_SITELIBDIR%%/pdfminer/arcfour.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/arcfour.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/ascii85.py +%%PYTHON_SITELIBDIR%%/pdfminer/ascii85.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/ascii85.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/ccitt.py +%%PYTHON_SITELIBDIR%%/pdfminer/ccitt.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/ccitt.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/cmapdb.py +%%PYTHON_SITELIBDIR%%/pdfminer/cmapdb.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/cmapdb.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/converter.py +%%PYTHON_SITELIBDIR%%/pdfminer/converter.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/converter.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/encodingdb.py +%%PYTHON_SITELIBDIR%%/pdfminer/encodingdb.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/encodingdb.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/fontmetrics.py +%%PYTHON_SITELIBDIR%%/pdfminer/fontmetrics.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/fontmetrics.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/glyphlist.py +%%PYTHON_SITELIBDIR%%/pdfminer/glyphlist.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/glyphlist.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/image.py +%%PYTHON_SITELIBDIR%%/pdfminer/image.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/image.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/latin_enc.py +%%PYTHON_SITELIBDIR%%/pdfminer/latin_enc.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/latin_enc.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/layout.py +%%PYTHON_SITELIBDIR%%/pdfminer/layout.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/layout.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/lzw.py +%%PYTHON_SITELIBDIR%%/pdfminer/lzw.pyc 
+%%PYTHON_SITELIBDIR%%/pdfminer/lzw.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfcolor.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfcolor.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfcolor.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdevice.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdevice.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdevice.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdocument.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdocument.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfdocument.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdffont.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdffont.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdffont.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfinterp.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfinterp.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfinterp.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfpage.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfpage.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfpage.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdfparser.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdfparser.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdfparser.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/pdftypes.py +%%PYTHON_SITELIBDIR%%/pdfminer/pdftypes.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/pdftypes.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/psparser.py +%%PYTHON_SITELIBDIR%%/pdfminer/psparser.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/psparser.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/rijndael.py +%%PYTHON_SITELIBDIR%%/pdfminer/rijndael.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/rijndael.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/runlength.py +%%PYTHON_SITELIBDIR%%/pdfminer/runlength.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/runlength.pyo +%%PYTHON_SITELIBDIR%%/pdfminer/utils.py +%%PYTHON_SITELIBDIR%%/pdfminer/utils.pyc +%%PYTHON_SITELIBDIR%%/pdfminer/utils.pyo +@dirrmtry %%PYTHON_SITELIBDIR%%/pdfminer