git: 2a685ab209b7 - main - databases/py-fastparquet: Add py-fastparquet 2023.2.0
- Go to: [ bottom of page ] [ top of archives ] [ this month ]
Date: Wed, 05 Apr 2023 17:33:14 UTC
The branch main has been updated by sunpoet: URL: https://cgit.FreeBSD.org/ports/commit/?id=2a685ab209b7b7d03f1d03f6bd2d33676f8efd36 commit 2a685ab209b7b7d03f1d03f6bd2d33676f8efd36 Author: Po-Chuan Hsieh <sunpoet@FreeBSD.org> AuthorDate: 2023-04-05 17:07:22 +0000 Commit: Po-Chuan Hsieh <sunpoet@FreeBSD.org> CommitDate: 2023-04-05 17:29:38 +0000 databases/py-fastparquet: Add py-fastparquet 2023.2.0 fastparquet is a python implementation of the parquet format, aiming to integrate into python-based big data work-flows. It is used implicitly by the projects Dask, Pandas and intake-parquet. We offer a high degree of support for the features of the parquet format, and very competitive performance, in a small install size and codebase. --- databases/Makefile | 1 + databases/py-fastparquet/Makefile | 30 +++++++++++++++++++++++++++ databases/py-fastparquet/distinfo | 3 +++ databases/py-fastparquet/files/patch-setup.py | 20 ++++++++++++++++++ databases/py-fastparquet/pkg-descr | 6 ++++++ 5 files changed, 60 insertions(+) diff --git a/databases/Makefile b/databases/Makefile index 32b05e235f23..9edea03dced9 100644 --- a/databases/Makefile +++ b/databases/Makefile @@ -747,6 +747,7 @@ SUBDIR += py-duckdb SUBDIR += py-fakeredis SUBDIR += py-fastapi-users-db-ormar + SUBDIR += py-fastparquet SUBDIR += py-fdb SUBDIR += py-firebirdsql SUBDIR += py-flask-sqlalchemy diff --git a/databases/py-fastparquet/Makefile b/databases/py-fastparquet/Makefile new file mode 100644 index 000000000000..6fd05dd8cbe2 --- /dev/null +++ b/databases/py-fastparquet/Makefile @@ -0,0 +1,30 @@ +PORTNAME= fastparquet +PORTVERSION= 2023.2.0 +CATEGORIES= databases python +MASTER_SITES= PYPI +PKGNAMEPREFIX= ${PYTHON_PKGNAMEPREFIX} + +MAINTAINER= sunpoet@FreeBSD.org +COMMENT= Python support for Parquet file format +WWW= https://github.com/dask/fastparquet + +LICENSE= APACHE20 +LICENSE_FILE= ${WRKSRC}/LICENSE + +BUILD_DEPENDS= ${PYTHON_PKGNAMEPREFIX}numpy>=0,1:math/py-numpy@${PY_FLAVOR} \ + 
${PYTHON_PKGNAMEPREFIX}setuptools_scm>=1.5.4:devel/py-setuptools_scm@${PY_FLAVOR} \ + ${PYTHON_PKGNAMEPREFIX}wheel>=0:devel/py-wheel@${PY_FLAVOR} \ + thrift:devel/thrift +RUN_DEPENDS= ${PYTHON_PKGNAMEPREFIX}cramjam>=2.3:archivers/py-cramjam@${PY_FLAVOR} \ + ${PYTHON_PKGNAMEPREFIX}fsspec>=0:devel/py-fsspec@${PY_FLAVOR} \ + ${PYTHON_PKGNAMEPREFIX}numpy>=1.20.3,1:math/py-numpy@${PY_FLAVOR} \ + ${PYTHON_PKGNAMEPREFIX}packaging>=0:devel/py-packaging@${PY_FLAVOR} \ + ${PYTHON_PKGNAMEPREFIX}pandas>=1.5.0,1:math/py-pandas@${PY_FLAVOR} + +USES= python:3.8+ +USE_PYTHON= autoplist concurrent cython distutils + +post-install: + ${FIND} ${STAGEDIR}${PYTHON_SITELIBDIR} -name '*.so' -exec ${STRIP_CMD} {} + + +.include <bsd.port.mk> diff --git a/databases/py-fastparquet/distinfo b/databases/py-fastparquet/distinfo new file mode 100644 index 000000000000..1f4e3a5e6f89 --- /dev/null +++ b/databases/py-fastparquet/distinfo @@ -0,0 +1,3 @@ +TIMESTAMP = 1679498488 +SHA256 (fastparquet-2023.2.0.tar.gz) = 7611447ce3ff5696539f7e43289da2491ea41f7cb92d4dbada374012b62c51c3 +SIZE (fastparquet-2023.2.0.tar.gz) = 392472 diff --git a/databases/py-fastparquet/files/patch-setup.py b/databases/py-fastparquet/files/patch-setup.py new file mode 100644 index 000000000000..aa3535977588 --- /dev/null +++ b/databases/py-fastparquet/files/patch-setup.py @@ -0,0 +1,20 @@ +--- setup.py.orig 2022-11-18 01:33:09 UTC ++++ setup.py +@@ -44,7 +44,6 @@ else: + extra = {'ext_modules': cythonize(modules, language_level=3)} + + install_requires = open('requirements.txt').read().strip().split('\n') +-subprocess.call(["git", "status"], stdout=sys.stdout, stderr=sys.stderr) + + setup( + name='fastparquet', +@@ -57,8 +56,7 @@ setup( + 'setuptools>18.0', + 'setuptools-scm>1.5.4', + 'Cython', +- 'pytest-runner', +- 'oldest-supported-numpy' ++ 'numpy' + ], + description='Python support for Parquet file format', + author='Martin Durant', diff --git a/databases/py-fastparquet/pkg-descr b/databases/py-fastparquet/pkg-descr 
new file mode 100644 index 000000000000..d8b5b47d5700 --- /dev/null +++ b/databases/py-fastparquet/pkg-descr @@ -0,0 +1,6 @@ +fastparquet is a python implementation of the parquet format, aiming to integrate +into python-based big data work-flows. It is used implicitly by the projects +Dask, Pandas and intake-parquet. + +We offer a high degree of support for the features of the parquet format, and +very competitive performance, in a small install size and codebase.