New package: py-datasets (#24597)

* [py-datasets] created template

* [py-datasets] added dependencies

* [py-datasets] requires py-pyarrow with +parquet

* [py-datasets] Final cleanup

- added homepage
- added description
- removed fixmes
This commit is contained in:
Jen Herting 2021-06-29 22:28:23 -04:00 committed by GitHub
parent 501f87fb22
commit d00082e70b
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@ -0,0 +1,35 @@
# Copyright 2013-2021 Lawrence Livermore National Security, LLC and other
# Spack Project Developers. See the top-level COPYRIGHT file for details.
#
# SPDX-License-Identifier: (Apache-2.0 OR MIT)
from spack import *
class PyDatasets(PythonPackage):
"""Datasets is a lightweight library providing two main
features: one-line dataloaders for many public datasets and
efficient data pre-processing."""
homepage = "https://github.com/huggingface/datasets"
pypi = "datasets/datasets-1.8.0.tar.gz"
version('1.8.0', sha256='d57c32bb29e453ee7f3eb0bbca3660ab4dd2d0e4648efcfa987432624cab29d3')
depends_on('python@3.6:', type=('build', 'run'))
depends_on('py-setuptools', type='build')
depends_on('py-numpy@1.17:', type=('build', 'run'))
depends_on('py-pyarrow@1.0.0:3.999+parquet', type=('build', 'run'))
depends_on('py-dill', type=('build', 'run'))
depends_on('py-pandas', type=('build', 'run'))
depends_on('py-requests@2.19:', type=('build', 'run'))
depends_on('py-tqdm@4.27:4.49.999', type=('build', 'run'))
depends_on('py-dataclasses', when='^python@:3.6.999', type=('build', 'run'))
depends_on('py-xxhash', type=('build', 'run'))
depends_on('py-multiprocess', type=('build', 'run'))
depends_on('py-importlib-metadata', when='^python@:3.7.999', type=('build', 'run'))
depends_on('py-huggingface-hub@:0.0.999', type=('build', 'run'))
depends_on('py-packaging', type=('build', 'run'))
depends_on('py-fsspec@:0.8.0', when='^python@:3.7.999', type=('build', 'run'))
depends_on('py-fsspec', when='^python@3.8:', type=('build', 'run'))