summaryrefslogtreecommitdiff
path: root/sci-ml/datasets
diff options
context:
space:
mode:
authorV3n3RiX <venerix@koprulu.sector>2025-04-18 08:46:05 +0100
committerV3n3RiX <venerix@koprulu.sector>2025-04-18 08:46:05 +0100
commitcf1a411e806b434c96329401a6ff0901ec7f0d5c (patch)
tree969527fcceb3b686400c73b5ed22c1d587a8eb3e /sci-ml/datasets
parent6a01345ec5dc673d0ebd4653ceb063eafa7fcf65 (diff)
gentoo auto-resync : 18:04:2025 - 08:46:04next
Diffstat (limited to 'sci-ml/datasets')
-rw-r--r--sci-ml/datasets/Manifest4
-rw-r--r--sci-ml/datasets/datasets-3.5.0.ebuild126
-rw-r--r--sci-ml/datasets/metadata.xml4
3 files changed, 133 insertions, 1 deletions
diff --git a/sci-ml/datasets/Manifest b/sci-ml/datasets/Manifest
index fad5caa1423d..fc2b3f3dd928 100644
--- a/sci-ml/datasets/Manifest
+++ b/sci-ml/datasets/Manifest
@@ -5,9 +5,11 @@ DIST datasets-3.1.0.gh.tar.gz 1877057 BLAKE2B 818cbf10282f775cda5956ae37607bb535
DIST datasets-3.2.0.gh.tar.gz 1877261 BLAKE2B 0169ee27e1128f8b64fda0e3a4dd63d5d603874cdbf703cd73f100ad1ea69294c300b93cddaa4f2dd8c795570b76adb34e40475d38730f4733679008fb593d84 SHA512 2e381d6919ea7f2e934e832d6bff30a4b23cfe929c0b4345703ce39c7882daf8a234fe71ca89d1d9bcd75000e35845156f7036f9604504ac584feb1b8d3239b1
DIST datasets-3.3.2.gh.tar.gz 1886396 BLAKE2B bb51d8e929fbadd9d04f7ca6c8894dc06b88940643f02743b10cea3c2dd5b91b720358d2229a2263e236a6b4911d9dc60e8698da4369393a63f2603274a4f599 SHA512 4c6c4a4e748b5018574c0968929d1dac2aee96bc6f964dedf54c63e872808ca4a4958ed59e0240c958f352ca7a8d333de7ac44095e7c9525e2d9e703afbaeabf
DIST datasets-3.4.1.gh.tar.gz 1888651 BLAKE2B 836f0e0bb55cefd5a0616785c87c867292cc46ec609934b4f7688462aa7ec95b248f06018cd99e68a88b4e179e0aa48dd601a2fc74bc1b809c336bd70ae0bd6a SHA512 c3654fec241b5da1fb2c9349ff2d0f309e184e5158a0bd19ca0477f1bfb7570d9268e93d1828e1648132563c04ba62ec4eabead2f29d8ef1a29b593aec1c62b1
+DIST datasets-3.5.0.gh.tar.gz 1906212 BLAKE2B 2c26b907230eb9256a6056878dc80eae3296869f24597298f262d49a5fc0a31dbcd6ebb8dfaca9cf27faece019a4f39ab0dd07db772659d414e1d3f5ecfe2258 SHA512 ca053187b6b80140136991e5b220136cf22f3cd98d073323e0a72d77211248d52986aa49b0e595759ba023b4551a9dc01ab1cac853c855f032acbd9a023ecd5a
EBUILD datasets-3.0.2-r1.ebuild 3862 BLAKE2B 757bd443b59c6636a4a993d1ed8010a0e331bf98d93e0228d2df15f1b31056c1555f9f9bc5790c682d23866ba3f9b5dec154356f6cfacf1e7b6e9a450759e181 SHA512 9c7e9572592716ddc2ad4a84e5df69fc46cba872f17f92de36ba803ae0e1db0bc65568e9bc9327c42b0053ff1f28dc58533eab57a1753f696510e042c713f916
EBUILD datasets-3.1.0.ebuild 3869 BLAKE2B 4646f5dd6fd885f98321956d3875b656fc49b88d69e3235dfb741e95127aa925a2e64316a43acb47fd2f01c4d2391b65980b28cf206843c785f7aba73bfdfecd SHA512 29269df33350b63b0a7e6ccd847a73eb9647a4c292fb8fe22b9960fdc7152dcc002f54b279249155c194c5db1f665ff4bead14a45bd3c8f83278128dc4d602f3
EBUILD datasets-3.2.0.ebuild 3869 BLAKE2B 4646f5dd6fd885f98321956d3875b656fc49b88d69e3235dfb741e95127aa925a2e64316a43acb47fd2f01c4d2391b65980b28cf206843c785f7aba73bfdfecd SHA512 29269df33350b63b0a7e6ccd847a73eb9647a4c292fb8fe22b9960fdc7152dcc002f54b279249155c194c5db1f665ff4bead14a45bd3c8f83278128dc4d602f3
EBUILD datasets-3.3.2.ebuild 3817 BLAKE2B 8a06e33e8dfcb01f16008bfe3ff80be0751c18b39ce14031b1218c926169d7a790f6d990f9470df91e7b1068a5a92eee114e0af68781366de3ab7ea7d10b4546 SHA512 82948eb49d0730998c039795116e8493ce9b2236b74e2df953b39dcd6b79c94fb7d686f13e80d0d46b1d48d0c78a6725b380000f4cd84baedd190351c8d6584f
EBUILD datasets-3.4.1.ebuild 4109 BLAKE2B afa5500f83907c5a657b2f350e960cf2c21866424efb3c3d7cc3f6266836f23d3557549333a83831d7a5115fd72f159fabcfde8c40f0e9bbf9eec1b28cb86e9f SHA512 1dbee5af66807c2590017b5f6fc5d6065f4e74933e70b882de6e63c21bb922a1d3ed4414f02cfad8f27a5a9515add951a518bdcedc2dc73e8fcad98dec66d255
-MISC metadata.xml 379 BLAKE2B 48ebb9e7bfa8b58b0d15b82c4146def465e08cf3212ab4af04129d09c153b67b00d0fa05b94d6af54f643ec3a202f2335d3254b966f49d1394d3c7b9e5da56a5 SHA512 99560decfaa0e438980f372d99257695e9ca9585167d9aba091e0b775c2f8384657ddc017841c8f06f8b568017a54fb9e31da736f3c875da717e154cdce876d1
+EBUILD datasets-3.5.0.ebuild 4237 BLAKE2B eac02108ad27e8bf772b9ba9531908a980df78288d73a35cfebc91ff2c8bace552fc5f3146257fa70766ea9078e1140a737361eea691a78c58521d3a5e79eb2e SHA512 e29c8387ce8bb2823bfd20a426ac5773921a9a25f822f14fee9ab159ecb70540af1d12b8b27755d6c077712a158ebc74e08b09588da196afd0a8b668c92cc630
+MISC metadata.xml 478 BLAKE2B 8f4309c23cc1b048838c0120e6be9e83d7e796eced3488a32d791896d446f8c27b2e53cbdb04f23e5bf778f9d38e112267f1bae87669e39f3349fd4639fe0e8b SHA512 1583735215d169a07f78e74ad60061ccb49c308e02745e4400dd92ded96d2818b315c8578735ef2166f11c6bd5a240d62021bfa3a82bbd9670a7c3ad9743c78b
diff --git a/sci-ml/datasets/datasets-3.5.0.ebuild b/sci-ml/datasets/datasets-3.5.0.ebuild
new file mode 100644
index 000000000000..98f3234c789b
--- /dev/null
+++ b/sci-ml/datasets/datasets-3.5.0.ebuild
@@ -0,0 +1,126 @@
+# Copyright 2023-2025 Gentoo Authors
+# Distributed under the terms of the GNU General Public License v2
+
+EAPI=8
+
+DISTUTILS_USE_PEP517=setuptools
+PYTHON_COMPAT=( python3_{11..13} )
+DISTUTILS_SINGLE_IMPL=1
+inherit distutils-r1
+
+DESCRIPTION="Access and share datasets for Audio, Computer Vision, and NLP tasks"
+HOMEPAGE="https://pypi.org/project/datasets/"
+SRC_URI="https://github.com/huggingface/${PN}/archive/refs/tags/${PV}.tar.gz
+ -> ${P}.gh.tar.gz"
+
+LICENSE="Apache-2.0"
+SLOT="0"
+KEYWORDS="~amd64"
+IUSE="torch vision"
+REQUIRED_USE="test? ( torch vision )"
+
+RDEPEND="
+ sci-ml/huggingface_hub[${PYTHON_SINGLE_USEDEP}]
+ $(python_gen_cond_dep '
+ dev-python/aiohttp[${PYTHON_USEDEP}]
+ dev-python/dill[${PYTHON_USEDEP}]
+ dev-python/filelock[${PYTHON_USEDEP}]
+ dev-python/fsspec[${PYTHON_USEDEP}]
+ dev-python/multiprocess[${PYTHON_USEDEP}]
+ dev-python/numpy[${PYTHON_USEDEP}]
+ dev-python/packaging[${PYTHON_USEDEP}]
+ dev-python/pandas[${PYTHON_USEDEP}]
+ dev-python/pyarrow[${PYTHON_USEDEP},parquet,snappy]
+ dev-python/pyyaml[${PYTHON_USEDEP}]
+ dev-python/requests[${PYTHON_USEDEP}]
+ dev-python/tqdm[${PYTHON_USEDEP}]
+ dev-python/xxhash[${PYTHON_USEDEP}]
+ vision? (
+ dev-python/pillow[${PYTHON_USEDEP}]
+ )
+ ')
+ torch? (
+ sci-ml/caffe2[${PYTHON_SINGLE_USEDEP},numpy]
+ sci-ml/pytorch[${PYTHON_SINGLE_USEDEP}]
+ )
+"
+DEPEND="${RDEPEND}"
+# Test dependencies still missing (not listed in BDEPEND below):
+# joblib
+# joblibspark
+# faiss-cpu
+# jax
+# jaxlib
+# polars
+# pyav
+# pyspark
+# py7zr
+# s3fs
+# tensorflow
+# tiktoken
+# torchdata
+# transformers
+BDEPEND="test? (
+ sci-ml/torchvision[${PYTHON_SINGLE_USEDEP}]
+ $(python_gen_cond_dep '
+ dev-python/absl-py[${PYTHON_USEDEP}]
+ dev-python/decorator[${PYTHON_USEDEP}]
+ dev-python/elasticsearch[${PYTHON_USEDEP}]
+ dev-python/lz4[${PYTHON_USEDEP}]
+ dev-python/moto[${PYTHON_USEDEP}]
+ dev-python/protobuf:=[${PYTHON_USEDEP}]
+ dev-python/pytest-datadir[${PYTHON_USEDEP}]
+ dev-python/pytest-xdist[${PYTHON_USEDEP}]
+ dev-python/soundfile[${PYTHON_USEDEP}]
+ dev-python/sqlalchemy[${PYTHON_USEDEP}]
+ dev-python/zstandard[${PYTHON_USEDEP}]
+ ')
+)"
+
+distutils_enable_tests pytest
+
+src_test() { # test phase: declare pytest exclusions, then run the eclass test phase
+ local EPYTEST_IGNORE=( # test files excluded as a whole; NOTE(review): reasons not recorded here
+ tests/features/test_audio.py
+ tests/packaged_modules/test_audiofolder.py
+ tests/packaged_modules/test_spark.py
+ tests/test_fingerprint.py
+ tests/test_iterable_dataset.py
+ tests/test_inspect.py
+ tests/test_load.py
+ tests/test_upstream_hub.py
+ )
+
+ local EPYTEST_DESELECT=( # individual tests (file::[class::]test IDs) excluded; reasons not recorded here
+ tests/commands/test_test.py::test_test_command
+ tests/features/test_video.py::test_video_feature_encode_example
+ tests/features/test_video.py::test_dataset_with_video_feature
+ tests/features/test_video.py::test_dataset_with_video_map_and_formatted
+ tests/io/test_parquet.py::test_parquet_read_geoparquet
+ tests/packaged_modules/test_cache.py::test_cache_multi_configs
+ tests/packaged_modules/test_cache.py::test_cache_single_config
+ tests/test_arrow_dataset.py::BaseDatasetTest::test_filter_caching_on_disk
+ tests/test_arrow_dataset.py::BaseDatasetTest::test_map_caching_on_disk
+ tests/test_distributed.py::test_torch_distributed_run
+ tests/test_file_utils.py::TestxPath::test_xpath_rglob
+ tests/test_file_utils.py::TestxPath::test_xpath_glob
+ tests/test_file_utils.py::test_xexists_private
+ tests/test_file_utils.py::test_xlistdir_private
+ tests/test_file_utils.py::test_xisdir_private
+ tests/test_file_utils.py::test_xisfile_private
+ tests/test_file_utils.py::test_xgetsize_private
+ tests/test_file_utils.py::test_xglob_private
+ tests/test_file_utils.py::test_xwalk_private
+ tests/test_hub.py::test_convert_to_parquet
+ tests/packaged_modules/test_cache.py::test_cache_capital_letters
+ tests/packaged_modules/test_folder_based_builder.py::test_data_files_with_different_levels_no_metadata
+ tests/packaged_modules/test_folder_based_builder.py::test_data_files_with_one_label_no_metadata
+ tests/test_data_files.py::test_DataFilesList_from_patterns_locally_with_extra_files
+ tests/test_data_files.py::test_DataFilesDict_from_patterns_locally_or_remote_hashing
+ tests/test_file_utils.py::test_xopen_remote
+ tests/test_hub.py::test_delete_from_hub
+ tests/test_offline_util.py::test_offline_with_timeout
+ tests/test_search.py::ElasticSearchIndexTest::test_elasticsearch
+ )
+ distutils-r1_src_test # the local arrays above stay visible to this call via bash dynamic scoping
+}
diff --git a/sci-ml/datasets/metadata.xml b/sci-ml/datasets/metadata.xml
index 94c112402049..f7e5d145210a 100644
--- a/sci-ml/datasets/metadata.xml
+++ b/sci-ml/datasets/metadata.xml
@@ -5,6 +5,10 @@
<email>tupone@gentoo.org</email>
<name>Tupone Alfredo</name>
</maintainer>
+ <use>
+ <flag name="torch">Enable PyTorch support (sci-ml/pytorch, sci-ml/caffe2)</flag>
+ <flag name="vision">Enable computer-vision (image) support via dev-python/pillow</flag>
+ </use>
<upstream>
<remote-id type="github">huggingface/datasets</remote-id>
<remote-id type="pypi">datasets</remote-id>