summary | refs | log | tree | commit | diff
path: root/sci-libs/datasets/files
diff options
context:
space:
mode:
author V3n3RiX <venerix@koprulu.sector> 2024-02-22 11:40:14 +0000
committer V3n3RiX <venerix@koprulu.sector> 2024-02-22 11:40:14 +0000
commit 8ef9b8c62c1aa79c0bceaf3c0d6fe1e7cdd976d0 (patch)
tree f77288f305460b2e91e979db14bf06b8f882238f /sci-libs/datasets/files
parent e621d36783ba0760925a62dd23c71495436fe753 (diff)
gentoo auto-resync : 22:02:2024 - 11:40:14
Diffstat (limited to 'sci-libs/datasets/files')
-rw-r--r-- sci-libs/datasets/files/datasets-2.14.4-tests.patch 10
-rw-r--r-- sci-libs/datasets/files/datasets-2.17.1-tests.patch (renamed from sci-libs/datasets/files/datasets-2.16.0-tests.patch) 29
2 files changed, 10 insertions, 29 deletions
diff --git a/sci-libs/datasets/files/datasets-2.14.4-tests.patch b/sci-libs/datasets/files/datasets-2.14.4-tests.patch
index 5dd322309b20..b9791c04e8e0 100644
--- a/sci-libs/datasets/files/datasets-2.14.4-tests.patch
+++ b/sci-libs/datasets/files/datasets-2.14.4-tests.patch
@@ -8,16 +8,6 @@
@pytest.mark.filterwarnings("ignore:metric_module_factory is deprecated:FutureWarning")
@pytest.mark.filterwarnings("ignore:load_metric is deprecated:FutureWarning")
def test_load_metric(self, metric_name):
---- a/tests/test_hf_gcp.py 2023-05-04 19:33:31.150825303 +0200
-+++ b/tests/test_hf_gcp.py 2023-05-04 19:40:08.401759538 +0200
-@@ -75,6 +75,7 @@
- self.assertTrue(os.path.exists(datset_info_path))
-
-
-+@pytest.mark.skip(reason="require apache_beam")
- @pytest.mark.integration
- def test_as_dataset_from_hf_gcs(tmp_path_factory):
- tmp_dir = tmp_path_factory.mktemp("test_hf_gcp") / "test_wikipedia_simple"
--- a/tests/test_distributed.py 2023-05-04 19:43:09.861275030 +0200
+++ b/tests/test_distributed.py 2023-05-04 19:44:17.608326722 +0200
@@ -74,6 +74,7 @@
diff --git a/sci-libs/datasets/files/datasets-2.16.0-tests.patch b/sci-libs/datasets/files/datasets-2.17.1-tests.patch
index 8cb89e824b3b..14ae50602d10 100644
--- a/sci-libs/datasets/files/datasets-2.16.0-tests.patch
+++ b/sci-libs/datasets/files/datasets-2.17.1-tests.patch
@@ -1,6 +1,6 @@
--- a/tests/test_arrow_dataset.py 2024-02-20 21:53:24.248470991 +0100
+++ b/tests/test_arrow_dataset.py 2024-02-20 21:53:29.441804737 +0100
-@@ -3982,7 +3982,6 @@
+@@ -4016,7 +4016,6 @@
[
"relative/path",
"/absolute/path",
@@ -10,15 +10,15 @@
],
--- a/tests/test_load.py 2024-02-20 22:12:13.699209107 +0100
+++ b/tests/test_load.py 2024-02-20 22:13:10.862626708 +0100
-@@ -386,6 +386,7 @@
+@@ -388,6 +388,7 @@
hf_modules_cache=self.hf_modules_cache,
)
+ @pytest.mark.skip(reason="")
def test_HubDatasetModuleFactoryWithScript_dont_trust_remote_code(self):
- # "squad" has a dataset script
+ # "lhoestq/test" has a dataset script
factory = HubDatasetModuleFactoryWithScript(
-@@ -402,6 +402,7 @@
+@@ -403,6 +404,7 @@
)
self.assertRaises(ValueError, factory.get_module)
@@ -26,7 +26,7 @@
def test_HubDatasetModuleFactoryWithScript_with_github_dataset(self):
# "wmt_t2t" has additional imports (internal)
factory = HubDatasetModuleFactoryWithScript(
-@@ -411,6 +412,7 @@
+@@ -412,6 +414,7 @@
assert importlib.import_module(module_factory_result.module_path) is not None
assert module_factory_result.builder_kwargs["base_path"].startswith(config.HF_ENDPOINT)
@@ -34,7 +34,7 @@
def test_GithubMetricModuleFactory_with_internal_import(self):
# "squad_v2" requires additional imports (internal)
factory = GithubMetricModuleFactory(
-@@ -419,6 +421,7 @@
+@@ -420,6 +423,7 @@
module_factory_result = factory.get_module()
assert importlib.import_module(module_factory_result.module_path) is not None
@@ -42,7 +42,7 @@
@pytest.mark.filterwarnings("ignore:GithubMetricModuleFactory is deprecated:FutureWarning")
def test_GithubMetricModuleFactory_with_external_import(self):
# "bleu" requires additional imports (external from github)
-@@ -1032,6 +1035,7 @@
+@@ -1033,6 +1037,7 @@
datasets.load_dataset_builder(SAMPLE_DATASET_TWO_CONFIG_IN_METADATA, "non-existing-config")
@@ -50,7 +50,7 @@
@pytest.mark.parametrize("serializer", [pickle, dill])
def test_load_dataset_builder_with_metadata_configs_pickable(serializer):
builder = datasets.load_dataset_builder(SAMPLE_DATASET_SINGLE_CONFIG_IN_METADATA)
-@@ -1153,6 +1157,7 @@
+@@ -1154,6 +1159,7 @@
assert len(builder.config.data_files["test"]) > 0
@@ -58,7 +58,7 @@
def test_load_dataset_builder_fail():
with pytest.raises(DatasetNotFoundError):
datasets.load_dataset_builder("blabla")
-@@ -1168,6 +1173,7 @@
+@@ -1169,6 +1175,7 @@
assert isinstance(next(iter(dataset["train"])), dict)
@@ -68,7 +68,7 @@
assert isinstance(dataset, DatasetDict)
--- a/tests/test_hf_gcp.py 2024-02-21 09:59:26.918397895 +0100
+++ b/tests/test_hf_gcp.py 2024-02-21 09:59:46.335100597 +0100
-@@ -47,6 +47,7 @@
+@@ -45,6 +45,7 @@
]
@@ -78,15 +78,6 @@
dataset = None
--- a/tests/test_inspect.py 2024-02-21 10:03:32.315520016 +0100
+++ b/tests/test_inspect.py 2024-02-21 10:03:50.345553490 +0100
-@@ -18,7 +18,7 @@
- pytestmark = pytest.mark.integration
-
-
--@pytest.mark.parametrize("path", ["paws", csv.__file__])
-+@pytest.mark.parametrize("path", [csv.__file__])
- def test_inspect_dataset(path, tmp_path):
- inspect_dataset(path, tmp_path)
- script_name = Path(path).stem + ".py"
@@ -49,6 +49,7 @@
assert list(info.splits.keys()) == expected_splits