diff options
author | V3n3RiX <venerix@koprulu.sector> | 2024-02-22 11:40:14 +0000 |
---|---|---|
committer | V3n3RiX <venerix@koprulu.sector> | 2024-02-22 11:40:14 +0000 |
commit | 8ef9b8c62c1aa79c0bceaf3c0d6fe1e7cdd976d0 (patch) | |
tree | f77288f305460b2e91e979db14bf06b8f882238f /sci-libs/datasets | |
parent | e621d36783ba0760925a62dd23c71495436fe753 (diff) |
gentoo auto-resync : 22:02:2024 - 11:40:14
Diffstat (limited to 'sci-libs/datasets')
-rw-r--r-- | sci-libs/datasets/Manifest | 8 | ||||
-rw-r--r-- | sci-libs/datasets/datasets-2.17.1.ebuild (renamed from sci-libs/datasets/datasets-2.16.0.ebuild) | 8 | ||||
-rw-r--r-- | sci-libs/datasets/files/datasets-2.14.4-tests.patch | 10 | ||||
-rw-r--r-- | sci-libs/datasets/files/datasets-2.17.1-tests.patch (renamed from sci-libs/datasets/files/datasets-2.16.0-tests.patch) | 29 |
4 files changed, 20 insertions, 35 deletions
diff --git a/sci-libs/datasets/Manifest b/sci-libs/datasets/Manifest index 21c1c02b3ecd..32934c5c4a4c 100644 --- a/sci-libs/datasets/Manifest +++ b/sci-libs/datasets/Manifest @@ -1,5 +1,5 @@ -AUX datasets-2.14.4-tests.patch 8616 BLAKE2B 8a65d1315b27658a5f741ebc022c83692252a4833ec4d7b79873799c2bb4bb68534a9e13e7fae1c9a6c051b3615fbb783e6e7885ed93968b31aea6629b4116c4 SHA512 2c6d27c297995466a0aebefa46e86113bdce7d84ea00bb1630549fc379fbb51d66f8f01a8d098d56ec2b26d5200f129460567abdbf6a63d4e2a61372fbfbc6a3 -AUX datasets-2.16.0-tests.patch 5619 BLAKE2B b143a97aa1ce2a4f793370557b18cb948872c856e20129c9d29159a531a1f1a7781957c8eb64420622865d52510376b1d7c757f51d6f0320613200e739212135 SHA512 a865fcb7e0d0437b1dc6cbac905772b5fdec2107f27abe331419111b49ffff237b877568edea354f57165ce7b66df0d3ac2506966259c229495f34722de23e9e -DIST datasets-2.16.0.gh.tar.gz 2163874 BLAKE2B baec91a0e39fac3e07f11e352a286c0940cbc672e7233267e70d1abb64dd31bae18c55213a20fafaeaf2f60268104f294c77c9b73ddc1b289175904288a7c440 SHA512 f2a17ffab192163cfc196cc2bad0adb2ca657b5cf911f74f299b6e29eb4fcfacc377505b1857974a6b55252eedf8775a8706f9e991450c55e5d613020dc03735 -EBUILD datasets-2.16.0.ebuild 2304 BLAKE2B 4af6b595b3344e5df5ddcc46146d637e1091a1b7237e4ab2c3f49299a14c22af32dd180902cac16a3723e3a67613951325d8e47481e0bd5081ce6daa9741286a SHA512 1c7df28fd520eb30bb40f42347cfa106d3f12bbc5c8b9eaf93cfcf956078ab2217b51f50f865949b0bd90e85f569adb59ad06ef350db79038dfa38ccb549b2c2 +AUX datasets-2.14.4-tests.patch 8198 BLAKE2B fbff05d38b138796f48a09cbf2e4499a63840bc24cc24b14e49cc8a7ef87bd6cf2fed24de4f9b45ff6a5581e8af407a734cd29f2172028592437d8bb54a5c6c9 SHA512 b9b87fce4ae2866ff23f038d5df799431600f1d7de5ef46d0c871401d6f47f45390d39c20342074f86eb31087336d80954d3ce288f317bf83c044ff65edece5a +AUX datasets-2.17.1-tests.patch 5335 BLAKE2B 2d006dfd847d8e5424754fd3f1f855a909f407f80a3846e1959f726fff9b1076e46f5e2b4c5257dad51710e94312dba0fce98d79211fe4ffb6c72b01f2c6dd2d SHA512 be8df0b3b15371963d59054314134cbc3e263cdc4ab09eb54509842de000a21c0a0f52b0202656a1ae5cbbba5f77651f7a1e2a3d76a955211c7a8fbee01fca3b +DIST datasets-2.17.1.gh.tar.gz 2168860 BLAKE2B ad7e9be7e60125d53b19b6277b6be6ae6050321e4210293a37737a345a4806d4901e9507fbf7a51c5e00a91912656d68a94e76cf70e070433beccc6e1ad54643 SHA512 43617c3d98cc3ad17fb577d6e917d164c8b6ec24740604ca281adaa2f0e5a6538633721792c9fa6621b7f1980161d8acf62dcdcdacca56e1739a8f28e3c71cdf +EBUILD datasets-2.17.1.ebuild 2456 BLAKE2B 475c5d4dda897f61735a93811e5350e8e20159b2a00e448425fefae396cc8fccca4f8d8debf229e938403c59981f8461cfc78a865fc47e201351e6049830a334 SHA512 61d09cc8b95baf414523a80f8db5b01cfa5517c94e79217684d629ad7ec79f1b1f1d9115405e2734e3dc17d80158182310919bf94f44fb8ddb6e04979361d2eb MISC metadata.xml 379 BLAKE2B 48ebb9e7bfa8b58b0d15b82c4146def465e08cf3212ab4af04129d09c153b67b00d0fa05b94d6af54f643ec3a202f2335d3254b966f49d1394d3c7b9e5da56a5 SHA512 99560decfaa0e438980f372d99257695e9ca9585167d9aba091e0b775c2f8384657ddc017841c8f06f8b568017a54fb9e31da736f3c875da717e154cdce876d1 diff --git a/sci-libs/datasets/datasets-2.16.0.ebuild b/sci-libs/datasets/datasets-2.17.1.ebuild index a34fcaa2f89c..9b6295db1a0e 100644 --- a/sci-libs/datasets/datasets-2.16.0.ebuild +++ b/sci-libs/datasets/datasets-2.17.1.ebuild @@ -27,12 +27,16 @@ RDEPEND=" $(python_gen_cond_dep ' dev-python/absl-py[${PYTHON_USEDEP}] dev-python/aiohttp[${PYTHON_USEDEP}] + dev-python/dill[${PYTHON_USEDEP}] + dev-python/filelock[${PYTHON_USEDEP}] <=dev-python/fsspec-2023.10.0[${PYTHON_USEDEP}] dev-python/multiprocess[${PYTHON_USEDEP}] + dev-python/numpy[${PYTHON_USEDEP}] dev-python/packaging[${PYTHON_USEDEP}] dev-python/pandas[${PYTHON_USEDEP}] dev-python/pyarrow[${PYTHON_USEDEP},parquet,snappy] dev-python/pyyaml[${PYTHON_USEDEP}] + dev-python/requests[${PYTHON_USEDEP}] dev-python/tqdm[${PYTHON_USEDEP}] dev-python/xxhash[${PYTHON_USEDEP}] dev-python/zstandard[${PYTHON_USEDEP}] @@ -46,7 +50,7 @@ BDEPEND="test? ( dev-python/absl-py[${PYTHON_USEDEP}] dev-python/pytest-datadir[${PYTHON_USEDEP}] dev-python/decorator[${PYTHON_USEDEP}] - =dev-python/sqlalchemy-1*[${PYTHON_USEDEP}] + dev-python/sqlalchemy[${PYTHON_USEDEP}] sci-libs/jiwer[${PYTHON_USEDEP}] sci-libs/seqeval[${PYTHON_USEDEP}] ') @@ -79,5 +83,5 @@ src_prepare() { tests/test_streaming_download_manager.py \ tests/commands/test_test.py \ tests/packaged_modules/test_cache.py \ - die + || die } diff --git a/sci-libs/datasets/files/datasets-2.14.4-tests.patch b/sci-libs/datasets/files/datasets-2.14.4-tests.patch index 5dd322309b20..b9791c04e8e0 100644 --- a/sci-libs/datasets/files/datasets-2.14.4-tests.patch +++ b/sci-libs/datasets/files/datasets-2.14.4-tests.patch @@ -8,16 +8,6 @@ @pytest.mark.filterwarnings("ignore:metric_module_factory is deprecated:FutureWarning") @pytest.mark.filterwarnings("ignore:load_metric is deprecated:FutureWarning") def test_load_metric(self, metric_name): ---- a/tests/test_hf_gcp.py 2023-05-04 19:33:31.150825303 +0200 -+++ b/tests/test_hf_gcp.py 2023-05-04 19:40:08.401759538 +0200 -@@ -75,6 +75,7 @@ - self.assertTrue(os.path.exists(datset_info_path)) - - -+@pytest.mark.skip(reason="require apache_beam") - @pytest.mark.integration - def test_as_dataset_from_hf_gcs(tmp_path_factory): - tmp_dir = tmp_path_factory.mktemp("test_hf_gcp") / "test_wikipedia_simple" --- a/tests/test_distributed.py 2023-05-04 19:43:09.861275030 +0200 +++ b/tests/test_distributed.py 2023-05-04 19:44:17.608326722 +0200 @@ -74,6 +74,7 @@ diff --git a/sci-libs/datasets/files/datasets-2.16.0-tests.patch b/sci-libs/datasets/files/datasets-2.17.1-tests.patch index 8cb89e824b3b..14ae50602d10 100644 --- a/sci-libs/datasets/files/datasets-2.16.0-tests.patch +++ b/sci-libs/datasets/files/datasets-2.17.1-tests.patch @@ -1,6 +1,6 @@ --- a/tests/test_arrow_dataset.py 2024-02-20 21:53:24.248470991 +0100 +++ b/tests/test_arrow_dataset.py 2024-02-20 21:53:29.441804737 +0100 -@@ -3982,7 +3982,6 @@ +@@ -4016,7 +4016,6 @@ [ "relative/path", "/absolute/path", @@ -10,15 +10,15 @@ ], --- a/tests/test_load.py 2024-02-20 22:12:13.699209107 +0100 +++ b/tests/test_load.py 2024-02-20 22:13:10.862626708 +0100 -@@ -386,6 +386,7 @@ +@@ -388,6 +388,7 @@ hf_modules_cache=self.hf_modules_cache, ) + @pytest.mark.skip(reason="") def test_HubDatasetModuleFactoryWithScript_dont_trust_remote_code(self): - # "squad" has a dataset script + # "lhoestq/test" has a dataset script factory = HubDatasetModuleFactoryWithScript( -@@ -402,6 +402,7 @@ +@@ -403,6 +404,7 @@ ) self.assertRaises(ValueError, factory.get_module) @@ -26,7 +26,7 @@ def test_HubDatasetModuleFactoryWithScript_with_github_dataset(self): # "wmt_t2t" has additional imports (internal) factory = HubDatasetModuleFactoryWithScript( -@@ -411,6 +412,7 @@ +@@ -412,6 +414,7 @@ assert importlib.import_module(module_factory_result.module_path) is not None assert module_factory_result.builder_kwargs["base_path"].startswith(config.HF_ENDPOINT) @@ -34,7 +34,7 @@ def test_GithubMetricModuleFactory_with_internal_import(self): # "squad_v2" requires additional imports (internal) factory = GithubMetricModuleFactory( -@@ -419,6 +421,7 @@ +@@ -420,6 +423,7 @@ module_factory_result = factory.get_module() assert importlib.import_module(module_factory_result.module_path) is not None @@ -42,7 +42,7 @@ @pytest.mark.filterwarnings("ignore:GithubMetricModuleFactory is deprecated:FutureWarning") def test_GithubMetricModuleFactory_with_external_import(self): # "bleu" requires additional imports (external from github) -@@ -1032,6 +1035,7 @@ +@@ -1033,6 +1037,7 @@ datasets.load_dataset_builder(SAMPLE_DATASET_TWO_CONFIG_IN_METADATA, "non-existing-config") @@ -50,7 +50,7 @@ @pytest.mark.parametrize("serializer", [pickle, dill]) def test_load_dataset_builder_with_metadata_configs_pickable(serializer): builder = datasets.load_dataset_builder(SAMPLE_DATASET_SINGLE_CONFIG_IN_METADATA) -@@ -1153,6 +1157,7 @@ +@@ -1154,6 +1159,7 @@ assert len(builder.config.data_files["test"]) > 0 @@ -58,7 +58,7 @@ def test_load_dataset_builder_fail(): with pytest.raises(DatasetNotFoundError): datasets.load_dataset_builder("blabla") -@@ -1168,6 +1173,7 @@ +@@ -1169,6 +1175,7 @@ assert isinstance(next(iter(dataset["train"])), dict) @@ -68,7 +68,7 @@ assert isinstance(dataset, DatasetDict) --- a/tests/test_hf_gcp.py 2024-02-21 09:59:26.918397895 +0100 +++ b/tests/test_hf_gcp.py 2024-02-21 09:59:46.335100597 +0100 -@@ -47,6 +47,7 @@ +@@ -45,6 +45,7 @@ ] @@ -78,15 +78,6 @@ dataset = None --- a/tests/test_inspect.py 2024-02-21 10:03:32.315520016 +0100 +++ b/tests/test_inspect.py 2024-02-21 10:03:50.345553490 +0100 -@@ -18,7 +18,7 @@ - pytestmark = pytest.mark.integration - - --@pytest.mark.parametrize("path", ["paws", csv.__file__]) -+@pytest.mark.parametrize("path", [csv.__file__]) - def test_inspect_dataset(path, tmp_path): - inspect_dataset(path, tmp_path) - script_name = Path(path).stem + ".py" @@ -49,6 +49,7 @@ assert list(info.splits.keys()) == expected_splits |