From abe7947ec079840b4e1c7305480752fd017569ad Mon Sep 17 00:00:00 2001 From: Charles Beauville Date: Mon, 16 Oct 2023 11:02:40 +0200 Subject: [PATCH 1/2] Fix CI by downgrading torch on fastai E2E (#2518) --- e2e/fastai/pyproject.toml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/e2e/fastai/pyproject.toml b/e2e/fastai/pyproject.toml index ebc19f6328ee..66fcb393d988 100644 --- a/e2e/fastai/pyproject.toml +++ b/e2e/fastai/pyproject.toml @@ -12,4 +12,4 @@ authors = ["The Flower Authors "] python = ">=3.8,<3.10" flwr = { path = "../../", develop = true, extras = ["simulation"] } fastai = "^2.7.12" -torch = ">=2.0.0, !=2.0.1" +torch = ">=2.0.0, !=2.0.1, < 2.1.0" From 73ff3e034646586c6872d44231b2c0ab2e8c1b4a Mon Sep 17 00:00:00 2001 From: Adam Narozniak <51029327+adam-narozniak@users.noreply.github.com> Date: Mon, 16 Oct 2023 11:07:58 +0200 Subject: [PATCH 2/2] Add 'subset' keyword to FederatedDataset (#2420) --- datasets/flwr_datasets/federated_dataset.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/datasets/flwr_datasets/federated_dataset.py b/datasets/flwr_datasets/federated_dataset.py index 8d171db2afa4..c4691da397fe 100644 --- a/datasets/flwr_datasets/federated_dataset.py +++ b/datasets/flwr_datasets/federated_dataset.py @@ -35,6 +35,9 @@ class FederatedDataset: ---------- dataset: str The name of the dataset in the Hugging Face Hub. + subset: Optional[str] + Secondary information regarding the dataset, most often a subset or version + (passed as the `name` argument to `datasets.load_dataset`). 
partitioners: Dict[str, Union[Partitioner, int]] A dictionary mapping the Dataset split (a `str`) to a `Partitioner` or an `int` (representing the number of IID partitions that this split should be partitioned @@ -59,10 +62,12 @@ def __init__( self, *, dataset: str, + subset: Optional[str] = None, partitioners: Dict[str, Union[Partitioner, int]], ) -> None: _check_if_dataset_tested(dataset) self._dataset_name: str = dataset + self._subset: Optional[str] = subset self._partitioners: Dict[str, Partitioner] = _instantiate_partitioners( partitioners ) @@ -121,7 +126,9 @@ def load_full(self, split: str) -> Dataset: def _download_dataset_if_none(self) -> None: """Lazily load (and potentially download) the Dataset instance into memory.""" if self._dataset is None: - self._dataset = datasets.load_dataset(self._dataset_name) + self._dataset = datasets.load_dataset( + path=self._dataset_name, name=self._subset + ) def _check_if_split_present(self, split: str) -> None: """Check if the split (for partitioning or full return) is in the dataset."""