Make datasets in `ConcatDataset` not need to be sized (#64114)

author Santiago Castro <sacastro@umich.edu>

Wed, 1 Sep 2021 22:18:14 +0000 (15:18 -0700)

committer Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>

Wed, 1 Sep 2021 22:32:50 +0000 (15:32 -0700)
author Santiago Castro <sacastro@umich.edu>
Wed, 1 Sep 2021 22:18:14 +0000 (15:18 -0700)
committer Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>
Wed, 1 Sep 2021 22:32:50 +0000 (15:32 -0700)
diff --git a/torch/utils/data/dataset.py b/torch/utils/data/dataset.py

index 609e1a1..50488d1 100644
--- a/torch/utils/data/dataset.py
+++ b/torch/utils/data/dataset.py
@@ -271,9 +271,8 @@ class ConcatDataset(Dataset[T_co]):
  
      def __init__(self, datasets: Iterable[Dataset]) -> None:
          super(ConcatDataset, self).__init__()
-        # Cannot verify that datasets is Sized
-        assert len(datasets) > 0, 'datasets should not be an empty iterable'  # type: ignore[arg-type]
          self.datasets = list(datasets)
+        assert len(self.datasets) > 0, 'datasets should not be an empty iterable'  # type: ignore[arg-type]
          for d in self.datasets:
              assert not isinstance(d, IterableDataset), "ConcatDataset does not support IterableDataset"
          self.cumulative_sizes = self.cumsum(self.datasets)
author	Santiago Castro <sacastro@umich.edu>
	Wed, 1 Sep 2021 22:18:14 +0000 (15:18 -0700)
committer	Facebook GitHub Bot <facebook-github-bot@users.noreply.github.com>
	Wed, 1 Sep 2021 22:32:50 +0000 (15:32 -0700)