add tests for prototype datasets API (#4667)

* add tests for prototype datasets API
* add pytest-mock as test dependency
* remove unnecessary fixtures
* Apply suggestions from code review

Co-authored-by: Nicolas Hug <contact@nicolas-hug.com>

* address first batch of review comments
* remove dynamic class generation
* aggregate similar tests
* split immutable tests once again
* removed unused fixture
* remove re.escape usages
* fix dataset mock

Co-authored-by: Nicolas Hug <contact@nicolas-hug.com>

add tests for prototype datasets API (#4667)
* add tests for prototype datasets API
* add pytest-mock as test dependency
* remove unnecessary fixtures
* Apply suggestions from code review

Co-authored-by: Nicolas Hug <contact@nicolas-hug.com>

* address first batch of review comments
* remove dynamic class generation
* aggregate similar tests
* split immutable tests once again
* removed unused fixture
* remove re.escape usages
* fix dataset mock

Co-authored-by: Nicolas Hug <contact@nicolas-hug.com>
f63f4658 · Philip Meier · GitHub · 48ebc0bb · f63f4658 · f63f4658
Unverified Commit f63f4658 authored Oct 31, 2021 by Philip Meier Committed by GitHub Oct 31, 2021
Showing with 249 additions and 4 deletions

.circleci/config.yml .circleci/config.yml +1 -1

.circleci/config.yml.in .circleci/config.yml.in +1 -1

test/test_prototype_datasets.py test/test_prototype_datasets.py +247 -2

No files found.
--- a/.circleci/config.yml
+++ b/.circleci/config.yml
@@ -274,7 +274,7 @@ jobs:
          command: pip install --user --progress-bar off --no-build-isolation .
      - run:
          name: Install test utilities
-          command: pip install --user --progress-bar=off pytest
+          command: pip install --user --progress-bar=off pytest pytest-mock
      - run:
          name: Run tests
          command: pytest test/test_prototype_*.py

--- a/.circleci/config.yml.in
+++ b/.circleci/config.yml.in
@@ -274,7 +274,7 @@ jobs:
          command: pip install --user --progress-bar off --no-build-isolation .
      - run:
          name: Install test utilities
-          command: pip install --user --progress-bar=off pytest
+          command: pip install --user --progress-bar=off pytest pytest-mock
      - run:
          name: Run tests
          command: pytest test/test_prototype_*.py

--- a/test/test_prototype_datasets.py
+++ b/test/test_prototype_datasets.py
-def test_smoke():
+import unittest.mock
-    import torchvision.prototype.datasets  # noqa: F401
+import pytest
+from torchvision.prototype import datasets
+from torchvision.prototype.datasets.utils._internal import FrozenMapping, FrozenBunch
+def make_minimal_dataset_info(name="name", type=datasets.utils.DatasetType.RAW, categories=None, **kwargs):
+    return datasets.utils.DatasetInfo(name, type=type, categories=categories or [], **kwargs)
+class TestFrozenMapping:
+    @pytest.mark.parametrize(
+        ("args", "kwargs"),
+        [
+            pytest.param((dict(foo="bar", baz=1),), dict(), id="from_dict"),
+            pytest.param((), dict(foo="bar", baz=1), id="from_kwargs"),
+            pytest.param((dict(foo="bar"),), dict(baz=1), id="mixed"),
+        ],
+    )
+    def test_instantiation(self, args, kwargs):
+        FrozenMapping(*args, **kwargs)
+    def test_unhashable_items(self):
+        with pytest.raises(TypeError, match="unhashable type"):
+            FrozenMapping(foo=[])
+    def test_getitem(self):
+        options = dict(foo="bar", baz=1)
+        config = FrozenMapping(options)
+        for key, value in options.items():
+            assert config[key] == value
+    def test_getitem_unknown(self):
+        with pytest.raises(KeyError):
+            FrozenMapping()["unknown"]
+    def test_iter(self):
+        options = dict(foo="bar", baz=1)
+        assert set(iter(FrozenMapping(options))) == set(options.keys())
+    def test_len(self):
+        options = dict(foo="bar", baz=1)
+        assert len(FrozenMapping(options)) == len(options)
+    def test_immutable_setitem(self):
+        frozen_mapping = FrozenMapping()
+        with pytest.raises(RuntimeError, match="immutable"):
+            frozen_mapping["foo"] = "bar"
+    def test_immutable_delitem(
+        self,
+    ):
+        frozen_mapping = FrozenMapping(foo="bar")
+        with pytest.raises(RuntimeError, match="immutable"):
+            del frozen_mapping["foo"]
+    def test_eq(self):
+        options = dict(foo="bar", baz=1)
+        assert FrozenMapping(options) == FrozenMapping(options)
+    def test_ne(self):
+        options1 = dict(foo="bar", baz=1)
+        options2 = options1.copy()
+        options2["baz"] += 1
+        assert FrozenMapping(options1) != FrozenMapping(options2)
+    def test_repr(self):
+        options = dict(foo="bar", baz=1)
+        output = repr(FrozenMapping(options))
+        assert isinstance(output, str)
+        for key, value in options.items():
+            assert str(key) in output and str(value) in output
+class TestFrozenBunch:
+    def test_getattr(self):
+        options = dict(foo="bar", baz=1)
+        config = FrozenBunch(options)
+        for key, value in options.items():
+            assert getattr(config, key) == value
+    def test_getattr_unknown(self):
+        with pytest.raises(AttributeError, match="no attribute 'unknown'"):
+            datasets.utils.DatasetConfig().unknown
+    def test_immutable_setattr(self):
+        frozen_bunch = FrozenBunch()
+        with pytest.raises(RuntimeError, match="immutable"):
+            frozen_bunch.foo = "bar"
+    def test_immutable_delattr(
+        self,
+    ):
+        frozen_bunch = FrozenBunch(foo="bar")
+        with pytest.raises(RuntimeError, match="immutable"):
+            del frozen_bunch.foo
+    def test_repr(self):
+        options = dict(foo="bar", baz=1)
+        output = repr(FrozenBunch(options))
+        assert isinstance(output, str)
+        assert output.startswith("FrozenBunch")
+        for key, value in options.items():
+            assert f"{key}={value}" in output
+class TestDatasetInfo:
+    @pytest.fixture
+    def info(self):
+        return make_minimal_dataset_info(valid_options=dict(split=("train", "test"), foo=("bar", "baz")))
+    def test_default_config(self, info):
+        valid_options = info._valid_options
+        default_config = datasets.utils.DatasetConfig({key: values[0] for key, values in valid_options.items()})
+        assert info.default_config == default_config
+    @pytest.mark.parametrize(
+        "valid_options",
+        [
+            pytest.param(None, id="default"),
+            pytest.param(dict(option=("value",)), id="no_split"),
+        ],
+    )
+    def test_default_config_split_train(self, valid_options):
+        info = make_minimal_dataset_info(valid_options=valid_options)
+        assert info.default_config.split == "train"
+    def test_valid_options_split_but_no_train(self):
+        with pytest.raises(ValueError, match="'train' has to be a valid argument for option 'split'"):
+            make_minimal_dataset_info(valid_options=dict(split=("test",)))
+    @pytest.mark.parametrize(
+        ("options", "expected_error_msg"),
+        [
+            pytest.param(dict(unknown_option=None), "Unknown option 'unknown_option'", id="unknown_option"),
+            pytest.param(dict(split="unknown_split"), "Invalid argument 'unknown_split'", id="invalid_argument"),
+        ],
+    )
+    def test_make_config_invalid_inputs(self, info, options, expected_error_msg):
+        with pytest.raises(ValueError, match=expected_error_msg):
+            info.make_config(**options)
+    def test_repr(self, info):
+        output = repr(info)
+        assert isinstance(output, str)
+        assert "DatasetInfo" in output
+        for key, value in info._valid_options.items():
+            assert f"{key}={str(value)[1:-1]}" in output
+    @pytest.mark.parametrize("optional_info", ("citation", "homepage", "license"))
+    def test_repr_optional_info(self, optional_info):
+        sentinel = "sentinel"
+        info = make_minimal_dataset_info(**{optional_info: sentinel})
+        assert f"{optional_info}={sentinel}" in repr(info)
+class TestDataset:
+    class DatasetMock(datasets.utils.Dataset):
+        def __init__(self, name="name", *, valid_options=None, resources=None):
+            self._name = name
+            self._valid_options = valid_options or dict(split=("train", "test"))
+            self.resources = unittest.mock.Mock(return_value=[]) if resources is None else lambda config: resources
+            self._make_datapipe = unittest.mock.Mock()
+            super().__init__()
+        def _make_info(self):
+            return datasets.utils.DatasetInfo(
+                self._name,
+                type=datasets.utils.DatasetType.RAW,
+                categories=[],
+                valid_options=self._valid_options,
+            )
+        def resources(self, config):
+            # This method is just defined to appease the ABC, but will be overwritten at instantiation
+            pass
+        def _make_datapipe(self, resource_dps, *, config, decoder):
+            # This method is just defined to appease the ABC, but will be overwritten at instantiation
+            pass
+    def test_name(self):
+        name = "sentinel"
+        dataset = self.DatasetMock(name=name)
+        assert dataset.name == name
+    def test_default_config(self):
+        sentinel = "sentinel"
+        valid_options = dict(split=(sentinel, "train"))
+        dataset = self.DatasetMock(valid_options=valid_options)
+        assert dataset.default_config == datasets.utils.DatasetConfig(split=sentinel)
+    @pytest.mark.parametrize(
+        ("config", "kwarg"),
+        [
+            pytest.param(*(datasets.utils.DatasetConfig(split="test"),) * 2, id="specific"),
+            pytest.param(make_minimal_dataset_info().default_config, None, id="default"),
+        ],
+    )
+    def test_to_datapipe_config(self, config, kwarg):
+        dataset = self.DatasetMock()
+        dataset.to_datapipe("", config=kwarg)
+        dataset.resources.assert_called_with(config)
+        (_, call_kwargs) = dataset._make_datapipe.call_args
+        assert call_kwargs["config"] == config
+    def test_resources(self, mocker):
+        resource_mock = mocker.Mock(spec=["to_datapipe"])
+        sentinel = object()
+        resource_mock.to_datapipe.return_value = sentinel
+        dataset = self.DatasetMock(resources=[resource_mock])
+        root = "root"
+        dataset.to_datapipe(root)
+        resource_mock.to_datapipe.assert_called_with(root)
+        (call_args, _) = dataset._make_datapipe.call_args
+        assert call_args[0][0] is sentinel
+    def test_decoder(self):
+        dataset = self.DatasetMock()
+        sentinel = object()
+        dataset.to_datapipe("", decoder=sentinel)
+        (_, call_kwargs) = dataset._make_datapipe.call_args
+        assert call_kwargs["decoder"] is sentinel