"vscode:/vscode.git/clone" did not exist on "3e3d46924b4fd1fa36ccbc5605ed619cdcc00dbf"
Unverified commit 0cba9b78, authored by Philip Meier, committed by GitHub
Browse files

enforce shuffling before sharding (#5680)

* enforce shuffling before sharding

* revert test changes and add comment
parent 96aecd2d
...@@ -72,6 +72,6 @@ class SVHN(Dataset): ...@@ -72,6 +72,6 @@ class SVHN(Dataset):
dp = resource_dps[0] dp = resource_dps[0]
dp = Mapper(dp, self._read_images_and_labels) dp = Mapper(dp, self._read_images_and_labels)
dp = UnBatcher(dp) dp = UnBatcher(dp)
dp = hint_sharding(dp)
dp = hint_shuffling(dp) dp = hint_shuffling(dp)
dp = hint_sharding(dp)
return Mapper(dp, self._prepare_sample) return Mapper(dp, self._prepare_sample)
...@@ -49,6 +49,6 @@ class USPS(Dataset): ...@@ -49,6 +49,6 @@ class USPS(Dataset):
) -> IterDataPipe[Dict[str, Any]]: ) -> IterDataPipe[Dict[str, Any]]:
dp = Decompressor(resource_dps[0]) dp = Decompressor(resource_dps[0])
dp = LineReader(dp, decode=True, return_path=False) dp = LineReader(dp, decode=True, return_path=False)
dp = hint_sharding(dp)
dp = hint_shuffling(dp) dp = hint_shuffling(dp)
dp = hint_sharding(dp)
return Mapper(dp, self._prepare_sample) return Mapper(dp, self._prepare_sample)
...@@ -154,8 +154,8 @@ class VOC(Dataset): ...@@ -154,8 +154,8 @@ class VOC(Dataset):
split_dp = Filter(split_dp, functools.partial(self._is_in_folder, name=self._SPLIT_FOLDER[config.task])) split_dp = Filter(split_dp, functools.partial(self._is_in_folder, name=self._SPLIT_FOLDER[config.task]))
split_dp = Filter(split_dp, path_comparator("name", f"{config.split}.txt")) split_dp = Filter(split_dp, path_comparator("name", f"{config.split}.txt"))
split_dp = LineReader(split_dp, decode=True) split_dp = LineReader(split_dp, decode=True)
split_dp = hint_sharding(split_dp)
split_dp = hint_shuffling(split_dp) split_dp = hint_shuffling(split_dp)
split_dp = hint_sharding(split_dp)
dp = split_dp dp = split_dp
for level, data_dp in enumerate((images_dp, anns_dp)): for level, data_dp in enumerate((images_dp, anns_dp)):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment