@@ -73,10 +73,12 @@ class TestBasicCastsHalf(_TestBasicCasts):
...
@@ -73,10 +73,12 @@ class TestBasicCastsHalf(_TestBasicCasts):
deftearDown(self):
deftearDown(self):
self.handle._deactivate()
self.handle._deactivate()
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
deftest_linear_is_half(self):
deftest_linear_is_half(self):
self._test_linear(ALWAYS_HALF)
self._test_linear(ALWAYS_HALF)
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
@@ -69,6 +69,7 @@ class TestCheckpointing(unittest.TestCase):
...
@@ -69,6 +69,7 @@ class TestCheckpointing(unittest.TestCase):
'key: {}\nparam: {}\nrestored: {}\ndiff: {} for {}'.format(
'key: {}\nparam: {}\nrestored: {}\ndiff: {} for {}'.format(
key,paramA,paramB,paramA-paramB,test_setup))
key,paramA,paramB,paramA-paramB,test_setup))
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
deftest_restoring(self):
deftest_restoring(self):
nb_epochs=10
nb_epochs=10
nb_epochs_restore=nb_epochs//2
nb_epochs_restore=nb_epochs//2
...
@@ -220,6 +221,7 @@ class TestCheckpointing(unittest.TestCase):
...
@@ -220,6 +221,7 @@ class TestCheckpointing(unittest.TestCase):
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
@@ -39,15 +39,18 @@ class TestRnnCells(unittest.TestCase):
...
@@ -39,15 +39,18 @@ class TestRnnCells(unittest.TestCase):
outputs[-1].float().sum().backward()
outputs[-1].float().sum().backward()
fori,xinenumerate(xs):
fori,xinenumerate(xs):
self.assertEqual(x.grad.dtype,x.dtype)
self.assertEqual(x.grad.dtype,x.dtype)
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
deftest_rnn_cell_is_half(self):
deftest_rnn_cell_is_half(self):
cell=nn.RNNCell(self.h,self.h)
cell=nn.RNNCell(self.h,self.h)
self.run_cell_test(cell)
self.run_cell_test(cell)
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
deftest_gru_cell_is_half(self):
deftest_gru_cell_is_half(self):
cell=nn.GRUCell(self.h,self.h)
cell=nn.GRUCell(self.h,self.h)
self.run_cell_test(cell)
self.run_cell_test(cell)
@unittest.skip("The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Same error is also observed on CUDA. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/62")
@@ -96,7 +96,8 @@ class TestFusedAdam(TestFusedOptimizer):
...
@@ -96,7 +96,8 @@ class TestFusedAdam(TestFusedOptimizer):
deftest_float(self):
deftest_float(self):
self.gen_single_type_test(param_type=torch.float)
self.gen_single_type_test(param_type=torch.float)
@unittest.skip("NaN issue observed on ROCm as of 12/1/2021. The failing unit test is introduced by a PyTorch commit sometime in between rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0 and 2021/12/01. Please refer to https://github.com/ROCmSoftwarePlatform/apex/issues/63")