Unverified commit 88d802ce, authored by zhanggefan, committed by GitHub
Browse files

[Fix] Fix the invalid cuda memory access when training s2anet (#1660)

parent b04ad69d
...@@ -14,7 +14,7 @@ void ActiveRotatedFilterForwardCUDAKernelLauncher(const Tensor input, ...@@ -14,7 +14,7 @@ void ActiveRotatedFilterForwardCUDAKernelLauncher(const Tensor input,
int kW = input.size(4); int kW = input.size(4);
int num_rotations = indices.size(3); int num_rotations = indices.size(3);
int nEntry = num_orientations * kH * kW; int nEntry = num_orientations * kH * kW;
int output_size = output.numel(); int output_size = input.numel();
at::cuda::CUDAGuard device_guard(input.device()); at::cuda::CUDAGuard device_guard(input.device());
cudaStream_t stream = at::cuda::getCurrentCUDAStream(); cudaStream_t stream = at::cuda::getCurrentCUDAStream();
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment