[Fix] Fix Correlation op (#2274)

* fix correlation
* fix lint

[Fix] Fix Correlation op (#2274)
* fix correlation
* fix lint
b0646e0e · q.yao · Zaida Zhou · 6c89b717 · b0646e0e · b0646e0e
Commit b0646e0e, authored Oct 24, 2022 by q.yao; committed by Zaida Zhou on Nov 23, 2022.
Showing 2 changed files with 6 additions and 2 deletions

mmcv/ops/csrc/common/cuda/correlation_cuda.cuh mmcv/ops/csrc/common/cuda/correlation_cuda.cuh +5 -1

mmcv/ops/csrc/pytorch/cuda/correlation_cuda.cu mmcv/ops/csrc/pytorch/cuda/correlation_cuda.cu +1 -1

No files found.
--- a/mmcv/ops/csrc/common/cuda/correlation_cuda.cuh
+++ b/mmcv/ops/csrc/common/cuda/correlation_cuda.cuh
@@ -36,7 +36,8 @@ template <typename scalar_t>
 __global__ void correlation_forward_cuda_kernel(
    const TensorAcc4R rInput1, const TensorAcc4R rInput2, TensorAcc5R output,
    int kH, int kW, int patchH, int patchW, int padH, int padW, int dilationH,
-    int dilationW, int dilation_patchH, int dilation_patchW, int dH, int dW) {
+    int dilationW, int dilation_patchH, int dilation_patchW, int dH, int dW,
+    int oH, int oW) {
  const int iH = rInput1.size(1);
  const int iW = rInput1.size(2);
  const int C = rInput1.size(3);
@@ -44,6 +45,9 @@ __global__ void correlation_forward_cuda_kernel(
  const int n = blockIdx.x;
  const int h = blockIdx.y * blockDim.y + threadIdx.y;
  const int w = blockIdx.z * blockDim.z + threadIdx.z;
+  if (h >= oH || w >= oW) return;
  const int thread = threadIdx.x;
  const int start_i = -padH + h * dH;

--- a/mmcv/ops/csrc/pytorch/cuda/correlation_cuda.cu
+++ b/mmcv/ops/csrc/pytorch/cuda/correlation_cuda.cu
@@ -42,7 +42,7 @@ void CorrelationForwardCUDAKernelLauncher(Tensor input1, Tensor input2,
            <<<blocks, threads, 0, at::cuda::getCurrentCUDAStream()>>>(
                trInput1_acc, trInput2_acc, output_acc, kH, kW, patchH, patchW,
                padH, padW, dilationH, dilationW, dilation_patchH,
-                dilation_patchW, dH, dW);
+                dilation_patchW, dH, dW, oH, oW);
      }));
 }