Unverified commit eaebb306, authored by Shilong Zhang, committed by GitHub
Browse files

Fix DCN forward and backward when batch size is larger than im2col_step (#1212)

parent 571e3e5f
...@@ -278,6 +278,8 @@ void DeformConvForwardCUDAKernelLauncher(Tensor input, Tensor weight, ...@@ -278,6 +278,8 @@ void DeformConvForwardCUDAKernelLauncher(Tensor input, Tensor weight,
} }
columns = columns =
columns.view({columns.size(0) * columns.size(1), columns.size(2)}); columns.view({columns.size(0) * columns.size(1), columns.size(2)});
weight = weight.view({weight.size(0) * weight.size(1), weight.size(2),
weight.size(3), weight.size(4)});
} }
output_buffer = output_buffer.view( output_buffer = output_buffer.view(
...@@ -384,6 +386,8 @@ void DeformConvBackwardInputCUDAKernelLauncher( ...@@ -384,6 +386,8 @@ void DeformConvBackwardInputCUDAKernelLauncher(
deformable_col2im(columns, offset[elt], nInputPlane, inputHeight, deformable_col2im(columns, offset[elt], nInputPlane, inputHeight,
inputWidth, kH, kW, padH, padW, dH, dW, dilationH, inputWidth, kH, kW, padH, padW, dH, dW, dilationH,
dilationW, im2col_step, deformable_group, gradInput[elt]); dilationW, im2col_step, deformable_group, gradInput[elt]);
weight = weight.view({weight.size(0) * weight.size(1), weight.size(2),
weight.size(3), weight.size(4)});
} }
gradOutput.transpose_(1, 2); gradOutput.transpose_(1, 2);
......
...@@ -386,6 +386,8 @@ void DeformConvBackwardInputCUDAKernelLauncher( ...@@ -386,6 +386,8 @@ void DeformConvBackwardInputCUDAKernelLauncher(
deformable_col2im(columns, offset[elt], nInputPlane, inputHeight, deformable_col2im(columns, offset[elt], nInputPlane, inputHeight,
inputWidth, kH, kW, padH, padW, dH, dW, dilationH, inputWidth, kH, kW, padH, padW, dH, dW, dilationH,
dilationW, im2col_step, deformable_group, gradInput[elt]); dilationW, im2col_step, deformable_group, gradInput[elt]);
weight = weight.view({weight.size(0) * weight.size(1), weight.size(2),
weight.size(3), weight.size(4)});
} }
gradOutput.transpose_(1, 2); gradOutput.transpose_(1, 2);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment