Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
vision
Commits
7b5075fc
"vscode:/vscode.git/clone" did not exist on "f0b2f6ce054c9f42e5515699da299f8ff69ed77f"
Unverified
Commit
7b5075fc
authored
Oct 17, 2019
by
Francisco Massa
Committed by
GitHub
Oct 17, 2019
Browse files
Fix CUDA builds on Windows (#1485)
parent
53b062ca
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
16 additions
and
4 deletions
+16
-4
torchvision/csrc/cuda/PSROIAlign_cuda.cu
torchvision/csrc/cuda/PSROIAlign_cuda.cu
+8
-2
torchvision/csrc/cuda/PSROIPool_cuda.cu
torchvision/csrc/cuda/PSROIPool_cuda.cu
+8
-2
No files found.
torchvision/csrc/cuda/PSROIAlign_cuda.cu
View file @
7b5075fc
...
@@ -336,7 +336,10 @@ std::tuple<at::Tensor, at::Tensor> PSROIAlign_forward_cuda(
...
@@ -336,7 +336,10 @@ std::tuple<at::Tensor, at::Tensor> PSROIAlign_forward_cuda(
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
output_size
,
512L
),
4096L
));
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
static_cast
<
int64_t
>
(
output_size
),
static_cast
<
int64_t
>
(
512
)),
static_cast
<
int64_t
>
(
4096
)));
dim3
block
(
512
);
dim3
block
(
512
);
AT_DISPATCH_FLOATING_TYPES_AND_HALF
(
AT_DISPATCH_FLOATING_TYPES_AND_HALF
(
...
@@ -395,7 +398,10 @@ at::Tensor PSROIAlign_backward_cuda(
...
@@ -395,7 +398,10 @@ at::Tensor PSROIAlign_backward_cuda(
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
grad
.
numel
(),
512L
),
4096L
));
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
static_cast
<
int64_t
>
(
grad
.
numel
()),
static_cast
<
int64_t
>
(
512
)),
static_cast
<
int64_t
>
(
4096
)));
dim3
block
(
512
);
dim3
block
(
512
);
// handle possibly empty gradients
// handle possibly empty gradients
...
...
torchvision/csrc/cuda/PSROIPool_cuda.cu
View file @
7b5075fc
...
@@ -173,7 +173,10 @@ std::tuple<at::Tensor, at::Tensor> PSROIPool_forward_cuda(
...
@@ -173,7 +173,10 @@ std::tuple<at::Tensor, at::Tensor> PSROIPool_forward_cuda(
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
output_size
,
512L
),
4096L
));
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
static_cast
<
int64_t
>
(
output_size
),
static_cast
<
int64_t
>
(
512
)),
static_cast
<
int64_t
>
(
4096
)));
dim3
block
(
512
);
dim3
block
(
512
);
AT_DISPATCH_FLOATING_TYPES_AND_HALF
(
AT_DISPATCH_FLOATING_TYPES_AND_HALF
(
...
@@ -229,7 +232,10 @@ at::Tensor PSROIPool_backward_cuda(
...
@@ -229,7 +232,10 @@ at::Tensor PSROIPool_backward_cuda(
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
cudaStream_t
stream
=
at
::
cuda
::
getCurrentCUDAStream
();
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
grad
.
numel
(),
512L
),
4096L
));
dim3
grid
(
std
::
min
(
at
::
cuda
::
ATenCeilDiv
(
static_cast
<
int64_t
>
(
grad
.
numel
()),
static_cast
<
int64_t
>
(
512
)),
static_cast
<
int64_t
>
(
4096
)));
dim3
block
(
512
);
dim3
block
(
512
);
// handle possibly empty gradients
// handle possibly empty gradients
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment