Merge pull request #1329 from NVIDIA/leave_bottleneck_masks_as_bool

Leave bottleneck masks as bool

Merge pull request #1329 from NVIDIA/leave_bottleneck_masks_as_bool
Leave bottleneck masks as bool
1a43f292 · Thor Johnsen · GitHub · 7e1c22d0 · bd7c1a0f · 1a43f292
Unverified commit 1a43f292, authored Mar 15, 2022 by Thor Johnsen; committed by GitHub on Mar 15, 2022.
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

apex/contrib/bottleneck/bottleneck.py (+2 -2)

No files found.
--- a/apex/contrib/bottleneck/bottleneck.py
+++ b/apex/contrib/bottleneck/bottleneck.py
@@ -36,14 +36,14 @@ class FrozenBatchNorm2d(torch.nn.Module):
 @torch.jit.script
 def drelu_dscale1(grad_o, output, scale1):
-    relu_mask = (output>0).half()
+    relu_mask = (output>0)
    dx_relu = relu_mask * grad_o
    g1 = dx_relu * scale1
    return g1, dx_relu
 @torch.jit.script
 def drelu_dscale2(grad_o, output, scale1, scale2):
-    relu_mask = (output>0).half()
+    relu_mask = (output>0)
    dx_relu = relu_mask * grad_o
    g1 = dx_relu * scale1
    g2 = dx_relu * scale2