Merge branch 'master' of https://github.com/NVIDIA/apex

6e39bee3 · Michael Carilli · bfa3e0ee · 251cddaf · 6e39bee3 · 6e39bee3
Commit 6e39bee3 authored Jun 22, 2018 by Michael Carilli
5 changed files
--- a/apex/amp/wrap.py
+++ b/apex/amp/wrap.py
@@ -191,11 +191,11 @@ def rnn_cast(backend, fn, verbose=False):
            # 2) Inputs: either a tuple (for LSTM) or single tensor
            if isinstance(hiddens, tuple):
                new_args.append(tuple(cast_fn(x) for x in hiddens))
-            elif utils.is_fp_tensor(hidden):
-                new_args.append(cast_fn(hidden))
+            elif utils.is_fp_tensor(hiddens):
+                new_args.append(cast_fn(hiddens))
            else:
-                # Hidden can, in principle, be `None` -- pass through
-                new_args.append(hidden)
+                # Hiddens can, in principle, be `None` -- pass through
+                new_args.append(hiddens)

            # 3) Batch sizes (0.4 or later only)
            if len(fargs) == 4:

--- a/csrc/scale_cuda.cu
+++ b/csrc/scale_cuda.cu
 #include <ATen/ATen.h>
 // #include "ATen/AccumulateType.h"
 #include "ATen/cuda/CUDATensorMethods.cuh"
-#include "ATen/cuda/CUDATypeConversion.cuh"
+// #include "ATen/cuda/CUDATypeConversion.cuh"
 // #include <THC/THCTensorMathReduce.cuh>
 #include <THC/THCGeneral.h>


--- a/csrc/weight_norm_bwd_cuda.cu
+++ b/csrc/weight_norm_bwd_cuda.cu
@@ -9,7 +9,7 @@
 #endif

 #include "ATen/cuda/CUDATensorMethods.cuh"
-#include "ATen/cuda/CUDATypeConversion.cuh"
+// #include "ATen/cuda/CUDATypeConversion.cuh"
 // #include <THC/THCTensorMathReduce.cuh>

 template

--- a/csrc/weight_norm_fwd_cuda.cu
+++ b/csrc/weight_norm_fwd_cuda.cu
@@ -9,7 +9,7 @@
 #endif

 #include "ATen/cuda/CUDATensorMethods.cuh"
-#include "ATen/cuda/CUDATypeConversion.cuh"
+// #include "ATen/cuda/CUDATypeConversion.cuh"
 // #include <THC/THCTensorMathReduce.cuh>

 template

--- a/setup.py
+++ b/setup.py
 import torch.cuda
+import ctypes
 import os
 import re
 import subprocess