Unverified commit 6e453f1a, authored by kkHuang-amd and committed by GitHub
Browse files

Merge pull request #99 from ROCmSoftwarePlatform/dev/hubertlu/fused_dense_debug

Fix a bug in fused_dense_cuda on ROCm
parents 4dcf30a6 d63b5d1f
......@@ -2,7 +2,7 @@ import unittest
import sys
test_dirs = ["groupbn", "layer_norm", "multihead_attn", "transducer", "focal_loss", "index_mul_2d", "."] # "." for test_label_smoothing.py
test_dirs = ["groupbn", "fused_dense", "layer_norm", "multihead_attn", "transducer", "focal_loss", "index_mul_2d", "."] # "." for test_label_smoothing.py
ROCM_BLACKLIST = [
"layer_norm"
]
......
......@@ -62,7 +62,7 @@ std::vector<at::Tensor> linear_bias_backward(at::Tensor input, at::Tensor weight
// create output/workspace tensor
auto d_weight = at::empty({out_features, in_features}, input.type());
#if defined(CUBLAS_VERSION) && CUBLAS_VERSION < 11600
#if (defined(CUBLAS_VERSION) && CUBLAS_VERSION < 11600) || __HIP_PLATFORM_HCC__
auto d_bias = d_output.view({-1, out_features}).sum(0, false);
#else
auto d_bias = at::empty({out_features}, input.type());
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment