Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
apex
Commits
4d3ee390
You need to sign in or sign up before continuing.
Commit
4d3ee390
authored
Oct 08, 2023
by
flyingdown
Browse files
fix revert fused_dense to fp32_r
parent
0f6bf5a9
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
48 deletions
+0
-48
csrc/fused_dense_cuda.cu
csrc/fused_dense_cuda.cu
+0
-48
No files found.
csrc/fused_dense_cuda.cu
View file @
4d3ee390
...
@@ -163,53 +163,6 @@ cublasStatus_t gemm_bias(
...
@@ -163,53 +163,6 @@ cublasStatus_t gemm_bias(
const
float
*
beta
,
const
float
*
beta
,
at
::
Half
*
C
,
at
::
Half
*
C
,
int
ldc
)
{
int
ldc
)
{
<<<<<<<
HEAD
if
(
parseEnvVarFlag
(
"APEX_ROCBLAS_GEMM_ALLOW_HALF"
))
{
half
h_alpha
=
__float2half
(
*
alpha
);
half
h_beta
=
__float2half
(
*
beta
);
return
cublasGemmEx
(
handle
,
transa
,
transb
,
m
,
n
,
k
,
/* alpha */
&
h_alpha
,
A
,
CUDA_R_16F
,
lda
,
B
,
CUDA_R_16F
,
ldb
,
/* beta */
&
h_beta
,
C
,
CUDA_R_16F
,
ldc
,
/* CUDA_R_32F */
CUDA_R_16F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
}
else
{
return
cublasGemmEx
(
handle
,
transa
,
transb
,
m
,
n
,
k
,
alpha
,
A
,
CUDA_R_16F
,
lda
,
B
,
CUDA_R_16F
,
ldb
,
beta
,
C
,
CUDA_R_16F
,
ldc
,
CUDA_R_32F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
}
=======
#ifdef __HIP_PLATFORM_HCC__
#ifdef __HIP_PLATFORM_HCC__
return
rocblas_gemm_ex
(
return
rocblas_gemm_ex
(
handle
,
handle
,
...
@@ -258,7 +211,6 @@ cublasStatus_t gemm_bias(
...
@@ -258,7 +211,6 @@ cublasStatus_t gemm_bias(
CUDA_R_32F
,
CUDA_R_32F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
#endif
#endif
>>>>>>>
mirror
/
master
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment