Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
apex
Commits
4d3ee390
Commit
4d3ee390
authored
Oct 08, 2023
by
flyingdown
Browse files
fix revert fused_dense to fp32_r
parent
0f6bf5a9
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
0 additions
and
48 deletions
+0
-48
csrc/fused_dense_cuda.cu
csrc/fused_dense_cuda.cu
+0
-48
No files found.
csrc/fused_dense_cuda.cu
View file @
4d3ee390
...
@@ -163,53 +163,6 @@ cublasStatus_t gemm_bias(
...
@@ -163,53 +163,6 @@ cublasStatus_t gemm_bias(
const
float
*
beta
,
const
float
*
beta
,
at
::
Half
*
C
,
at
::
Half
*
C
,
int
ldc
)
{
int
ldc
)
{
<<<<<<<
HEAD
if
(
parseEnvVarFlag
(
"APEX_ROCBLAS_GEMM_ALLOW_HALF"
))
{
half
h_alpha
=
__float2half
(
*
alpha
);
half
h_beta
=
__float2half
(
*
beta
);
return
cublasGemmEx
(
handle
,
transa
,
transb
,
m
,
n
,
k
,
/* alpha */
&
h_alpha
,
A
,
CUDA_R_16F
,
lda
,
B
,
CUDA_R_16F
,
ldb
,
/* beta */
&
h_beta
,
C
,
CUDA_R_16F
,
ldc
,
/* CUDA_R_32F */
CUDA_R_16F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
}
else
{
return
cublasGemmEx
(
handle
,
transa
,
transb
,
m
,
n
,
k
,
alpha
,
A
,
CUDA_R_16F
,
lda
,
B
,
CUDA_R_16F
,
ldb
,
beta
,
C
,
CUDA_R_16F
,
ldc
,
CUDA_R_32F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
}
=======
#ifdef __HIP_PLATFORM_HCC__
#ifdef __HIP_PLATFORM_HCC__
return
rocblas_gemm_ex
(
return
rocblas_gemm_ex
(
handle
,
handle
,
...
@@ -258,7 +211,6 @@ cublasStatus_t gemm_bias(
...
@@ -258,7 +211,6 @@ cublasStatus_t gemm_bias(
CUDA_R_32F
,
CUDA_R_32F
,
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
CUBLAS_GEMM_DEFAULT_TENSOR_OP
);
#endif
#endif
>>>>>>>
mirror
/
master
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment