Commit ab239e0a authored by yuguo960516yuguo
Browse files

hgemm fp32 ctype

parent d2d32668
...@@ -922,7 +922,7 @@ inline void Blas<paddle::platform::CUDADeviceContext>::GEMM( ...@@ -922,7 +922,7 @@ inline void Blas<paddle::platform::CUDADeviceContext>::GEMM(
C, C,
rocblas_datatype_f16_r, rocblas_datatype_f16_r,
N, N,
rocblas_datatype_f16_r); rocblas_datatype_f32_r);
} }
template <> template <>
template <> template <>
...@@ -977,7 +977,7 @@ inline void Blas<phi::GPUContext>::GEMM(CBLAS_TRANSPOSE transA, ...@@ -977,7 +977,7 @@ inline void Blas<phi::GPUContext>::GEMM(CBLAS_TRANSPOSE transA,
C, C,
rocblas_datatype_f16_r, rocblas_datatype_f16_r,
N, N,
rocblas_datatype_f16_r); rocblas_datatype_f32_r);
} }
template <> template <>
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment