Commit a8409d7f authored by Khalique Ahmed's avatar Khalique Ahmed
Browse files

hardcode compute type

parent 00d5d880
......@@ -65,11 +65,13 @@ void gemm_impl(context& ctx,
output_type = rocblas_datatype_i32_r;
}
auto compute_type = output_type;
if(ctx.get_stream().get_device_name() == "gfx908")
{
if(args[0].get_shape().type() == shape::half_type)
if(args[0].get_shape().type() == shape::half_type)
compute_type = rocblas_datatype_f32_r;
}
// if(ctx.get_stream().get_device_name() == "gfx908")
// {
// if(args[0].get_shape().type() == shape::half_type)
// compute_type = rocblas_datatype_f32_r;
// }
#if ROCBLAS_VERSION_MAJOR >= 2 && ROCBLAS_VERSION_MINOR >= 38
rocblas_gemm_flags flag =
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment