Commit 21cac0e5 authored by Jing Zhang
Browse files

enabled dwordx4 for fp16

parent 3c71fe87
...@@ -269,7 +269,7 @@ amd_buffer_load_impl_v2(int32x4_t src_wave_buffer_resource, ...@@ -269,7 +269,7 @@ amd_buffer_load_impl_v2(int32x4_t src_wave_buffer_resource,
else if constexpr(N == 8) else if constexpr(N == 8)
{ {
#if 1 #if 0
vector_type<half_t, 8> tmp; vector_type<half_t, 8> tmp;
tmp.AsType<half4_t>()(Number<0>{}) = __llvm_amdgcn_raw_buffer_load_fp16x4( tmp.AsType<half4_t>()(Number<0>{}) = __llvm_amdgcn_raw_buffer_load_fp16x4(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment