"driver/vscode:/vscode.git/clone" did not exist on "f2f35201f40d2a36c6c475554ec2b33fc4e0bbf1"
Commit 85a7aa89 authored by mtgu0705
Browse files

fix bug, function now passes.

parent 279e2eaf
...@@ -339,19 +339,21 @@ struct DeviceGemm_Xdl_CShuffleV3_BPreshuffle : public DeviceGemmV2BPreshuffle<AL ...@@ -339,19 +339,21 @@ struct DeviceGemm_Xdl_CShuffleV3_BPreshuffle : public DeviceGemmV2BPreshuffle<AL
if(arg.KBatch > 1) if(arg.KBatch > 1)
{ {
const auto kernel = const auto kernel =
kernel_gemm_xdl_cshuffle_v3<GridwiseGemm, kernel_gemm_xdl_cshuffle_v3_b_preshuffle<GridwiseGemm,
false, false,
InMemoryDataOperationEnum::AtomicAdd, InMemoryDataOperationEnum::AtomicAdd,
minimum_occupancy>; minimum_occupancy,
TailNumber::Odd>;
Run(kernel); Run(kernel);
} }
else else
{ {
const auto kernel = const auto kernel =
kernel_gemm_xdl_cshuffle_v3<GridwiseGemm, kernel_gemm_xdl_cshuffle_v3_b_preshuffle<GridwiseGemm,
false, false,
InMemoryDataOperationEnum::Set, InMemoryDataOperationEnum::Set,
minimum_occupancy>; minimum_occupancy,
TailNumber::Odd>;
Run(kernel); Run(kernel);
} }
} }
......
...@@ -377,14 +377,14 @@ struct ThreadwiseTensorSliceTransfer_v2 ...@@ -377,14 +377,14 @@ struct ThreadwiseTensorSliceTransfer_v2
if constexpr(InvalidElementAsNaN) if constexpr(InvalidElementAsNaN)
{ {
dst_buf(Number<dst_offset / PackedSize>{}) = dst_buf(Number<dst_offset>{}) =
is_src_valid is_src_valid
? type_convert<DstData>(src_vector.template AsType<SrcData>()[i]) ? type_convert<DstData>(src_vector.template AsType<SrcData>()[i])
: NumericLimits<DstData>::QuietNaN(); : NumericLimits<DstData>::QuietNaN();
} }
else else
{ {
dst_buf(Number<dst_offset / PackedSize>{}) = dst_buf(Number<dst_offset>{}) =
type_convert<DstData>(src_vector.template AsType<SrcData>()[i]); type_convert<DstData>(src_vector.template AsType<SrcData>()[i]);
} }
}); });
...@@ -1619,7 +1619,7 @@ struct ThreadwiseTensorSliceTransfer_StaticToStatic ...@@ -1619,7 +1619,7 @@ struct ThreadwiseTensorSliceTransfer_StaticToStatic
constexpr index_t src_offset = src_desc.CalculateOffset( constexpr index_t src_offset = src_desc.CalculateOffset(
src_slice_origin_idx + idx_md + i * dst_scalar_step_in_vector); src_slice_origin_idx + idx_md + i * dst_scalar_step_in_vector);
src_tmp_vector.template AsType<SrcData>()(i) = src_buf[Number<src_offset / PackedSize>{}]; src_tmp_vector.template AsType<SrcData>()(i) = src_buf[Number<src_offset>{}];
}); });
// copy data from src_tmp_vector to dst_tmp_vector (data cast data from SrcData to // copy data from src_tmp_vector to dst_tmp_vector (data cast data from SrcData to
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment