Commit 1af0a0a4 authored by letaoqin
Browse files

change the check for vector load

parent b19fe02b
...@@ -120,7 +120,7 @@ using DeviceGemmInstance = ...@@ -120,7 +120,7 @@ using DeviceGemmInstance =
8, 8,
8, 8,
true, true,
4, 1,
S<16, 16, 1>, // B1BlockTransfer S<16, 16, 1>, // B1BlockTransfer
S<0, 2, 1>, S<0, 2, 1>,
S<0, 2, 1>, S<0, 2, 1>,
......
...@@ -1028,8 +1028,7 @@ struct DeviceBatchedMultiheadAttentionForward_Xdl_CShuffle_V2 ...@@ -1028,8 +1028,7 @@ struct DeviceBatchedMultiheadAttentionForward_Xdl_CShuffle_V2
{ {
if(arg.d0_n_length_stride_[1] == 1) if(arg.d0_n_length_stride_[1] == 1)
{ {
if(!(arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector == 0 || if(arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector != 0)
Transform::matrix_padder.PadN))
return false; return false;
} }
else if(Acc0BiasTransferSrcScalarPerVector != 1) else if(Acc0BiasTransferSrcScalarPerVector != 1)
......
...@@ -744,8 +744,7 @@ struct DeviceBatchedMultiheadAttentionInfer_Xdl_CShuffle ...@@ -744,8 +744,7 @@ struct DeviceBatchedMultiheadAttentionInfer_Xdl_CShuffle
{ {
if(arg.d0_n_length_stride_[1] == 1) if(arg.d0_n_length_stride_[1] == 1)
{ {
if(!(arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector == 0 || if(arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector != 0)
Transform::matrix_padder.PadN))
return false; return false;
} }
else if(Acc0BiasTransferSrcScalarPerVector != 1) else if(Acc0BiasTransferSrcScalarPerVector != 1)
......
...@@ -1104,9 +1104,7 @@ struct DeviceGroupedMultiheadAttentionForward_Xdl_CShuffle_V2 ...@@ -1104,9 +1104,7 @@ struct DeviceGroupedMultiheadAttentionForward_Xdl_CShuffle_V2
{ {
if(device_arg.d0_n_length_stride_[1] == 1) if(device_arg.d0_n_length_stride_[1] == 1)
{ {
if(!(device_arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector == if(device_arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector != 0)
0 ||
Transform::matrix_padder.PadN))
return false; return false;
} }
else if(Acc0BiasTransferSrcScalarPerVector != 1) else if(Acc0BiasTransferSrcScalarPerVector != 1)
......
...@@ -788,9 +788,7 @@ struct DeviceGroupedMultiheadAttentionInfer_Xdl_CShuffle ...@@ -788,9 +788,7 @@ struct DeviceGroupedMultiheadAttentionInfer_Xdl_CShuffle
if(device_arg.d0_n_length_stride_[1] == 1) if(device_arg.d0_n_length_stride_[1] == 1)
{ {
if(!(device_arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector == if(device_arg.d0_n_length_stride_[0] % Acc0BiasTransferSrcScalarPerVector != 0)
0 ||
Transform::matrix_padder.PadN))
{ {
return false; return false;
} }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment