Commit 5024f317 authored by carlushuang
Browse files

fix bug

parent 02684438
...@@ -623,10 +623,6 @@ struct GridwiseGemmBiasActivationAddAvx2_MxN ...@@ -623,10 +623,6 @@ struct GridwiseGemmBiasActivationAddAvx2_MxN
c_threadwise_copy.SetSrc2SliceOrigin(c_block_desc, c_threadwise_copy.SetSrc2SliceOrigin(c_block_desc,
GetCIndex(i_mc, i_nc)); GetCIndex(i_mc, i_nc));
_mm_prefetch(reinterpret_cast<const float*>(c1_grid_buf.p_data_) +
c_threadwise_copy.src2_offset,
_MM_HINT_T1);
if constexpr(!UseCLocalBuffer) if constexpr(!UseCLocalBuffer)
{ {
c_threadwise_copy.SetSrcSliceOrigin(c_block_desc, c_threadwise_copy.SetSrcSliceOrigin(c_block_desc,
......
...@@ -2403,7 +2403,7 @@ struct ThreadwiseTensorSliceTransferAvx2Specialization_MatC_Store_Bias_Residual_ ...@@ -2403,7 +2403,7 @@ struct ThreadwiseTensorSliceTransferAvx2Specialization_MatC_Store_Bias_Residual_
// dst_slice_origin_step_idx need to be known at compile-time, for performance reason // dst_slice_origin_step_idx need to be known at compile-time, for performance reason
void MoveDstSliceWindow(const DstDesc&, const Index&) {} void MoveDstSliceWindow(const DstDesc&, const Index&) {}
// private: private:
const ElementwiseOperation element_op_; const ElementwiseOperation element_op_;
intptr_t i_dst_gemm_m; intptr_t i_dst_gemm_m;
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment