Commit 25ae3d1b authored by rocking
Browse files

use raw store to improve performance

parent 62fa36cf
...@@ -204,7 +204,7 @@ float layernorm2d_fwd_(const S& s, A a) ...@@ -204,7 +204,7 @@ float layernorm2d_fwd_(const S& s, A a)
using TwoPassPipeline = ck_tile::Layernorm2dFwdPipelineTwoPass<PipelineProblem>; using TwoPassPipeline = ck_tile::Layernorm2dFwdPipelineTwoPass<PipelineProblem>;
using Pipeline = std::conditional_t<Traits_::kTwoPass, TwoPassPipeline, OnePassPipeline>; using Pipeline = std::conditional_t<Traits_::kTwoPass, TwoPassPipeline, OnePassPipeline>;
using Default2DEpilogueProblem = ck_tile::Default2DEpilogueProblem<ComputeDataType, YDataType, false, Traits_::kPadN, false>; using Default2DEpilogueProblem = ck_tile::Default2DEpilogueProblem<ComputeDataType, YDataType, false, Traits_::kPadN, true>;
using Default2DEpilogue = ck_tile::Default2DEpilogue<Default2DEpilogueProblem>; using Default2DEpilogue = ck_tile::Default2DEpilogue<Default2DEpilogueProblem>;
static constexpr bool UseSmoothInputScale = Traits_::kFusedQuant == 1; static constexpr bool UseSmoothInputScale = Traits_::kFusedQuant == 1;
...@@ -327,7 +327,7 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t, ...@@ -327,7 +327,7 @@ float layernorm2d_fwd(layernorm2d_fwd_traits t,
@dataclass @dataclass
class k_pipeline_one_pass: class k_pipeline_one_pass:
F_Problem : Any #k_problem F_Problem : Any #k_problem
@dataclass @dataclass
class k_pipeline_two_pass: class k_pipeline_two_pass:
F_Problem : Any #k_problem F_Problem : Any #k_problem
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment