Commit 94e983ad authored by Paul
Browse files

Improve calculation with vectorization

parent 7b82fd5b
......@@ -52,12 +52,12 @@ struct softmax_compiler : compiler<softmax_compiler>
auto faxis = find_fast_axis({inputs.front()});
vectorize vec{};
// Vectorize if the axis is a reduction axis
if(inputs.back().lens()[faxis] == 1)
if(faxis == axis)
{
vec = vectorize::elements(faxis, inputs);
}
auto relements = inputs[0].lens()[axis] / vec.size;
auto nelements = inputs.back().elements() / relements;
auto nelements = (inputs.back().elements() / inputs[0].lens()[axis]) / vec.size;
auto block_size = compute_block_size(relements, 256);
hip_compile_options options;
options.set_launch_params(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment