Commit 83f75313 authored by rocking
Browse files

Let the grid size be a multiple of the number of CUs

parent b7a82d29
...@@ -86,7 +86,7 @@ struct DeviceBinaryElementwise : public BaseOperator ...@@ -86,7 +86,7 @@ struct DeviceBinaryElementwise : public BaseOperator
p_c_(p_c), p_c_(p_c),
functor_(functor), functor_(functor),
threadPerBlock_(threadPerBlock), threadPerBlock_(threadPerBlock),
gridSize_(128) // FIXME - Calculate the grid size by number of CU in the future gridSize_(120) // FIXME - Calculate the grid size by number of CU in the future
{ {
a_grid_desc_m0_ = MakeDescriptor_M0(shape, stride_a, gridSize_, threadPerBlock_); a_grid_desc_m0_ = MakeDescriptor_M0(shape, stride_a, gridSize_, threadPerBlock_);
b_grid_desc_m0_ = MakeDescriptor_M0(shape, stride_b, gridSize_, threadPerBlock_); b_grid_desc_m0_ = MakeDescriptor_M0(shape, stride_b, gridSize_, threadPerBlock_);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment