Commit 93e7f92a authored by Astha Rai
Browse files

removed debugging print statements

parent 16f02f76
...@@ -48,10 +48,10 @@ int main() ...@@ -48,10 +48,10 @@ int main()
bool do_verification = true; bool do_verification = true;
bool time_kernel = true; bool time_kernel = true;
const int N = 128; const int N = 120;
const int H = 128;
const int W = 128;
const int C = 128; const int C = 128;
const int H = 32;
const int W = 1024;
/**const int N = 120; /**const int N = 120;
const int H = 32; const int H = 32;
......
...@@ -83,10 +83,7 @@ struct DeviceElementwise : public DeviceElementwiseBase<InDataTypeTuple, ...@@ -83,10 +83,7 @@ struct DeviceElementwise : public DeviceElementwiseBase<InDataTypeTuple,
const index_t loop_step_n = num_threads_n * NPerThread; const index_t loop_step_n = num_threads_n * NPerThread;
const auto pad_m = math::integer_least_multiple(m, loop_step_m) - m; const auto pad_m = math::integer_least_multiple(m, loop_step_m) - m;
const auto pad_n = math::integer_least_multiple(n, loop_step_n) - n; const auto pad_n = math::integer_least_multiple(n, loop_step_n) - n;
std::cout << NumDim_m << " m: " << m << " loop_step_m: " << loop_step_m
<< " pad_m: " << pad_m << std::endl;
std::cout << NumDim_n << " n: " << n << " loop_step_n: " << loop_step_n
<< " pad_n: " << pad_n << std::endl;
const auto desc_mn_pad = transform_tensor_descriptor( const auto desc_mn_pad = transform_tensor_descriptor(
desc_mn, desc_mn,
make_tuple(make_right_pad_transform(m, pad_m), make_right_pad_transform(n, pad_n)), make_tuple(make_right_pad_transform(m, pad_m), make_right_pad_transform(n, pad_n)),
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment