"profiler/vscode:/vscode.git/clone" did not exist on "f3aceeabf1f2ab3a44e30d08761a7235019b715d"
Commit 480cc884 authored by ltqin
Browse files

change input parameter

parent 84e76a16
...@@ -40,19 +40,19 @@ cmake \ ...@@ -40,19 +40,19 @@ cmake \
#arg3: run kernel # of times (>1) #arg3: run kernel # of times (>1)
#arg4: is show log (0=no, 1=yes) #arg4: is show log (0=no, 1=yes)
#arg5 to 19: N, K, C, Y, X, Hi, Wi, Sy, Sx, Dy, Dx, LeftPy, LeftPx, RightPy, RightPx, split-k #arg5: split-k; arg6 to 19: N, K, C, Y, X, Hi, Wi, Sy, Sx, Dy, Dx, LeftPy, LeftPx, RightPy, RightPx
./example/conv2d_fwd_xdl 0 1 5 1 ./example/conv2d_fwd_xdl 0 1 5 0 4
``` ```
Result Result
``` ```
in_n_c_hi_wi: dim 4, lengths {128, 128, 71, 71}, strides {645248, 1, 9088, 128} in_n_c_hi_wi: dim 4, lengths {128, 1024, 14, 14}, strides {200704, 1, 14336, 1024}
wei_k_c_y_x: dim 4, lengths {256, 128, 3, 3}, strides {1152, 1, 384, 128} wei_k_c_y_x: dim 4, lengths {256, 1024, 3, 3}, strides {9216, 1, 3072, 1024}
out_n_k_ho_wo: dim 4, lengths {128, 256, 36, 36}, strides {331776, 1, 9216, 256} out_n_k_ho_wo: dim 4, lengths {128, 256, 6, 6}, strides {9216, 1, 1536, 256}
arg.a_grid_desc_kbatch_k0_m_k1_{1, 20736, 256} arg.a_grid_desc_kbatch_k0_m_k1_{4, 144, 256, 8}
arg.b_grid_desc_kbatch_k0_n_k1_{1, 20736, 1152} arg.b_grid_desc_kbatch_k0_n_k1_{4, 144, 9216, 8}
arg.c_grid_desc_m_n_{ 256, 1152} arg.c_grid_desc_m_n_{ 256, 9216}
launch_and_time_kernel: grid_dim {18, 1, 1}, block_dim {256, 1, 1} launch_and_time_kernel: grid_dim {576, 1, 1}, block_dim {256, 1, 1}
Warm up Warm up
Start running 5 times... Start running 5 times...
Perf: 12.0997 ms, 8.08653 TFlops, 20.7201 GB/s Perf: 0.401084 ms, 54.2112 TFlops, 145.75 GB/s
``` ```
...@@ -79,24 +79,24 @@ int main(int argc, char* argv[]) ...@@ -79,24 +79,24 @@ int main(int argc, char* argv[])
int init_method = 0; int init_method = 0;
int nrepeat = 5; int nrepeat = 5;
int do_log = 0; int do_log = 0;
int split_k = 1; int split_k = 4;
// Conv shape // Conv shape
ck::index_t N = 128; ck::index_t N = 128;
ck::index_t K = 256; ck::index_t K = 256;
ck::index_t C = 128; ck::index_t C = 1024;
ck::index_t Y = 3; ck::index_t Y = 3;
ck::index_t X = 3; ck::index_t X = 3;
ck::index_t Hi = 71; ck::index_t Hi = 14;
ck::index_t Wi = 71; ck::index_t Wi = 14;
ck::index_t conv_stride_h = 2; ck::index_t conv_stride_h = 2;
ck::index_t conv_stride_w = 2; ck::index_t conv_stride_w = 2;
ck::index_t conv_dilation_h = 1; ck::index_t conv_dilation_h = 1;
ck::index_t conv_dilation_w = 1; ck::index_t conv_dilation_w = 1;
ck::index_t in_left_pad_h = 1; ck::index_t in_left_pad_h = 0;
ck::index_t in_left_pad_w = 1; ck::index_t in_left_pad_w = 0;
ck::index_t in_right_pad_h = 1; ck::index_t in_right_pad_h = 0;
ck::index_t in_right_pad_w = 1; ck::index_t in_right_pad_w = 0;
if(argc == 6) if(argc == 6)
{ {
...@@ -136,8 +136,9 @@ int main(int argc, char* argv[]) ...@@ -136,8 +136,9 @@ int main(int argc, char* argv[])
printf("arg2: initialization (0=no init, 1=integer value, 2=decimal value)\n"); printf("arg2: initialization (0=no init, 1=integer value, 2=decimal value)\n");
printf("arg3: run kernel # of times (>1)\n"); printf("arg3: run kernel # of times (>1)\n");
printf("arg4: is show log (0=no, 1=yes)\n"); printf("arg4: is show log (0=no, 1=yes)\n");
printf("arg5 to 19: N, K, C, Y, X, Hi, Wi, Sy, Sx, Dy, Dx, LeftPy, LeftPx, RightPy, " printf("arg5: split-k \n");
"RightPx, split-k\n"); printf("arg6 to 19: N, K, C, Y, X, Hi, Wi, Sy, Sx, Dy, Dx, LeftPy, LeftPx, RightPy, "
"RightPx\n");
exit(0); exit(0);
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment