Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
11ec07e9
Unverified
Commit
11ec07e9
authored
Jul 01, 2021
by
Chao Liu
Committed by
GitHub
Jul 01, 2021
Browse files
Fix complaint about divide by zero (#40)
parent
3835318c
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
8 deletions
+8
-8
composable_kernel/src/kernel_wrapper/dynamic_convolution_forward_implicit_gemm_v4r4_nchw_kcyx_nkhw.cpp
...convolution_forward_implicit_gemm_v4r4_nchw_kcyx_nkhw.cpp
+4
-4
composable_kernel/src/kernel_wrapper/dynamic_convolution_forward_implicit_gemm_v4r5_nchw_kcyx_nkhw.cpp
...convolution_forward_implicit_gemm_v4r5_nchw_kcyx_nkhw.cpp
+4
-4
No files found.
composable_kernel/src/kernel_wrapper/dynamic_convolution_forward_implicit_gemm_v4r4_nchw_kcyx_nkhw.cpp
View file @
11ec07e9
...
...
@@ -226,17 +226,17 @@ extern "C" __global__ void
constexpr
auto
I2
=
Number
<
2
>
{};
constexpr
auto
in_n_c_hi_wi_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
64
,
4
,
35
,
35
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
28
,
28
));
constexpr
auto
wei_k_c_y_x_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
8
,
4
,
3
,
3
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
3
,
3
));
constexpr
auto
out_n_k_ho_wo_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
64
,
8
,
18
,
18
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
28
,
28
));
constexpr
auto
descs
=
transform_forward_convolution_into_gemm_v4r4_nchw_kcyx_nkhw_pad
(
wei_k_c_y_x_desc
,
in_n_c_hi_wi_desc
,
out_n_k_ho_wo_desc
,
make_tuple
(
2
,
2
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
));
...
...
composable_kernel/src/kernel_wrapper/dynamic_convolution_forward_implicit_gemm_v4r5_nchw_kcyx_nkhw.cpp
View file @
11ec07e9
...
...
@@ -236,18 +236,18 @@ extern "C" __global__ void
constexpr
auto
I2
=
Number
<
2
>
{};
constexpr
auto
in_n_c_hi_wi_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
64
,
4
,
35
,
35
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
28
,
28
));
constexpr
auto
wei_k_c_y_x_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
8
,
4
,
3
,
3
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
3
,
3
));
constexpr
auto
out_n_k_ho_wo_desc
=
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
64
,
8
,
18
,
18
));
make_dynamic_naive_tensor_descriptor_packed_v2
(
make_tuple
(
256
,
256
,
28
,
28
));
constexpr
auto
descs
=
transform_forward_convolution_into_contraction_v4r5_nchw_kcyx_nkhw_pad
<
N0
>
(
wei_k_c_y_x_desc
,
in_n_c_hi_wi_desc
,
out_n_k_ho_wo_desc
,
make_tuple
(
2
,
2
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
),
make_tuple
(
1
,
1
));
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment