Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
7b1ec41e
Commit
7b1ec41e
authored
Aug 06, 2021
by
Chao Liu
Browse files
refactor
parent
49c33aae
Changes
8
Hide whitespace changes
Inline
Side-by-side
Showing
8 changed files
with
5 additions
and
3 deletions
+5
-3
host/driver_offline/CMakeLists.txt
host/driver_offline/CMakeLists.txt
+1
-0
host/driver_online/CMakeLists.txt
host/driver_online/CMakeLists.txt
+1
-0
host/driver_online/include/online_device_dynamic_convolution_forward_implicit_gemm_v6r1_dlops_nchw_kcyx_nkhw.hpp
...ution_forward_implicit_gemm_v6r1_dlops_nchw_kcyx_nkhw.hpp
+3
-3
host/solver/include/conv_igemm_fwd_v6r1_dlops_nchw_kcyx_nkhw.hpp
...lver/include/conv_igemm_fwd_v6r1_dlops_nchw_kcyx_nkhw.hpp
+0
-0
host/solver/include/conv_tunable_fwd_v4r4_dlops_nchw_kcyx_nkhw.hpp
...er/include/conv_tunable_fwd_v4r4_dlops_nchw_kcyx_nkhw.hpp
+0
-0
host/solver/include/conv_tunable_fwd_v4r4_xdlops_nchw_kcyx_nkhw.hpp
...r/include/conv_tunable_fwd_v4r4_xdlops_nchw_kcyx_nkhw.hpp
+0
-0
host/solver/include/conv_tunable_fwd_v4r4_xdlops_nhwc_kyxc_nhwk.hpp
...r/include/conv_tunable_fwd_v4r4_xdlops_nhwc_kyxc_nhwk.hpp
+0
-0
host/solver/include/convolution_problem_descriptor.hpp
host/solver/include/convolution_problem_descriptor.hpp
+0
-0
No files found.
host/driver_offline/CMakeLists.txt
View file @
7b1ec41e
include_directories
(
BEFORE
include
${
PROJECT_SOURCE_DIR
}
/host/host_tensor/include
${
PROJECT_SOURCE_DIR
}
/host/solver/include
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include/utility
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include/tensor_description
...
...
host/driver_online/CMakeLists.txt
View file @
7b1ec41e
...
...
@@ -3,6 +3,7 @@ include_directories(BEFORE
${
PROJECT_BINARY_DIR
}
/host/online_compile/include
${
PROJECT_SOURCE_DIR
}
/host/online_compile/include
${
PROJECT_SOURCE_DIR
}
/host/host_tensor/include
${
PROJECT_SOURCE_DIR
}
/host/solver/include
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include/utility
${
PROJECT_SOURCE_DIR
}
/composable_kernel/include/tensor_description
...
...
host/driver_online/include/online_device_dynamic_convolution_forward_implicit_gemm_v6r1_dlops_nchw_kcyx_nkhw.hpp
View file @
7b1ec41e
...
...
@@ -106,7 +106,7 @@ void online_device_dynamic_convolution_forward_implicit_gemm_v6r1_dlops_nchw_kcy
std
::
vector
<
float
>
kernel1_times
;
std
::
vector
<
float
>
kernel2_times
;
for
(
index_t
i
=
0
;
i
<
nrepeat
;
++
i
)
for
(
index_t
i
=
0
;
i
<
nrepeat
+
1
;
++
i
)
{
KernelTimer
timer1
,
timer2
;
std
::
string
kernel_name
;
...
...
@@ -164,11 +164,11 @@ void online_device_dynamic_convolution_forward_implicit_gemm_v6r1_dlops_nchw_kcy
auto
ave_time1
=
std
::
accumulate
(
std
::
next
(
kernel1_times
.
begin
()),
kernel1_times
.
end
(),
0.
,
std
::
plus
<
float
>
{})
/
(
nrepeat
-
1
)
;
nrepeat
;
auto
ave_time2
=
std
::
accumulate
(
std
::
next
(
kernel2_times
.
begin
()),
kernel2_times
.
end
(),
0.
,
std
::
plus
<
float
>
{})
/
(
nrepeat
-
1
)
;
nrepeat
;
float
perf
=
(
float
)(
conv_problem_desc
.
CalculateFlop
())
/
(
std
::
size_t
(
1000
)
*
1000
*
1000
)
/
(
ave_time1
+
ave_time2
);
...
...
host/
driver_online
/include/conv_igemm_fwd_v6r1_dlops_nchw_kcyx_nkhw.hpp
→
host/
solver
/include/conv_igemm_fwd_v6r1_dlops_nchw_kcyx_nkhw.hpp
View file @
7b1ec41e
File moved
host/
driver_online
/include/conv_tunable_fwd_v4r4_dlops_nchw_kcyx_nkhw.hpp
→
host/
solver
/include/conv_tunable_fwd_v4r4_dlops_nchw_kcyx_nkhw.hpp
View file @
7b1ec41e
File moved
host/
driver_online
/include/conv_tunable_fwd_v4r4_xdlops_nchw_kcyx_nkhw.hpp
→
host/
solver
/include/conv_tunable_fwd_v4r4_xdlops_nchw_kcyx_nkhw.hpp
View file @
7b1ec41e
File moved
host/
driver_online
/include/conv_tunable_fwd_v4r4_xdlops_nhwc_kyxc_nhwk.hpp
→
host/
solver
/include/conv_tunable_fwd_v4r4_xdlops_nhwc_kyxc_nhwk.hpp
View file @
7b1ec41e
File moved
host/
driver_online
/include/convolution_problem_descriptor.hpp
→
host/
solver
/include/convolution_problem_descriptor.hpp
View file @
7b1ec41e
File moved
gaoqiong
@gaoqiong
mentioned in commit
6fe3627a
·
Dec 05, 2023
mentioned in commit
6fe3627a
mentioned in commit 6fe3627a9eb35f1237266f1b6cc8fd3456aed67d
Toggle commit list
gaoqiong
@gaoqiong
mentioned in commit
dfb80c4e
·
Dec 05, 2023
mentioned in commit
dfb80c4e
mentioned in commit dfb80c4e39ec7b304c3ebc88bab2a204bc4906b9
Toggle commit list
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment