Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
0aa899aa
"...composable_kernel_rocm.git" did not exist on "43a889b72e3faabf04c16ff410d387ce28486c3e"
Commit
0aa899aa
authored
Apr 06, 2022
by
Jehandad Khan
Browse files
add hipEvent based timing to kernels
parent
44757d6b
Changes
46
Hide whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
9 additions
and
7 deletions
+9
-7
library/include/ck/library/reference_tensor_operation/cpu/reference_gemm_bias_activation.hpp
...e_tensor_operation/cpu/reference_gemm_bias_activation.hpp
+1
-1
library/include/ck/library/reference_tensor_operation/cpu/reference_gemm_bias_activation_add.hpp
...nsor_operation/cpu/reference_gemm_bias_activation_add.hpp
+1
-1
library/src/tensor_operation_instance/gpu/CMakeLists.txt
library/src/tensor_operation_instance/gpu/CMakeLists.txt
+0
-1
library/src/tensor_operation_instance/gpu/device_conv2d.cpp
library/src/tensor_operation_instance/gpu/device_conv2d.cpp
+4
-4
profiler/CMakeLists.txt
profiler/CMakeLists.txt
+2
-0
test/CMakeLists.txt
test/CMakeLists.txt
+1
-0
No files found.
library/include/ck/library/reference_tensor_operation/cpu/reference_gemm_bias_activation.hpp
View file @
0aa899aa
...
...
@@ -85,7 +85,7 @@ struct ReferenceGemmBiasActivation : public device::BaseOperator
return
0
;
}
float
Run
(
const
device
::
BaseArgument
*
p_arg
,
int
,
hipStream_t
)
override
float
Run
(
const
device
::
BaseArgument
*
p_arg
,
int
,
hipStream_t
,
bool
)
override
{
return
Run
(
*
dynamic_cast
<
const
Argument
*>
(
p_arg
));
}
...
...
library/include/ck/library/reference_tensor_operation/cpu/reference_gemm_bias_activation_add.hpp
View file @
0aa899aa
...
...
@@ -91,7 +91,7 @@ struct ReferenceGemmBiasActivationAdd : public device::BaseOperator
return
0
;
}
float
Run
(
const
device
::
BaseArgument
*
p_arg
,
int
,
hipStream_t
)
override
float
Run
(
const
device
::
BaseArgument
*
p_arg
,
int
,
hipStream_t
,
bool
)
override
{
return
Run
(
*
dynamic_cast
<
const
Argument
*>
(
p_arg
));
}
...
...
library/src/tensor_operation_instance/gpu/CMakeLists.txt
View file @
0aa899aa
...
...
@@ -82,7 +82,6 @@ PUBLIC -DCK_AMD_GPU_GFX908)
target_compile_options
(
device_operations
PRIVATE -amdgpu-target=gfx908
PRIVATE -O3
)
# install(TARGETS device_operations LIBRARY DESTINATION lib)
install
(
TARGETS device_operations
...
...
library/src/tensor_operation_instance/gpu/device_conv2d.cpp
View file @
0aa899aa
...
...
@@ -37,12 +37,12 @@ struct DeviceConvFwdPtr_t::DeviceConvFwdPtrImpl
std
::
vector
<
ck
::
index_t
>
conv_filter_strides
,
std
::
vector
<
ck
::
index_t
>
conv_filter_dilations
,
std
::
vector
<
ck
::
index_t
>
input_left_pads
,
std
::
vector
<
ck
::
index_t
>
input_right_pads
)
std
::
vector
<
ck
::
index_t
>
input_right_pads
)
const
{
return
el
->
MakeArgumentPointer
(
in_ptr
,
wei_ptr
,
out_ptr
,
N
,
K
,
C
,
input_spatial_lengths
,
filter_spatial_lengths
,
output_spatial_lengths
,
conv_filter_strides
,
conv_filter_dilations
,
input_left_pads
,
input_right_pads
,
PassThrough
{},
PassThrough
{},
PassThrough
{});
}
std
::
unique_ptr
<
DeviceConvFwdPtr_t
::
BaseInvoker
>
MakeInvokerPointer
()
std
::
unique_ptr
<
DeviceConvFwdPtr_t
::
BaseInvoker
>
MakeInvokerPointer
()
const
{
return
el
->
MakeInvokerPointer
();
}
...
...
@@ -73,13 +73,13 @@ std::unique_ptr<DeviceConvFwdPtr_t::BaseArgument> DeviceConvFwdPtr_t::MakeArgume
std
::
vector
<
ck
::
index_t
>
conv_filter_strides
,
std
::
vector
<
ck
::
index_t
>
conv_filter_dilations
,
std
::
vector
<
ck
::
index_t
>
input_left_pads
,
std
::
vector
<
ck
::
index_t
>
input_right_pads
)
std
::
vector
<
ck
::
index_t
>
input_right_pads
)
const
{
return
pImpl
->
MakeArgumentPointer
(
in_ptr
,
wei_ptr
,
out_ptr
,
N
,
K
,
C
,
input_spatial_lengths
,
filter_spatial_lengths
,
output_spatial_lengths
,
conv_filter_strides
,
conv_filter_dilations
,
input_left_pads
,
input_right_pads
);
}
std
::
unique_ptr
<
DeviceConvFwdPtr_t
::
BaseInvoker
>
DeviceConvFwdPtr_t
::
MakeInvokerPointer
()
std
::
unique_ptr
<
DeviceConvFwdPtr_t
::
BaseInvoker
>
DeviceConvFwdPtr_t
::
MakeInvokerPointer
()
const
{
return
pImpl
->
MakeInvokerPointer
();
}
...
...
profiler/CMakeLists.txt
View file @
0aa899aa
...
...
@@ -49,3 +49,5 @@ target_link_libraries(ckProfiler PRIVATE device_conv2d_fwd_bias_relu_add_instanc
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_fwd_bias_relu_atomic_add_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_bwd_data_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_reduce_instance
)
set_target_properties
(
ckProfiler PROPERTIES EXCLUDE_FROM_ALL 1
)
\ No newline at end of file
test/CMakeLists.txt
View file @
0aa899aa
...
...
@@ -28,6 +28,7 @@ function(add_test_executable TEST_NAME)
add_test
(
NAME
${
TEST_NAME
}
COMMAND $<TARGET_FILE:
${
TEST_NAME
}
>
)
add_dependencies
(
tests
${
TEST_NAME
}
)
add_dependencies
(
check
${
TEST_NAME
}
)
set_target_properties
(
${
TEST_NAME
}
PROPERTIES EXCLUDE_FROM_ALL 1
)
endfunction
(
add_test_executable TEST_NAME
)
add_subdirectory
(
magic_number_division
)
...
...
Prev
1
2
3
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment