Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
e276fc95
Commit
e276fc95
authored
Dec 05, 2023
by
Artur Wojcik
Browse files
merge 'uif2-temp' to uif2-initial
parent
9b3a0d42
Changes
27
Show whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
8 additions
and
20 deletions
+8
-20
example/34_batchnorm/batchnorm_infer_impl.hpp
example/34_batchnorm/batchnorm_infer_impl.hpp
+2
-2
example/CMakeLists.txt
example/CMakeLists.txt
+4
-4
include/ck/tensor_operation/gpu/grid/gridwise_elementwise_layernorm_welford_variance.hpp
.../grid/gridwise_elementwise_layernorm_welford_variance.hpp
+2
-2
library/CMakeLists.txt
library/CMakeLists.txt
+0
-3
library/src/tensor_operation_instance/gpu/CMakeLists.txt
library/src/tensor_operation_instance/gpu/CMakeLists.txt
+0
-3
library/src/utility/CMakeLists.txt
library/src/utility/CMakeLists.txt
+0
-3
test/CMakeLists.txt
test/CMakeLists.txt
+0
-3
No files found.
example/34_batchnorm/batchnorm_infer_impl.hpp
View file @
e276fc95
...
...
@@ -36,7 +36,7 @@ int bnorm_infer(
const
void
*
p_x
,
const
void
*
p_scale
,
const
void
*
p_bias
,
double
_
epsilon
,
double
epsilon
,
const
void
*
p_estimatedMean
,
const
void
*
p_estimatedVariance
,
void
*
p_y
)
...
...
@@ -101,7 +101,7 @@ int bnorm_infer(
{
yStrides
},
{
p_x
,
p_estimatedMean
,
p_estimatedVariance
,
p_scale
,
p_bias
},
{
p_y
},
NormalizeInInfer
{
_
epsilon
});
NormalizeInInfer
{
epsilon
});
if
(
!
dev_normalize
.
IsSupportedArgument
(
argument_ptr1
.
get
()))
{
...
...
example/CMakeLists.txt
View file @
e276fc95
...
...
@@ -47,7 +47,7 @@ function(add_example_executable EXAMPLE_NAME FILE_NAME)
#only continue if there are some source files left on the list
if
(
FILE_NAME
)
add_executable
(
${
EXAMPLE_NAME
}
${
FILE_NAME
}
)
target_link_libraries
(
${
EXAMPLE_NAME
}
PRIVATE utility
getopt::getopt
)
target_link_libraries
(
${
EXAMPLE_NAME
}
PRIVATE utility
)
add_test
(
NAME
${
EXAMPLE_NAME
}
COMMAND $<TARGET_FILE:
${
EXAMPLE_NAME
}
>
${
ARGN
}
)
add_dependencies
(
examples
${
EXAMPLE_NAME
}
)
add_dependencies
(
check
${
EXAMPLE_NAME
}
)
...
...
@@ -56,7 +56,7 @@ function(add_example_executable EXAMPLE_NAME FILE_NAME)
endif
()
#message("add_example returns ${result}")
set
(
result
${
result
}
PARENT_SCOPE
)
endfunction
()
endfunction
(
add_example_executable EXAMPLE_NAME
)
function
(
add_example_dependencies EXAMPLE_NAME FILE_NAME
)
if
(
result EQUAL 0
)
...
...
@@ -106,14 +106,14 @@ function(add_example_executable_no_testing EXAMPLE_NAME FILE_NAME)
#only continue if there are some source files left on the list
if
(
FILE_NAME
)
add_executable
(
${
EXAMPLE_NAME
}
${
FILE_NAME
}
)
target_link_libraries
(
${
EXAMPLE_NAME
}
PRIVATE utility
getopt::getopt
)
target_link_libraries
(
${
EXAMPLE_NAME
}
PRIVATE utility
)
add_dependencies
(
examples
${
EXAMPLE_NAME
}
)
rocm_install
(
TARGETS
${
EXAMPLE_NAME
}
COMPONENT examples
)
set
(
result 0
)
endif
()
#message("add_example returns ${result}")
set
(
result
${
result
}
PARENT_SCOPE
)
endfunction
()
endfunction
(
add_example_executable_no_testing EXAMPLE_NAME
)
# add all example subdir
file
(
GLOB dir_list LIST_DIRECTORIES true *
)
...
...
include/ck/tensor_operation/gpu/grid/gridwise_elementwise_layernorm_welford_variance.hpp
View file @
e276fc95
...
...
@@ -119,7 +119,7 @@ struct GridwiseElementwiseLayernormWelfordVariance_mk_to_mk
index_t
num_k_block_tile_iteration
,
AccDataType
epsilon
,
const
InDataTypePointerTuple
p_in_global_tuple
,
XDataType
*
const
__restrict__
_
p_x_lds
,
XDataType
*
const
__restrict__
p_x_lds
_
,
const
GammaDataType
*
const
__restrict__
p_gamma_global
,
const
BetaDataType
*
const
__restrict__
p_beta_global
,
YDataType
*
const
__restrict__
p_y_global
,
...
...
@@ -149,7 +149,7 @@ struct GridwiseElementwiseLayernormWelfordVariance_mk_to_mk
p_y_global
,
y_grid_desc_m_k
.
GetElementSpaceSize
());
auto
x_lds_val_buf
=
make_dynamic_buffer
<
AddressSpaceEnum
::
Lds
>
(
_
p_x_lds
,
x_grid_desc_m_k
.
GetElementSpaceSize
()
/
grid_size
);
p_x_lds
_
,
x_grid_desc_m_k
.
GetElementSpaceSize
()
/
grid_size
);
auto
in_thread_buf_tuple
=
generate_tuple
(
[
&
](
auto
)
{
...
...
library/CMakeLists.txt
View file @
e276fc95
# SPDX-License-Identifier: MIT
# Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.
add_subdirectory
(
src/tensor_operation_instance/gpu
)
add_subdirectory
(
src/utility
)
library/src/tensor_operation_instance/gpu/CMakeLists.txt
View file @
e276fc95
# SPDX-License-Identifier: MIT
# Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.
function
(
add_instance_library INSTANCE_NAME
)
message
(
"adding instance
${
INSTANCE_NAME
}
"
)
set
(
result 1
)
...
...
library/src/utility/CMakeLists.txt
View file @
e276fc95
# SPDX-License-Identifier: MIT
# Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.
add_library
(
utility STATIC
device_memory.cpp
host_tensor.cpp
...
...
test/CMakeLists.txt
View file @
e276fc95
# SPDX-License-Identifier: MIT
# Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.
include_directories
(
BEFORE
${
PROJECT_SOURCE_DIR
}
/
${
PROJECT_SOURCE_DIR
}
/profiler/include
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment