Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
49de8944
"vscode:/vscode.git/clone" did not exist on "a402431de07be1c7cfc471a406b7c64998d96f02"
Unverified
Commit
49de8944
authored
Feb 16, 2023
by
Rostyslav Geyyer
Committed by
GitHub
Feb 16, 2023
Browse files
Merge branch 'develop' into lwpck-471
parents
340cb150
bef0cb20
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
10 additions
and
3 deletions
+10
-3
Jenkinsfile
Jenkinsfile
+9
-3
include/ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_permute_xdl_cshuffle.hpp
...device_batched_gemm_softmax_gemm_permute_xdl_cshuffle.hpp
+1
-0
No files found.
Jenkinsfile
View file @
49de8944
...
@@ -471,6 +471,12 @@ def Build_CK(Map conf=[:]){
...
@@ -471,6 +471,12 @@ def Build_CK(Map conf=[:]){
//we only need the ckProfiler to run the performance tests, so we pack and stash it
//we only need the ckProfiler to run the performance tests, so we pack and stash it
sh
'tar -zcvf ckProfiler.tar.gz bin/ckProfiler'
sh
'tar -zcvf ckProfiler.tar.gz bin/ckProfiler'
stash
"ckProfiler.tar.gz"
stash
"ckProfiler.tar.gz"
if
(
params
.
RUN_FULL_QA
){
// build deb packages
sh
'make -j package'
archiveArtifacts
artifacts:
'composablekernel-ckprofiler_*.deb'
archiveArtifacts
artifacts:
'composablekernel-tests_*.deb'
}
}
}
}
}
}
}
...
@@ -651,8 +657,8 @@ pipeline {
...
@@ -651,8 +657,8 @@ pipeline {
{
{
agent
{
label
rocmnode
(
"gfx908 || gfx90a"
)
}
agent
{
label
rocmnode
(
"gfx908 || gfx90a"
)
}
environment
{
environment
{
setup_args
=
"${params.COMPILER_VERSION == "
ck
-
9110
" ? """
-
DBUILD_DEV
=
Off
-
DCMAKE_INSTALL_PREFIX
=..
/install -DGPU_TARGETS="gfx908;gfx90a" -DCMAKE_CXX_FLAGS="-O3 -Xclang -mlink-builtin-bitcode -Xclang /
opt
/rocm/
amdgcn
/bitcode/
oclc_abi_version_400
.
bc
" """
:
""" -DBUILD_DEV=Off -DCMAKE_INSTALL_PREFIX=../install -DGPU_TARGETS="gfx908;gfx90a" -DCMAKE_CXX_FLAGS="-O3 " """
}
"
setup_args
=
"${params.COMPILER_VERSION == "
ck
-
9110
" ? """
-
DBUILD_DEV
=
Off
-
DCMAKE_INSTALL_PREFIX
=..
/install -DGPU_TARGETS="gfx908;gfx90a
;gfx1030
" -DCMAKE_CXX_FLAGS="-O3 -Xclang -mlink-builtin-bitcode -Xclang /
opt
/rocm/
amdgcn
/bitcode/
oclc_abi_version_400
.
bc
" """
:
""" -DBUILD_DEV=Off -DCMAKE_INSTALL_PREFIX=../install -DGPU_TARGETS="gfx908;gfx90a
;gfx1030
" -DCMAKE_CXX_FLAGS="-O3 " """
}
"
execute_args
=
"${params.COMPILER_VERSION == "
ck
-
9110
" ? """
cd
..
/client_example && rm -rf build && mkdir build && cd build && cmake -D CMAKE_PREFIX_PATH="${env.WORKSPACE}/
install
;
/opt/
rocm
" -DGPU_TARGETS="
gfx908
;
gfx90a
" -DCMAKE_CXX_FLAGS="
-
O3
-
Xclang
-
mlink
-
builtin
-
bitcode
-
Xclang
/opt/
rocm
/amdgcn/
bitcode
/oclc_abi_version_400.bc" -D CMAKE_CXX_COMPILER="${build_compiler()}" .. && make -j """ : """ cd ../
client_example
&&
rm
-
rf
build
&&
mkdir
build
&&
cd
build
&&
cmake
-
D
CMAKE_PREFIX_PATH
=
"${env.WORKSPACE}/install;/opt/rocm"
-
DGPU_TARGETS
=
"gfx908,gfx90a"
-
DCMAKE_CXX_FLAGS
=
"-O3"
-
D
CMAKE_CXX_COMPILER
=
"${build_compiler()}"
..
&&
make
-
j
""" }"
execute_args
=
"${params.COMPILER_VERSION == "
ck
-
9110
" ? """
cd
..
/client_example && rm -rf build && mkdir build && cd build && cmake -D CMAKE_PREFIX_PATH="${env.WORKSPACE}/
install
;
/opt/
rocm
" -DGPU_TARGETS="
gfx908
;
gfx90a
;
gfx1030
" -DCMAKE_CXX_FLAGS="
-
O3
-
Xclang
-
mlink
-
builtin
-
bitcode
-
Xclang
/opt/
rocm
/amdgcn/
bitcode
/oclc_abi_version_400.bc" -D CMAKE_CXX_COMPILER="${build_compiler()}" .. && make -j """ : """ cd ../
client_example
&&
rm
-
rf
build
&&
mkdir
build
&&
cd
build
&&
cmake
-
D
CMAKE_PREFIX_PATH
=
"${env.WORKSPACE}/install;/opt/rocm"
-
DGPU_TARGETS
=
"gfx908,gfx90a
;gfx1030
"
-
DCMAKE_CXX_FLAGS
=
"-O3"
-
D
CMAKE_CXX_COMPILER
=
"${build_compiler()}"
..
&&
make
-
j
""" }"
}
}
steps{
steps{
Build_CK_and_Reboot(setup_args: setup_args, config_targets: "install", no_reboot:true, build_type: 'Release', execute_cmd: execute_args, prefixpath: '/usr/local')
Build_CK_and_Reboot(setup_args: setup_args, config_targets: "install", no_reboot:true, build_type: 'Release', execute_cmd: execute_args, prefixpath: '/usr/local')
...
@@ -674,7 +680,7 @@ pipeline {
...
@@ -674,7 +680,7 @@ pipeline {
options { retry(2) }
options { retry(2) }
agent{ label rocmnode("gfx908 || gfx90a")}
agent{ label rocmnode("gfx908 || gfx90a")}
environment{
environment{
setup_args = "${params.COMPILER_VERSION == "ck-9110" ? """
-
DGPU_TARGETS
=
"gfx908;gfx90a"
-
DCMAKE_CXX_FLAGS
=
" -O3 -Xclang -mlink-builtin-bitcode -Xclang /opt/rocm/amdgcn/bitcode/oclc_abi_version_400.bc"
-
DBUILD_DEV
=
On
""" : """
-
DGPU_TARGETS
=
"gfx908;gfx90a"
-
DCMAKE_CXX_FLAGS
=
" -O3 "
-
DBUILD_DEV
=
On
"""}"
setup_args = "${params.COMPILER_VERSION == "ck-9110" ? """
-
DGPU_TARGETS
=
"gfx908;gfx90a
;gfx1030
"
-
DCMAKE_CXX_FLAGS
=
" -O3 -Xclang -mlink-builtin-bitcode -Xclang /opt/rocm/amdgcn/bitcode/oclc_abi_version_400.bc"
-
DBUILD_DEV
=
On
""" : """
-
DGPU_TARGETS
=
"gfx908;gfx90a
;gfx1030
"
-
DCMAKE_CXX_FLAGS
=
" -O3 "
-
DBUILD_DEV
=
On
"""}"
}
}
steps{
steps{
runPerfTest(setup_args:setup_args, config_targets: "ckProfiler", no_reboot:true, build_type: 'Release')
runPerfTest(setup_args:setup_args, config_targets: "ckProfiler", no_reboot:true, build_type: 'Release')
...
...
include/ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_permute_xdl_cshuffle.hpp
View file @
49de8944
...
@@ -111,6 +111,7 @@ __global__ void
...
@@ -111,6 +111,7 @@ __global__ void
ignore
=
p_b_grid
;
ignore
=
p_b_grid
;
ignore
=
p_b1_grid
;
ignore
=
p_b1_grid
;
ignore
=
p_c_grid
;
ignore
=
p_c_grid
;
ignore
=
p_d0s_grid
;
ignore
=
a_element_op
;
ignore
=
a_element_op
;
ignore
=
b_element_op
;
ignore
=
b_element_op
;
ignore
=
c0de_element_op
;
ignore
=
c0de_element_op
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment