Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
207021c0
Commit
207021c0
authored
Jun 23, 2020
by
Chao Liu
Browse files
update build script
parent
a4adf0ac
Changes
8
Hide whitespace changes
Inline
Side-by-side
Showing
8 changed files
with
36 additions
and
33 deletions
+36
-33
script/cmake-cuda.sh
script/cmake-cuda.sh
+11
-12
script/cmake-rocm3.1.sh
script/cmake-rocm3.1.sh
+3
-3
script/cmake-rocm3.5.sh
script/cmake-rocm3.5.sh
+22
-0
script/compile-rocm3.1.sh
script/compile-rocm3.1.sh
+0
-0
script/docker-cuda.sh
script/docker-cuda.sh
+0
-3
script/hack_isa.sh
script/hack_isa.sh
+0
-9
script/trace.sh
script/trace.sh
+0
-3
script/tracer-hip.sh
script/tracer-hip.sh
+0
-3
No files found.
script/cmake-cuda.sh
View file @
207021c0
#!/bin/bash
rm
-f
CMakeCache.txt
rm
-f
*
.cmake
rm
-rf
CMakeFiles
MY_PROJECT_SOURCE
=
/home/chao/code/modular_convolution
MY_PROJECT_SOURCE
=
../
MY_PROJECT_INSTALL
=
../install.dir
export
CUDA_ROOT
=
/usr/local/cuda
export
CPATH
=
$CPATH
:
$CUDA_ROOT
/include
export
LIBRARY_PATH
=
$LIBRARY_PATH
:
$CUDA_ROOT
/lib64
export
LD_LIBRARY_PATH
=
$LD_LIBRARY_PATH
:
$CUDA_ROOT
/lib64
cmake
\
-D
CMAKE_INSTALL_PREFIX
=
${
MY_PROJECT_INSTALL
}
\
-D
CMAKE_CXX_COMPILER
=
clang++
\
-D
CMAKE_CXX_COMPILER
=
clang++
-6.0
\
-D
CMAKE_BUILD_TYPE
=
Release
\
-D
CMAKE_VERBOSE_MAKEFILE:BOOL
=
ON
\
-D
DEVICE_BACKEND
=
NVIDIA
\
-D
CUDA_COMMON_INCLUDE_DIR
=
"/
package/install/cuda/10.1
/NVIDIA_CUDA-10.1_Samples/common/inc"
\
-D
CMAKE_CUDA_FLAGS
=
"-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_
61
,code=sm_
61
-Xptxas -v -maxrregcount=128"
\
-D
CUDA_COMMON_INCLUDE_DIR
=
"/
root
/NVIDIA_CUDA-10.1_Samples/common/inc"
\
-D
CMAKE_CUDA_FLAGS
=
"-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_
70
,code=sm_
70
-Xptxas -v -maxrregcount=128"
\
${
MY_PROJECT_SOURCE
}
#-D BOOST_ROOT="/package/install/boost_1.67.0" \
#-D CMAKE_CUDA_COMPILER="/package/install/cuda_10.0/bin/nvcc" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_61,code=sm_61" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_61,code=sm_61 -Xptxas -v -maxrregcount=128" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_70,code=sm_70" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_70,code=sm_70 -Xptxas -v -maxrregcount=128" \
script/cmake-
hip
.sh
→
script/cmake-
rocm3.1
.sh
View file @
207021c0
#!/bin/bash
rm
-f
CMakeCache.txt
rm
-f
*
.cmake
rm
-rf
CMakeFiles
...
...
@@ -11,9 +10,10 @@ cmake
-D
CMAKE_INSTALL_PREFIX
=
${
MY_PROJECT_INSTALL
}
\
-D
CMAKE_BUILD_TYPE
=
Release
\
-D
DEVICE_BACKEND
=
"AMD"
\
-D
HIP_HIPCC_FLAGS
=
"
${
HIP_HIPCC_FLAGS
}
-gline-tables-only -v"
\
-D
CMAKE_CXX_FLAGS
=
"-gline-tables-only --amdgpu-target=gfx906"
\
-D
CMAKE_CXX_FLAGS
=
"--amdgpu-target=gfx906"
\
-D
CMAKE_CXX_COMPILER
=
/opt/rocm/hip/bin/hipcc
\
-D
CMAKE_PREFIX_PATH
=
"/opt/rocm"
\
-D
CMAKE_VERBOSE_MAKEFILE:BOOL
=
ON
\
${
MY_PROJECT_SOURCE
}
#-D CMAKE_CXX_FLAGS="-gline-tables-only -v --amdgpu-target=gfx906" \
script/cmake-
cuda_docker
.sh
→
script/cmake-
rocm3.5
.sh
View file @
207021c0
#!/bin/bash
rm
-f
CMakeCache.txt
rm
-f
*
.cmake
rm
-rf
CMakeFiles
MY_PROJECT_SOURCE
=
../
MY_PROJECT_SOURCE
=
../
../../
MY_PROJECT_INSTALL
=
../install.dir
export
CUDA_ROOT
=
/usr/local/cuda
export
CPATH
=
$CPATH
:
$CUDA_ROOT
/include
export
LIBRARY_PATH
=
$LIBRARY_PATH
:
$CUDA_ROOT
/lib64
export
LD_LIBRARY_PATH
=
$LD_LIBRARY_PATH
:
$CUDA_ROOT
/lib64
cmake
\
-D
CMAKE_INSTALL_PREFIX
=
${
MY_PROJECT_INSTALL
}
\
-D
CMAKE_CXX_COMPILER
=
clang++-6.0
\
-D
CMAKE_BUILD_TYPE
=
Release
\
-D
DEVICE_BACKEND
=
"AMD"
\
-D
CMAKE_CXX_FLAGS
=
"-O3 --amdgpu-target=gfx906 -mllvm --amdgpu-enable-global-sgpr-addr -mllvm --amdgpu-spill-vgpr-to-agpr=0"
\
-D
CMAKE_CXX_COMPILER
=
/opt/rocm/bin/hipcc
\
-D
CMAKE_PREFIX_PATH
=
"/opt/rocm"
\
-D
CMAKE_VERBOSE_MAKEFILE:BOOL
=
ON
\
-D
DEVICE_BACKEND
=
NVIDIA
\
-D
CUDA_COMMON_INCLUDE_DIR
=
"/root/NVIDIA_CUDA-10.1_Samples/common/inc"
\
-D
CMAKE_CUDA_FLAGS
=
"-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_70,code=sm_70 -Xptxas -v -maxrregcount=128"
\
${
MY_PROJECT_SOURCE
}
#-D HIP_HIPCC_FLAGS="${HIP_HIPCC_FLAGS} -gline-tables-only -v" \
#-D CMAKE_CXX_FLAGS="-gline-tables-only --amdgpu-target=gfx906" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_70,code=sm_70" \
#-D CMAKE_CUDA_FLAGS="-ccbin clang++ -m64 -Xcompiler -fopenmp -lineinfo --source-in-ptx -keep -Xptxas -v -gencode=arch=compute_70,code=sm_70 -Xptxas -v -maxrregcount=128" \
script/compile-
hip
.sh
→
script/compile-
rocm3.1
.sh
View file @
207021c0
File moved
script/docker-cuda.sh
deleted
100755 → 0
View file @
a4adf0ac
WORKSPACE
=
$1
echo
"workspace: "
$WORKSPACE
sudo
docker run
-it
-v
$WORKSPACE
:/root/workspace
--group-add
sudo
--runtime
=
nvidia asroy/cuda:10.1-cudnn7-devel-ubuntu18.04-latest /bin/bash
script/hack_isa.sh
deleted
100755 → 0
View file @
a4adf0ac
# step 1: GET ISA DUMP
#cd /root/workspace/mlopen/modular_convolution/build/hipcc/build.dir/driver && KMDUMPISA=1 /opt/rocm/hip/bin/hipcc -I/root/workspace/mlopen/modular_convolution/build/hipcc/build.dir/composable_kernel/include/utility -I/root/workspace/mlopen/modular_convolution/driver/include -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/kernel_algorithm -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/tensor_operation -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/tensor_description -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/utility -I/root/workspace/mlopen/modular_convolution/composable_kernel/include -gline-tables-only --amdgpu-target=gfx906 -fopenmp=libomp -O3 -DNDEBUG -std=c++14 -o CMakeFiles/driver.dir/src/driver.cpp.o -c /root/workspace/mlopen/modular_convolution/driver/src/driver.cpp -fno-gpu-rdc
# step 2: HACK ISA
#cd /root/workspace/mlopen/modular_convolution/build/hipcc/build.dir/driver && KMHACKISA=1 /opt/rocm/hip/bin/hipcc -I/root/workspace/mlopen/modular_convolution/build/hipcc/build.dir/composable_kernel/include/utility -I/root/workspace/mlopen/modular_convolution/driver/include -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/kernel_algorithm -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/tensor_operation -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/tensor_description -I/root/workspace/mlopen/modular_convolution/composable_kernel/include/utility -I/root/workspace/mlopen/modular_convolution/composable_kernel/include -gline-tables-only --amdgpu-target=gfx906 -fopenmp=libomp -O3 -DNDEBUG -std=c++14 -o CMakeFiles/driver.dir/src/driver.cpp.o -c /root/workspace/mlopen/modular_convolution/driver/src/driver.cpp -fno-gpu-rdc
# step 3: LINK
#/opt/rocm/hip/bin/hipcc -gline-tables-only --amdgpu-target=gfx906 -fopenmp=libomp -O3 -DNDEBUG CMakeFiles/driver.dir/src/driver.cpp.o -o driver -rdynamic libhost.so -Wl,-rpath,/root/workspace/mlopen/modular_convolution/build/hipcc/build.dir/driver
script/trace.sh
deleted
100755 → 0
View file @
a4adf0ac
#!/bin/bash
/root/workspace/rocprofiler_pkg/bin/rpl_run.sh
--timestamp
on
-i
/root/workspace/rocprofiler_pkg/input.xml
-d
./trace ./driver/driver 0 10
script/tracer-hip.sh
deleted
100755 → 0
View file @
a4adf0ac
#!/bin/bash
/root/workspace/rocprofiler_pkg/bin/rpl_run.sh
--timestamp
on
-i
/root/workspace/rocprofiler_pkg/input.xml
-d
./trace ./driver/driver 0 10
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment