Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
bitsandbytes
Commits
f2dd7032
Commit
f2dd7032
authored
Jul 25, 2022
by
Tim Dettmers
Browse files
Added matmul build and flags.
parent
9268dc9d
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
170 additions
and
24 deletions
+170
-24
Makefile
Makefile
+25
-8
deploy_from_slurm.sh
deploy_from_slurm.sh
+145
-16
No files found.
Makefile
View file @
f2dd7032
...
...
@@ -27,14 +27,13 @@ COMPUTE_CAPABILITY += -gencode arch=compute_60,code=sm_60 # Pascal
COMPUTE_CAPABILITY
+=
-gencode
arch
=
compute_61,code
=
sm_61
# Pascal
COMPUTE_CAPABILITY
+=
-gencode
arch
=
compute_70,code
=
sm_70
# Volta
COMPUTE_CAPABILITY
+=
-gencode
arch
=
compute_72,code
=
sm_72
# Volta
COMPUTE_CAPABILITY
:=
-gencode
arch
=
compute_75,code
=
sm_75
# Turing
# CUDA 9.2 supports CC 3.0, but CUDA >= 11.0 does not
CC_CUDA92
:=
-gencode
arch
=
compute_30,code
=
sm_30
# Later versions of CUDA support the new architectures
CC_CUDA10x
:=
-gencode
arch
=
compute_30,code
=
sm_30
CC_CUDA10x
:
=
-gencode
arch
=
compute_75,code
=
sm_75
CC_CUDA10x
+
=
-gencode
arch
=
compute_75,code
=
sm_75
CC_CUDA110
:=
-gencode
arch
=
compute_75,code
=
sm_75
CC_CUDA110
+=
-gencode
arch
=
compute_80,code
=
sm_80
...
...
@@ -43,6 +42,14 @@ CC_CUDA11x := -gencode arch=compute_75,code=sm_75
CC_CUDA11x
+=
-gencode
arch
=
compute_80,code
=
sm_80
CC_CUDA11x
+=
-gencode
arch
=
compute_86,code
=
sm_86
CC_cublasLt110
:=
-gencode
arch
=
compute_75,code
=
sm_75
CC_cublasLt110
+=
-gencode
arch
=
compute_80,code
=
sm_80
CC_cublasLt111
:=
-gencode
arch
=
compute_75,code
=
sm_75
CC_cublasLt111
+=
-gencode
arch
=
compute_80,code
=
sm_80
CC_cublasLt111
+=
-gencode
arch
=
compute_86,code
=
sm_86
all
:
$(ROOT_DIR)/dependencies/cub $(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
-D
NO_CUBLASLT
$(NVCC)
$(COMPUTE_CAPABILITY)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
...
...
@@ -53,21 +60,31 @@ cuda92: $(ROOT_DIR)/dependencies/cub $(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA92)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cuda10x
:
$(ROOT_DIR)/dependencies/cub $(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA10x)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
cuda10x
_nomatmul
:
$(ROOT_DIR)/dependencies/cub $(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA10x)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
-D
NO_CUBLASLT
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA10x)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cuda110
:
$(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA110)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
cuda110
_nomatmul
:
$(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA110)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
-D
NO_CUBLASLT
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA110)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cuda11x
:
$(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA11x)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
cuda11x
_nomatmul
:
$(BUILD_DIR) env
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA11x)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
-D
NO_CUBLASLT
$(NVCC)
$(COMPUTE_CAPABILITY)
$(CC_CUDA11x)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cuda110
:
$(BUILD_DIR) env
$(NVCC)
$(CC_cublasLt110)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
$(NVCC)
$(CC_cublasLt110)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cuda11x
:
$(BUILD_DIR) env
$(NVCC)
$(CC_cublasLt111)
-Xcompiler
'-fPIC'
--use_fast_math
-Xptxas
=
-v
-dc
$(FILES_CUDA)
$(INCLUDE)
$(LIB)
--output-directory
$(BUILD_DIR)
$(NVCC)
$(CC_cublasLt111)
-Xcompiler
'-fPIC'
-dlink
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
-o
$(BUILD_DIR)
/link.o
$(GPP)
-std
=
c++14
-DBUILD_CUDA
-shared
-fPIC
$(INCLUDE)
$(BUILD_DIR)
/ops.o
$(BUILD_DIR)
/kernels.o
$(BUILD_DIR)
/link.o
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
$(LIB)
cpuonly
:
$(BUILD_DIR) env
$(GPP)
-std
=
c++14
-shared
-fPIC
-I
$(ROOT_DIR)
/csrc
-I
$(ROOT_DIR)
/include
$(FILES_CPP)
-o
./bitsandbytes/libbitsandbytes.so
...
...
deploy_from_slurm.sh
View file @
f2dd7032
...
...
@@ -4,88 +4,217 @@ BASE_PATH=$1
module unload cuda
module unload gcc
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.0
#make cuda110
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=110 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.1
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=111 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.2
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=112 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.3
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=113 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.4
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=114 python -m build
###python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.5
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=115 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.6
#
#make cuda11x
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=116 python -m build
##python -m twine upload dist/* --verbose
#
#rm -rf dist build
#make clean
#make cleaneggs
#export CUDA_HOME=$BASE_PATH/cuda-11.7
#make cuda11x
#
#if [ ! -f "./bitsandbytes/libbitsandbytes.so" ]; then
# # Control will enter here if $DIRECTORY doesn't exist.
# echo "Compilation unsuccessul!" 1>&2
# exit 64
#fi
##CUDA_VERSION=117 python -m build
##python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-10.2
make cuda10x_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=102-nomatmul python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.0
make cuda110
make cuda110
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=110 python -m build
#CUDA_VERSION=110
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.1
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=111 python -m build
#CUDA_VERSION=111
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.2
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=112 python -m build
#CUDA_VERSION=112
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.3
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=113 python -m build
#CUDA_VERSION=113
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.4
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=114 python -m build
#CUDA_VERSION=114
-nomatmul
python -m build
##python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.5
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=115 python -m build
#CUDA_VERSION=115
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
...
...
@@ -93,25 +222,25 @@ make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.6
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=116 python -m build
#CUDA_VERSION=116
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
rm
-rf
dist build
make clean
make cleaneggs
export
CUDA_HOME
=
$BASE_PATH
/cuda-11.7
make cuda11x
make cuda11x
_nomatmul
if
[
!
-f
"./bitsandbytes/libbitsandbytes.so"
]
;
then
# Control will enter here if the compiled library ./bitsandbytes/libbitsandbytes.so doesn't exist.
echo
"Compilation unsuccessul!"
1>&2
exit
64
fi
#CUDA_VERSION=117 python -m build
#CUDA_VERSION=117
-nomatmul
python -m build
#python -m twine upload dist/* --verbose
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment