Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
bitsandbytes
Commits
8400b58c
Commit
8400b58c
authored
Oct 17, 2021
by
Tim Dettmers
Browse files
Added Kepler and fixed V100+CUDA101 support. #4 #5
parent
20294dc0
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
28 additions
and
9 deletions
+28
-9
Makefile
Makefile
+28
-9
No files found.
Makefile
View file @
8400b58c
...
...
@@ -15,11 +15,30 @@ INCLUDE := -I $(CUDA_HOME)/include -I $(ROOT_DIR)/csrc -I $(CONDA_PREFIX)/inclu
# Linker flags: library search directories and the CUDA libraries to link against.
LIB := -L $(CUDA_HOME)/lib64
LIB += -lcudart -lcuda -lcublas -lcurand -lcusparse
LIB += -L $(CONDA_PREFIX)/lib
# NVIDIA NVCC compilation flags
# Base list of -gencode targets passed to every nvcc invocation in this file.
# Architectures that only some CUDA toolkits accept are kept out of this list
# and live in the CC_CUDA* variables instead.
# The list starts with a single `:=` and grows with `+=`; each architecture
# appears exactly once.
COMPUTE_CAPABILITY := -gencode arch=compute_35,code=sm_35 # Kepler
COMPUTE_CAPABILITY += -gencode arch=compute_37,code=sm_37 # Kepler
COMPUTE_CAPABILITY += -gencode arch=compute_50,code=sm_50 # Maxwell
COMPUTE_CAPABILITY += -gencode arch=compute_52,code=sm_52 # Maxwell
COMPUTE_CAPABILITY += -gencode arch=compute_60,code=sm_60 # Pascal
COMPUTE_CAPABILITY += -gencode arch=compute_61,code=sm_61 # Pascal
COMPUTE_CAPABILITY += -gencode arch=compute_70,code=sm_70 # Volta
COMPUTE_CAPABILITY += -gencode arch=compute_72,code=sm_72 # Volta
# Toolkit-specific -gencode targets, one variable per supported CUDA release line.

# CUDA 9.2 supports CC 3.0, but CUDA >= 11.0 does not
CC_CUDA92 := -gencode arch=compute_30,code=sm_30

# Later versions of CUDA support the new architectures
CC_CUDA10x := -gencode arch=compute_30,code=sm_30 \
              -gencode arch=compute_75,code=sm_75

CC_CUDA110 := -gencode arch=compute_75,code=sm_75 \
              -gencode arch=compute_80,code=sm_80

CC_CUDA11x := -gencode arch=compute_75,code=sm_75 \
              -gencode arch=compute_80,code=sm_80 \
              -gencode arch=compute_86,code=sm_86
# all: compile $(FILES_CUDA) with nvcc as relocatable device code (-dc) for the
# architectures in $(COMPUTE_CAPABILITY), writing the objects to $(BUILD_DIR).
all: $(ROOT_DIR)/dependencies/cub $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) \
	  -Xcompiler '-fPIC' --use_fast_math -Xptxas=-v \
	  -dc $(FILES_CUDA) $(INCLUDE) $(LIB) \
	  --output-directory $(BUILD_DIR)
...
...
@@ -27,23 +46,23 @@ all: $(ROOT_DIR)/dependencies/cub $(BUILD_DIR)
# Host link step: combine the CUDA objects, the device-link object and the C++
# sources into the shared library ./bitsandbytes/libbitsandbytes.so.
	$(GPP) -std=c++11 -shared -fPIC $(INCLUDE) \
	  $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o $(BUILD_DIR)/link.o \
	  $(FILES_CPP) \
	  -o ./bitsandbytes/libbitsandbytes.so $(LIB)
# cuda92: build ./bitsandbytes/libbitsandbytes.so with a CUDA 9.2 toolkit.
# Steps:
#   1. nvcc -dc    : compile $(FILES_CUDA) to relocatable device code in $(BUILD_DIR)
#   2. nvcc -dlink : device-link ops.o and kernels.o into link.o
#   3. $(GPP)      : link the objects and $(FILES_CPP) into the shared library
# Steps 1 and 2 receive the same architecture list, $(COMPUTE_CAPABILITY) plus
# $(CC_CUDA92). Each step runs exactly once; an earlier compile/device-link pair
# without $(CC_CUDA92) only produced objects that were immediately overwritten.
cuda92: $(ROOT_DIR)/dependencies/cub $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA92) -Xcompiler '-fPIC' --use_fast_math -Xptxas=-v \
	  -dc $(FILES_CUDA) $(INCLUDE) $(LIB) --output-directory $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA92) -Xcompiler '-fPIC' \
	  -dlink $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o -o $(BUILD_DIR)/link.o
	$(GPP) -std=c++11 -shared -fPIC $(INCLUDE) \
	  $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o $(BUILD_DIR)/link.o $(FILES_CPP) \
	  -o ./bitsandbytes/libbitsandbytes.so $(LIB)
# cuda10x: build ./bitsandbytes/libbitsandbytes.so with a CUDA 10.x toolkit.
# Steps:
#   1. nvcc -dc    : compile $(FILES_CUDA) to relocatable device code in $(BUILD_DIR)
#   2. nvcc -dlink : device-link ops.o and kernels.o into link.o
#   3. $(GPP)      : link the objects and $(FILES_CPP) into the shared library
# Steps 1 and 2 receive the same architecture list, $(COMPUTE_CAPABILITY) plus
# $(CC_CUDA10x) (sm_30 and sm_75). Each step runs exactly once; an earlier
# compile/device-link pair with a hand-written sm_75 flag only produced objects
# that were immediately overwritten.
cuda10x: $(ROOT_DIR)/dependencies/cub $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA10x) -Xcompiler '-fPIC' --use_fast_math -Xptxas=-v \
	  -dc $(FILES_CUDA) $(INCLUDE) $(LIB) --output-directory $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA10x) -Xcompiler '-fPIC' \
	  -dlink $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o -o $(BUILD_DIR)/link.o
	$(GPP) -std=c++11 -shared -fPIC $(INCLUDE) \
	  $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o $(BUILD_DIR)/link.o $(FILES_CPP) \
	  -o ./bitsandbytes/libbitsandbytes.so $(LIB)
# cuda110: build ./bitsandbytes/libbitsandbytes.so with a CUDA 11.0 toolkit.
# Steps:
#   1. nvcc -dc    : compile $(FILES_CUDA) to relocatable device code in $(BUILD_DIR)
#   2. nvcc -dlink : device-link ops.o and kernels.o into link.o
#   3. $(GPP)      : link the objects and $(FILES_CPP) into the shared library
# Steps 1 and 2 use $(COMPUTE_CAPABILITY) plus $(CC_CUDA110) (sm_75 and sm_80).
# $(CC_CUDA10x) must not be used here: it contains sm_30, which CUDA >= 11.0
# does not support, and it lacks sm_80.
# Unlike cuda92/cuda10x, this target has no $(ROOT_DIR)/dependencies/cub
# prerequisite (presumably because the toolkit provides CUB - TODO confirm).
cuda110: $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA110) -Xcompiler '-fPIC' --use_fast_math -Xptxas=-v \
	  -dc $(FILES_CUDA) $(INCLUDE) $(LIB) --output-directory $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA110) -Xcompiler '-fPIC' \
	  -dlink $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o -o $(BUILD_DIR)/link.o
	$(GPP) -std=c++11 -shared -fPIC $(INCLUDE) \
	  $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o $(BUILD_DIR)/link.o $(FILES_CPP) \
	  -o ./bitsandbytes/libbitsandbytes.so $(LIB)
# cuda11x: build ./bitsandbytes/libbitsandbytes.so with a CUDA 11.x (> 11.0) toolkit.
# Steps:
#   1. nvcc -dc    : compile $(FILES_CUDA) to relocatable device code in $(BUILD_DIR)
#   2. nvcc -dlink : device-link ops.o and kernels.o into link.o
#   3. $(GPP)      : link the objects and $(FILES_CPP) into the shared library
# Steps 1 and 2 use $(COMPUTE_CAPABILITY) plus $(CC_CUDA11x) (sm_75, sm_80 and
# sm_86). $(CC_CUDA10x) must not be used here: it contains sm_30, which
# CUDA >= 11.0 does not support, and it lacks sm_80 and sm_86.
# Unlike cuda92/cuda10x, this target has no $(ROOT_DIR)/dependencies/cub
# prerequisite (presumably because the toolkit provides CUB - TODO confirm).
cuda11x: $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA11x) -Xcompiler '-fPIC' --use_fast_math -Xptxas=-v \
	  -dc $(FILES_CUDA) $(INCLUDE) $(LIB) --output-directory $(BUILD_DIR)
	$(NVCC) $(COMPUTE_CAPABILITY) $(CC_CUDA11x) -Xcompiler '-fPIC' \
	  -dlink $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o -o $(BUILD_DIR)/link.o
	$(GPP) -std=c++11 -shared -fPIC $(INCLUDE) \
	  $(BUILD_DIR)/ops.o $(BUILD_DIR)/kernels.o $(BUILD_DIR)/link.o $(FILES_CPP) \
	  -o ./bitsandbytes/libbitsandbytes.so $(LIB)
$(BUILD_DIR)
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment