# Copyright (c) 2019-2023, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

cmake_minimum_required(VERSION 3.8)

# CUDA is located through the legacy FindCUDA module; the CUDAToolkit lookup
# is kept below in disabled form.
#find_package(CUDAToolkit REQUIRED)
find_package(CUDA REQUIRED)

# Note: gemm_test is added before the -fPIC flags below are appended.
add_subdirectory(gemm_test)

# Position-independent code is requested by appending -fPIC to the raw C++ and
# CUDA flag strings. The per-target POSITION_INDEPENDENT_CODE and
# CUDA_RESOLVE_DEVICE_SYMBOLS properties are left commented out on the targets
# below.
string(APPEND CMAKE_CXX_FLAGS " -fPIC")
string(APPEND CMAKE_CUDA_FLAGS " -fPIC")

# cuda_utils: static library built from cuda_utils.cc.
add_library(cuda_utils STATIC cuda_utils.cc)
#set_property(TARGET cuda_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET cuda_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(cuda_utils
  PUBLIC
    cudart
)

# logger: static library built from logger.cc.
add_library(logger STATIC logger.cc)
#set_property(TARGET logger PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET logger PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(logger
  PUBLIC
    cudart
)

# cublasAlgoMap: static library built from cublasAlgoMap.cc; depends on the
# cuda_utils and logger targets defined above.
add_library(cublasAlgoMap STATIC cublasAlgoMap.cc)
#set_property(TARGET cublasAlgoMap PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET cublasAlgoMap PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(cublasAlgoMap
  PUBLIC
    cublas
    cudart
    curand
    cuda_utils
    logger
)

# cublasMMWrapper: static library built from cublasMMWrapper.cc; layered on
# top of cublasAlgoMap.
add_library(cublasMMWrapper STATIC cublasMMWrapper.cc)
#set_property(TARGET cublasMMWrapper PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET cublasMMWrapper PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(cublasMMWrapper
  PUBLIC
    cublas
    cudart
    curand
    cublasAlgoMap
    cuda_utils
    logger
)
# The cuSPARSE libraries are linked only when SPARSITY_SUPPORT is enabled.
if(SPARSITY_SUPPORT)
  target_link_libraries(cublasMMWrapper
    PUBLIC
      cusparse
      -lcusparseLt
  )
endif()
# word_list: static library built from word_list.cc; no link dependencies are
# declared for it here.
add_library(word_list STATIC word_list.cc)
#set_property(TARGET word_list PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET word_list PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)

# nvtx_utils: static library built from nvtx_utils.cc.
add_library(nvtx_utils STATIC nvtx_utils.cc)
#set_property(TARGET nvtx_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET nvtx_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
# Both branches of this version switch are disabled, so nvtx_utils currently
# links nothing extra whichever CMake version is in use.
if(CMAKE_VERSION VERSION_LESS "3.25")
  # target_link_libraries(nvtx_utils PUBLIC nvToolsExt -ldl)
else()
  # target_link_libraries(nvtx_utils PUBLIC nvtx3 -ldl)
endif()

# memory_utils: static library built from the CUDA source memory_utils.cu.
# It links the `tensor` target, which is declared further down.
add_library(memory_utils STATIC memory_utils.cu)
#set_property(TARGET memory_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET memory_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(memory_utils
  PUBLIC
    cuda_utils
    logger
    tensor
)

# mpi_utils: static library built from mpi_utils.cc. The MPI libraries and
# logger are linked only when BUILD_MULTI_GPU is enabled.
add_library(mpi_utils STATIC mpi_utils.cc)
#set_property(TARGET mpi_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET mpi_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
if(BUILD_MULTI_GPU)
  #target_link_libraries(mpi_utils PUBLIC mpi logger)
  target_link_libraries(mpi_utils
    PUBLIC
      ${MPI_CXX_LIBRARIES}
      logger
  )
endif()

# nccl_utils: static library built from nccl_utils.cc. The NCCL libraries and
# logger are linked only when BUILD_MULTI_GPU is enabled.
add_library(nccl_utils STATIC nccl_utils.cc)
#set_property(TARGET nccl_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET nccl_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
if(BUILD_MULTI_GPU)
  target_link_libraries(nccl_utils
    PUBLIC
      ${NCCL_LIBRARIES}
      logger
  )
endif()

# The cublasINT8MMWrapper target is disabled in its entirety.
# add_library(cublasINT8MMWrapper STATIC cublasINT8MMWrapper.cc)
#set_property(TARGET cublasINT8MMWrapper PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET cublasINT8MMWrapper PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
#target_link_libraries(cublasINT8MMWrapper PUBLIC cublasLt cudart curand cublasAlgoMap cublasMMWrapper cuda_utils logger)

# cublasFP8MMWrapper: declared only when ENABLE_FP8 is set. The active link
# line omits cublasLt; the variant that includes it is kept in disabled form.
if(ENABLE_FP8)
  add_library(cublasFP8MMWrapper STATIC cublasFP8MMWrapper.cu)
  #set_property(TARGET cublasFP8MMWrapper PROPERTY POSITION_INDEPENDENT_CODE ON)
  #set_property(TARGET cublasFP8MMWrapper PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
  #target_link_libraries(cublasFP8MMWrapper PUBLIC cublasLt cudart curand
  target_link_libraries(cublasFP8MMWrapper
    PUBLIC
      cudart
      curand
      cublasAlgoMap
      cublasMMWrapper
      nvtx_utils
      fp8_qgmma_1x1_utils
  )
endif()

# custom_ar_comm: static library built from custom_ar_comm.cc. The
# custom_ar_kernels dependency is not declared in the portion of the file
# visible here.
add_library(custom_ar_comm STATIC custom_ar_comm.cc)
#set_property(TARGET custom_ar_comm PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET custom_ar_comm PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(custom_ar_comm
  PUBLIC
    custom_ar_kernels
    memory_utils
    cuda_utils
    logger
)

# gemm: static library built from gemm.cc. The active link list omits
# cublasLt; the variant that includes it is kept in disabled form.
add_library(gemm STATIC gemm.cc)
#set_property(TARGET gemm PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET gemm PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(gemm
  PUBLIC
    # cublas cublasLt cudart curand
    cublas
    cudart
    curand
    cublasAlgoMap
    memory_utils
    cuda_utils
    logger
)
# The cuSPARSE libraries are linked only when SPARSITY_SUPPORT is enabled.
if(SPARSITY_SUPPORT)
  target_link_libraries(gemm
    PUBLIC
      cusparse
      -lcusparseLt
  )
endif()

# The cuda_fp8_utils target is disabled in its entirety.
# add_library(cuda_fp8_utils STATIC cuda_fp8_utils.cu)
#set_property(TARGET cuda_fp8_utils PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET cuda_fp8_utils PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)

# tensor: static library built from Tensor.cc; -lstdc++fs is passed to the
# linker as a raw flag.
add_library(tensor STATIC Tensor.cc)
#set_property(TARGET tensor PROPERTY POSITION_INDEPENDENT_CODE ON)
#set_property(TARGET tensor PROPERTY CUDA_RESOLVE_DEVICE_SYMBOLS ON)
target_link_libraries(tensor
  PUBLIC
    cuda_utils
    logger
    -lstdc++fs
)