# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved. # SPDX-License-Identifier: Apache-2.0 # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. cmake_minimum_required(VERSION 3.17) project( nvllm VERSION 0.1.0.0 LANGUAGES CXX ) include(${CMAKE_CURRENT_SOURCE_DIR}/cmake/modules/set_ifndef.cmake) set(CMAKE_CXX_STANDARD 17) set(CMAKE_CXX_STANDARD_REQUIRED true) set(CMAKE_POSTION_INDEPENDENT_CODE ON) set(CMAKE_EXPORT_COMPILE_COMMANDS ON) option(USE_STUBS "Build with stub implementations instead of real CUDA code" OFF) if (USE_STUBS) add_definitions(-DUSE_STUBS) set(SOURCE_FILES src/nvllm_trt.cpp src/engine_stub/engine.cpp ) add_library(tensorrt_llm SHARED src/engine_stub/tensorrt_llm.cpp) else() #SET(TRTLLM_SRC_DIR "${CMAKE_CURRENT_SOURCE_DIR}/../../submodules/tensorrt_llm" CACHE STRING "TRTLLM_SRC_DIR: /../../submodules/tensorrt_llm") SET(TRTLLM_LIB_DIR "/usr/local/lib" CACHE STRING "TRTLLM_LIB_DIR: /usr/local/lib") #include(${TRTLLM_SRC_DIR}/cpp/cmake/modules/find_library_create_target.cmake) set(CMAKE_INSTALL_RPATH "${CMAKE_INSTALL_PREFIX}/lib;/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/usr/local/tensorrt/targets/x86_64-linux-gnu/lib:/src/tensorrt_llm/cpp/build/tensorrt_llm/plugins") set(CMAKE_INSTALL_RPATH_USE_LINK_PATH TRUE) include(FetchContent) FetchContent_Declare( json GIT_REPOSITORY https://github.com/nlohmann/json.git GIT_TAG v3.11.2 ) FetchContent_Declare( spdlog GIT_REPOSITORY https://github.com/gabime/spdlog.git GIT_TAG v1.15.0 ) # Make nlohmann/json available FetchContent_MakeAvailable(json) FetchContent_MakeAvailable(spdlog) set_property(TARGET spdlog PROPERTY POSITION_INDEPENDENT_CODE ON) add_library(tensorrt_llm SHARED IMPORTED) set_target_properties( tensorrt_llm PROPERTIES IMPORTED_LOCATION "${TRTLLM_LIB_DIR}/libtensorrt_llm.so" ) add_library(nvinfer_plugin_tensorrt_llm SHARED IMPORTED) set_target_properties( nvinfer_plugin_tensorrt_llm PROPERTIES IMPORTED_LOCATION "${TRTLLM_LIB_DIR}/libnvinfer_plugin_tensorrt_llm.so" ) add_library(xxhash STATIC IMPORTED) set_target_properties( xxhash PROPERTIES IMPORTED_LOCATION "/usr/lib/x86_64-linux-gnu/libxxhash.a" ) set(SOURCE_FILES src/nvllm_trt.cpp src/engine_trt/engine.cpp src/engine_trt/request.cpp src/engine_trt/response.cpp src/engine_trt/config.cpp src/engine_trt/kv_event.cpp src/engine_trt/stats.cpp ${PROTO_SRCS} ${PROTO_HDRS} # ... other source files ... ) endif() function(set_library_target_properties target) target_include_directories( ${target} PUBLIC $ $ PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}/src ${CMAKE_BINARY_DIR} /usr/local/cuda-12.6/targets/x86_64-linux/include /usr/local/tensorrt/include/ ) target_compile_features(${target} PRIVATE cxx_std_17) set_target_properties(${target} PROPERTIES OUTPUT_NAME nvllm_trt) target_compile_options( ${target} PRIVATE $<$,$,$>: -Wall -Wextra -Wno-unused-parameter -Wno-type-limits> -Wno-deprecated-declarations $<$:/Wall /D_WIN32_WINNT=0x0A00 /EHsc>) if (USE_STUBS) else() target_link_libraries( ${target} PRIVATE tensorrt_llm ${Protobuf_LIBRARIES} xxhash # ${MPI_LIBRARIES} # ${CUDA_LIBRARIES} # nvinfer nvinfer_plugin_tensorrt_llm nlohmann_json::nlohmann_json spdlog::spdlog ) endif() # target_link_options(${target} PRIVATE "-static") target_link_libraries(${target} PUBLIC ) endfunction() add_library(nvllm_trt SHARED ${SOURCE_FILES}) set_library_target_properties(nvllm_trt) include(CMakePackageConfigHelpers) configure_package_config_file( ${CMAKE_CURRENT_SOURCE_DIR}/nvllmConfig.cmake.in ${CMAKE_CURRENT_BINARY_DIR}/nvllmConfig.cmake INSTALL_DESTINATION lib/cmake/nvllm ) write_basic_package_version_file( "nvllmConfigVersion.cmake" VERSION ${PROJECT_VERSION} COMPATIBILITY AnyNewerVersion ) # Installation rules install(TARGETS nvllm_trt EXPORT nvllmConfig # This should match the name used in configure_package_config_file LIBRARY DESTINATION lib ARCHIVE DESTINATION lib RUNTIME DESTINATION bin INCLUDES DESTINATION include ) # Install the nvllmConfig.cmake and nvllmConfigVersion.cmake files install(FILES ${CMAKE_CURRENT_BINARY_DIR}/nvllmConfig.cmake # Corrected the file name ${CMAKE_CURRENT_BINARY_DIR}/nvllmConfigVersion.cmake DESTINATION lib/cmake/nvllm ) # # Install config.h # install(FILES "${PROJECT_BINARY_DIR}/config.h" # DESTINATION include/nvidia/nvllm) # Install header files install(DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/include/ DESTINATION include)