# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
# All rights reserved. SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may not
# use this file except in compliance with the License. You may obtain a copy of
# the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations under
# the License.

# Gather every CUDA source file below this directory (the relative pattern is
# resolved against the current source directory) and build them into one static
# library.
#
# CONFIGURE_DEPENDS asks the generated build system to re-evaluate the glob on
# each build and rerun CMake when the set of matching files changes; without it
# a newly added or deleted .cu file goes unnoticed until a manual reconfigure.
file(GLOB_RECURSE SRC_CU CONFIGURE_DEPENDS *.cu)
add_library(fusedGatedRMSNormQuant_src STATIC ${SRC_CU})

if("100" IN_LIST CMAKE_CUDA_ARCHITECTURES_ORIG)
  # Architecture "100" (Blackwell) was requested: add extra NVCC options for
  # this target. The options are attached to the whole target, so they apply to
  # every CUDA source in it, not only to the code generated for that
  # architecture.
  #
  # * --extra-device-vectorization: NVCC device-code vectorization switch.
  # * --ptxas-options=...: forwards two warning switches to ptxas (local memory
  #   usage and register spills).
  set(FUSED_GATED_RMSNORM_NVCC_FLAGS
      --extra-device-vectorization
      --ptxas-options=--warn-on-local-memory-usage,--warn-on-spills)

  # Quoted so the ';'-separated flag list stays inside a single generator
  # expression argument; the expression limits the flags to CUDA compilation.
  target_compile_options(
    fusedGatedRMSNormQuant_src
    PRIVATE "$<$<COMPILE_LANGUAGE:CUDA>:${FUSED_GATED_RMSNORM_NVCC_FLAGS}>")
endif()

if(NOT WIN32)
  # On non-Windows platforms, hand -Wno-psabi to the host compiler through
  # NVCC's -Xcompiler pass-through, for CUDA sources only.
  # NOTE(review): presumably meant to silence the host compiler's psABI
  # diagnostics -- confirm against the toolchains in use.
  target_compile_options(fusedGatedRMSNormQuant_src
                         PRIVATE "$<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-Wno-psabi>")
endif()

# Target-level build properties:
#
# * POSITION_INDEPENDENT_CODE: compile the objects as position-independent
#   code.
# * CUDA_RESOLVE_DEVICE_SYMBOLS: enable the CUDA device-link step on this
#   library target itself.
set_target_properties(
  fusedGatedRMSNormQuant_src
  PROPERTIES POSITION_INDEPENDENT_CODE ON
             CUDA_RESOLVE_DEVICE_SYMBOLS ON)
