Unverified commit a69cb5cf, authored by Yineng Zhang and committed by GitHub
Browse files

cleanup unused header in sgl_kernel (#2986)

parent def5c318
...@@ -3,11 +3,8 @@ ...@@ -3,11 +3,8 @@
#pragma once #pragma once
#include "cutlass/arch/memory.h" #include <cutlass/arch/memory.h>
#include "cutlass/arch/memory_sm75.h" #include <cutlass/numeric_conversion.h>
#include "cutlass/cutlass.h"
#include "cutlass/fast_math.h"
#include "cutlass/numeric_conversion.h"
namespace cutlass { namespace cutlass {
namespace epilogue { namespace epilogue {
......
...@@ -2,16 +2,9 @@ ...@@ -2,16 +2,9 @@
// https://github.com/NVIDIA/TensorRT-LLM/blob/be1788106245496872d18e702978e59b6bfd50e0/cpp/tensorrt_llm/cutlass_extensions/include/cutlass_extensions/gemm/device/gemm_universal_base_compat.h // https://github.com/NVIDIA/TensorRT-LLM/blob/be1788106245496872d18e702978e59b6bfd50e0/cpp/tensorrt_llm/cutlass_extensions/include/cutlass_extensions/gemm/device/gemm_universal_base_compat.h
#pragma once #pragma once
#include "cutlass/arch/arch.h" #include <cutlass/cutlass.h>
#include "cutlass/cutlass.h" #include <cutlass/device_kernel.h>
#include "cutlass/device_kernel.h" #include <cutlass/trace.h>
#include "cutlass/gemm/device/default_gemm_configuration.h"
#include "cutlass/gemm/gemm.h"
#include "cutlass/gemm/kernel/default_gemm_universal.h"
#include "cutlass/gemm/kernel/gemm_universal.h"
#include "cutlass/gemm/threadblock/threadblock_swizzle.h"
#include "cutlass/numeric_types.h"
#include "cutlass/trace.h"
//////////////////////////////////////////////////////////////////////////////// ////////////////////////////////////////////////////////////////////////////////
......
...@@ -3,14 +3,11 @@ ...@@ -3,14 +3,11 @@
#pragma once #pragma once
#include "cutlass/complex.h" #include <cutlass/complex.h>
#include "cutlass/cutlass.h" #include <cutlass/cutlass.h>
#include "cutlass/fast_math.h" #include <cutlass/fast_math.h>
#include "cutlass/gemm/gemm.h" #include <cutlass/matrix_coord.h>
#include "cutlass/matrix_coord.h" #include <cutlass/trace.h>
#include "cutlass/semaphore.h"
#include "cutlass/trace.h"
#include "cutlass_extensions/epilogue/epilogue_per_row_per_col_scale.h"
///////////////////////////////////////////////////////////////////////////////////////////////// /////////////////////////////////////////////////////////////////////////////////////////////////
......
#include <vector>
#include "utils.hpp" #include "utils.hpp"
// trt_reduce // trt_reduce
......
...@@ -3,9 +3,6 @@ ...@@ -3,9 +3,6 @@
#include <c10/cuda/CUDAStream.h> #include <c10/cuda/CUDAStream.h>
#include <cassert> #include <cassert>
#include <iostream>
#include <sstream>
#include <unordered_map>
#include "trt_reduce_internal.cuh" #include "trt_reduce_internal.cuh"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment