add convert_vertical_slash_indexes and convert_vertical_slash_indexes_mergehead

1e636721 · zhuwenwen · d70425b2 · 1e636721 · 1e636721
Commit 1e636721 authored Sep 23, 2025 by zhuwenwen
Show whitespace changes
Inline Side-by-side

Showing with 0 additions and 5 deletions

csrc/ops.h +0 -3

csrc/torch_bindings.cpp +0 -2

No files found.
--- a/csrc/ops.h
+++ b/csrc/ops.h
@@ -179,8 +179,6 @@ void merge_attn_states(torch::Tensor& output,
                       const torch::Tensor& suffix_output,
                       const torch::Tensor& suffix_lse);

-
-#ifndef USE_ROCM
 void convert_vertical_slash_indexes(
    torch::Tensor& block_count,      // [BATCH, N_HEADS, NUM_ROWS]
    torch::Tensor& block_offset,     // [BATCH, N_HEADS, NUM_ROWS, NNZ_S]
@@ -205,7 +203,6 @@ void convert_vertical_slash_indexes_mergehead(
    torch::Tensor vertical_indices_count,  // [N_HEADS, ]
    torch::Tensor slash_indices_count, int64_t context_size,
    int64_t block_size_M, int64_t block_size_N, bool causal);
-#endif

 void rms_norm(torch::Tensor& out, torch::Tensor& input, torch::Tensor& weight,
              double epsilon);

--- a/csrc/torch_bindings.cpp
+++ b/csrc/torch_bindings.cpp
@@ -234,7 +234,6 @@ TORCH_LIBRARY_EXPAND(TORCH_EXTENSION_NAME, ops) {
  ops.impl("merge_attn_states", torch::kCUDA, &merge_attn_states);


-#ifndef USE_ROCM
  ops.def(
      "convert_vertical_slash_indexes("
      "   Tensor! block_count, Tensor! block_offset, "
@@ -257,7 +256,6 @@ TORCH_LIBRARY_EXPAND(TORCH_EXTENSION_NAME, ops) {
      "   bool causal) -> ()");
  ops.impl("convert_vertical_slash_indexes_mergehead", torch::kCUDA,
           &convert_vertical_slash_indexes_mergehead);
-#endif

  // Activation ops
  // Activation function used in SwiGLU.