add moe_wna16_gemm

c8492797 · zhuwenwen · fe6d3b05 · c8492797 · c8492797
Commit c8492797 authored Apr 02, 2025 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

csrc/moe/moe_ops.h csrc/moe/moe_ops.h +1 -1

csrc/moe/torch_bindings.cpp csrc/moe/torch_bindings.cpp +1 -1

No files found.
--- a/csrc/moe/moe_ops.h
+++ b/csrc/moe/moe_ops.h
@@ -18,7 +18,7 @@ void sgl_moe_align_block_size(torch::Tensor topk_ids, int64_t num_experts,
                              torch::Tensor sorted_token_ids,
                              torch::Tensor experts_ids,
                              torch::Tensor num_tokens_post_pad);
-#ifndef USE_ROCM
+#ifdef USE_ROCM
 torch::Tensor moe_wna16_gemm(torch::Tensor input, torch::Tensor output,
                             torch::Tensor b_qweight, torch::Tensor b_scales,
                             std::optional<torch::Tensor> b_qzeros,

--- a/csrc/moe/torch_bindings.cpp
+++ b/csrc/moe/torch_bindings.cpp
@@ -31,7 +31,7 @@ TORCH_LIBRARY_EXPAND(TORCH_EXTENSION_NAME, m) {
      "                         Tensor! num_tokens_post_pad) -> ()");
  m.impl("sgl_moe_align_block_size", torch::kCUDA, &sgl_moe_align_block_size);
-#ifndef USE_ROCM
+#ifdef USE_ROCM
  m.def(
      "moe_wna16_gemm(Tensor input, Tensor! output, Tensor b_qweight, "
      "Tensor b_scales, Tensor? b_qzeros, "