Fix AMX: compute use_amx after qlen is read from batch_size_tensor

b22cded8 · Atream · GitHub · 3f14e311 · b22cded8
Unverified Commit b22cded8 authored May 07, 2025 by Atream Committed by GitHub May 07, 2025
Show whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

csrc/ktransformers_ext/operators/amx/moe.hpp +2 -2

No files found.
--- a/csrc/ktransformers_ext/operators/amx/moe.hpp
+++ b/csrc/ktransformers_ext/operators/amx/moe.hpp
@@ -272,8 +272,8 @@ public:
  void forward(int qlen, int k, const uint64_t *expert_ids, const float *weights, const void *input, void *output,
               int *batch_size_tensor, Backend *backend) {
-    bool use_amx = (qlen > 4 * config_.expert_num / config_.routed_expert_num);
    qlen = batch_size_tensor[0];
+    bool use_amx = (qlen > 4 * config_.expert_num / config_.routed_expert_num);
    int activated_expert = 0;
    for (int i = 0; i < config_.expert_num; i++) {
      m_local_num_[i] = 0;