Unverified Commit 85855252 authored by Muyang Li's avatar Muyang Li Committed by GitHub
Browse files

fix: fix the typo in FluxModel.cpp as in #297 (#317)

* fix: fix a typo

* style: format the imports
parent ccd93d1e
from typing import Any, Dict, Optional, Union
import logging import logging
import os import os
from typing import Any, Dict, Optional, Union
import diffusers import diffusers
import torch import torch
...@@ -10,7 +9,7 @@ from diffusers.configuration_utils import register_to_config ...@@ -10,7 +9,7 @@ from diffusers.configuration_utils import register_to_config
from diffusers.models.modeling_outputs import Transformer2DModelOutput from diffusers.models.modeling_outputs import Transformer2DModelOutput
from huggingface_hub import utils from huggingface_hub import utils
from packaging.version import Version from packaging.version import Version
from safetensors.torch import load_file, save_file from safetensors.torch import load_file
from torch import nn from torch import nn
from .utils import NunchakuModelLoaderMixin, pad_tensor from .utils import NunchakuModelLoaderMixin, pad_tensor
...@@ -180,9 +179,11 @@ class NunchakuFluxTransformerBlocks(nn.Module): ...@@ -180,9 +179,11 @@ class NunchakuFluxTransformerBlocks(nn.Module):
encoder_hidden_states = encoder_hidden_states.to(original_dtype).to(original_device) encoder_hidden_states = encoder_hidden_states.to(original_dtype).to(original_device)
return encoder_hidden_states, hidden_states return encoder_hidden_states, hidden_states
def __del__(self):
    """Finalizer: release the wrapped native module's resources.

    Calls ``reset()`` on ``self.m`` (presumably the underlying C++/native
    transformer-blocks object — confirm against the class ``__init__``) so
    its buffers are freed when this wrapper is garbage-collected.
    """
    self.m.reset()
## copied from diffusers 0.30.3 ## copied from diffusers 0.30.3
def rope(pos: torch.Tensor, dim: int, theta: int) -> torch.Tensor: def rope(pos: torch.Tensor, dim: int, theta: int) -> torch.Tensor:
assert dim % 2 == 0, "The dimension must be even." assert dim % 2 == 0, "The dimension must be even."
......
...@@ -526,7 +526,7 @@ std::tuple<Tensor, Tensor> JointTransformerBlock::forward(Tensor hidden_states, ...@@ -526,7 +526,7 @@ std::tuple<Tensor, Tensor> JointTransformerBlock::forward(Tensor hidden_states,
? pool.slice(0, i, i + 1).slice(1, 0, num_tokens_img / POOL_SIZE) ? pool.slice(0, i, i + 1).slice(1, 0, num_tokens_img / POOL_SIZE)
: Tensor{}; : Tensor{};
Tensor pool_qkv_context = pool.valid() Tensor pool_qkv_context = pool.valid()
? concat.slice(0, i, i + 1).slice(1, num_tokens_img / POOL_SIZE, num_tokens_img / POOL_SIZE + num_tokens_txt / POOL_SIZE) ? pool.slice(0, i, i + 1).slice(1, num_tokens_img / POOL_SIZE, num_tokens_img / POOL_SIZE + num_tokens_txt / POOL_SIZE)
: Tensor{}; : Tensor{};
// qkv_proj.forward(norm1_output.x.slice(0, i, i + 1), qkv); // qkv_proj.forward(norm1_output.x.slice(0, i, i + 1), qkv);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment