Unverified Commit 3b8d9a8a authored by vthumbe1503, committed by GitHub
Browse files

[Pytorch] remove redundant error check in Linear module (#2420)



remove linear redundant check
Signed-off-by: Varun Thumbe <vthumbe@nvidia.com>
parent 66ae3030
@@ -1536,25 +1536,11 @@ class Linear(TransformerEngineBaseModule):
def _get_weight_and_bias_tensors(self) -> Tuple[torch.Tensor, Optional[torch.Tensor]]:
    """Return the module's concatenated weight and bias tensors.

    The weight is the (no-op) concatenation of the per-split weight
    tensors returned by ``self._get_weight_tensors()``; the bias is the
    concatenation of the tensors named in ``self.bias_names`` when
    ``self.use_bias`` is set, otherwise ``None``.

    Returns:
        Tuple of (weight_tensor, bias_tensor), where bias_tensor may be
        ``None`` when the module has no bias.
    """
    # Per-split weight params; the QuantizedTensor sanity check that used
    # to live here was redundant (handled downstream) and was removed.
    unfused_weights = self._get_weight_tensors()
    # noop_cat avoids a real copy when the params are already contiguous
    # views of one buffer — TODO confirm against noop_cat's contract.
    weight_tensor = noop_cat(unfused_weights)
    if self.use_bias:
        bias_tensor = noop_cat([getattr(self, name) for name in self.bias_names])
    else:
        bias_tensor = None
    return weight_tensor, bias_tensor
def onnx_forward( def onnx_forward(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment