Unverified commit ca60ad8e, authored by Aryan, committed by GitHub

Improve TorchAO error message (#10627)

improve error message
parent beacaa55
@@ -481,8 +481,15 @@ class TorchAoConfig(QuantizationConfigMixin):
         TORCHAO_QUANT_TYPE_METHODS = self._get_torchao_quant_type_to_method()
         if self.quant_type not in TORCHAO_QUANT_TYPE_METHODS.keys():
+            is_floating_quant_type = self.quant_type.startswith("float") or self.quant_type.startswith("fp")
+            if is_floating_quant_type and not self._is_cuda_capability_atleast_8_9():
+                raise ValueError(
+                    f"Requested quantization type: {self.quant_type} is not supported on GPUs with CUDA capability <= 8.9. You "
+                    f"can check the CUDA capability of your GPU using `torch.cuda.get_device_capability()`."
+                )
             raise ValueError(
-                f"Requested quantization type: {self.quant_type} is not supported yet or is incorrect. If you think the "
+                f"Requested quantization type: {self.quant_type} is not supported or is an incorrect `quant_type` name. If you think the "
                 f"provided quantization type should be supported, please open an issue at https://github.com/huggingface/diffusers/issues."
             )
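For reference, a minimal sketch of the new error path. On a GPU whose CUDA capability is below 8.9, the float8 quantization methods are never registered, so any `quant_type` starting with `float` or `fp` misses the lookup and now hits the capability-specific message instead of the generic one. The quant type name `"float8wo_e4m3"` and the assumption that validation raises at config construction time are illustrative, not taken from this diff:

```python
import torch
from diffusers import TorchAoConfig

# Hypothetical setup: a GPU with CUDA capability below 8.9, e.g. an A100.
print(torch.cuda.get_device_capability())  # e.g. (8, 0)

try:
    # Assumed float8 quant type name; any quant_type starting with
    # "float" or "fp" takes the new branch on such a GPU.
    TorchAoConfig("float8wo_e4m3")
except ValueError as err:
    print(err)
    # Requested quantization type: float8wo_e4m3 is not supported on GPUs
    # with CUDA capability <= 8.9. You can check the CUDA capability of your
    # GPU using `torch.cuda.get_device_capability()`.
```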
@@ -652,13 +659,13 @@ class TorchAoConfig(QuantizationConfigMixin):
     def __repr__(self):
         r"""
-        Example of how this looks for `TorchAoConfig("uint_a16w4", group_size=32)`:
+        Example of how this looks for `TorchAoConfig("uint4wo", group_size=32)`:
         ```
         TorchAoConfig {
             "modules_to_not_convert": null,
             "quant_method": "torchao",
-            "quant_type": "uint_a16w4",
+            "quant_type": "uint4wo",
             "quant_type_kwargs": {
                 "group_size": 32
             }
...
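To check the corrected docstring example (assumes a diffusers install with torchao available; the expected output mirrors the docstring above):

```python
from diffusers import TorchAoConfig

# Printing the config exercises __repr__ with the corrected quant type name.
config = TorchAoConfig("uint4wo", group_size=32)
print(config)
# TorchAoConfig {
#   "modules_to_not_convert": null,
#   "quant_method": "torchao",
#   "quant_type": "uint4wo",
#   "quant_type_kwargs": {
#     "group_size": 32
#   }
# }
```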