[BitsandBytes] Verify if GPU is available (#30533)

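Change order: run the `torch.cuda.is_available()` check before the accelerate/bitsandbytes availability check in both the 4-bit and 8-bit quantizers.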
2025-07-31 02:02:21 +06:00 · 2024-05-08 12:42:58 +02:00 · 2024-05-08 12:42:58 +02:00 · 1872bde7fc
commit 1872bde7fc
parent 998dbe068b
2 changed files with 5 additions and 6 deletions
--- a/src/transformers/quantizers/quantizer_bnb_4bit.py
+++ b/src/transformers/quantizers/quantizer_bnb_4bit.py
@ -58,6 +58,8 @@ class Bnb4BitHfQuantizer(HfQuantizer):
            self.modules_to_not_convert = self.quantization_config.llm_int8_skip_modules

    def validate_environment(self, *args, **kwargs):
+        if not torch.cuda.is_available():
+            raise RuntimeError("No GPU found. A GPU is needed for quantization.")
        if not (is_accelerate_available() and is_bitsandbytes_available()):
            raise ImportError(
                "Using `bitsandbytes` 8-bit quantization requires Accelerate: `pip install accelerate` "
@ -70,9 +72,6 @@ class Bnb4BitHfQuantizer(HfQuantizer):
                " sure the weights are in PyTorch format."
            )

-        if not torch.cuda.is_available():
-            raise RuntimeError("No GPU found. A GPU is needed for quantization.")
-
        device_map = kwargs.get("device_map", None)
        if (
            device_map is not None
--- a/src/transformers/quantizers/quantizer_bnb_8bit.py
+++ b/src/transformers/quantizers/quantizer_bnb_8bit.py
@ -58,6 +58,9 @@ class Bnb8BitHfQuantizer(HfQuantizer):
            self.modules_to_not_convert = self.quantization_config.llm_int8_skip_modules

    def validate_environment(self, *args, **kwargs):
+        if not torch.cuda.is_available():
+            raise RuntimeError("No GPU found. A GPU is needed for quantization.")
+
        if not (is_accelerate_available() and is_bitsandbytes_available()):
            raise ImportError(
                "Using `bitsandbytes` 8-bit quantization requires Accelerate: `pip install accelerate` "
@ -70,9 +73,6 @@ class Bnb8BitHfQuantizer(HfQuantizer):
                " sure the weights are in PyTorch format."
            )

-        if not torch.cuda.is_available():
-            raise RuntimeError("No GPU found. A GPU is needed for quantization.")
-
        device_map = kwargs.get("device_map", None)
        if (
            device_map is not None