Specifying torch dtype in Qwen2VLForConditionalGeneration (#33953)

* Specifying torch dtype

* Reverting change & changing fallback _from_config() dtype
Hamza Tahboub authored on 2024-10-10 05:39:33 -07:00, committed by GitHub
parent f8a260e2a4
commit dda3f91d06


@@ -1499,7 +1499,7 @@ class PreTrainedModel(nn.Module, ModuleUtilsMixin, GenerationMixin, PushToHubMixin
             torch_dtype (`torch.dtype`, *optional*):
                 Override the default `torch.dtype` and load the model under this dtype.
         """
-        torch_dtype = kwargs.pop("torch_dtype", None)
+        torch_dtype = kwargs.pop("torch_dtype", torch.get_default_dtype())
         use_flash_attention_2 = kwargs.pop("use_flash_attention_2", False)
         # override default dtype if needed
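
The practical effect of the new fallback: when a model is instantiated from a config without an explicit `torch_dtype`, `_from_config()` now follows `torch.get_default_dtype()` instead of skipping the dtype override. Below is a minimal sketch of that behavior; the tiny GPT-2 config is an illustrative stand-in (the PR itself targets Qwen2VLForConditionalGeneration, which goes through the same `_from_config()` path).

```python
import torch
from transformers import AutoModelForCausalLM, GPT2Config

# Tiny config chosen only to keep the sketch fast to build; sizes are
# arbitrary and not part of this PR.
config = GPT2Config(n_embd=32, n_layer=2, n_head=2, vocab_size=128)

# An explicit torch_dtype still overrides the fallback.
model_bf16 = AutoModelForCausalLM.from_config(config, torch_dtype=torch.bfloat16)
print(next(model_bf16.parameters()).dtype)  # torch.bfloat16

# Without an explicit dtype, _from_config now falls back to
# torch.get_default_dtype() (float32 unless the caller changed it via
# torch.set_default_dtype) rather than None.
model_default = AutoModelForCausalLM.from_config(config)
print(next(model_default.parameters()).dtype)  # torch.float32
```

Since `torch.get_default_dtype()` is `float32` unless the caller changes it, the default behavior is unchanged for most users; the difference shows up only when code relies on the process-wide default dtype.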