Mirror of https://github.com/huggingface/transformers.git (synced 2025-07-03 12:50:06 +06:00)
[Qwen2.5-Omni] Fix dtype of cos,sin when used with flash attention (#38453)
* Fix dtype of cos,sin when used with flash attention
This commit is contained in:
parent 81cff7ad34
commit 42ef218b58
@@ -1034,8 +1034,8 @@ class Qwen2_5OmniVisionFlashAttention2(nn.Module):
     def _apply_rotary_pos_emb_flashatt(self, tensor: torch.Tensor, freqs: torch.Tensor) -> torch.Tensor:
         tensor_ = tensor.float()
-        cos = freqs.cos()  # .type_as(tensor_)
-        sin = freqs.sin()  # .type_as(tensor_)
+        cos = freqs.cos().type_as(tensor_)
+        sin = freqs.sin().type_as(tensor_)
         output = apply_rotary_emb(tensor_, cos, sin).type_as(tensor)
         return output
@@ -2022,8 +2022,8 @@ class Qwen2_5OmniVisionFlashAttention2(nn.Module):
     def _apply_rotary_pos_emb_flashatt(self, tensor: torch.Tensor, freqs: torch.Tensor) -> torch.Tensor:
         tensor_ = tensor.float()
-        cos = freqs.cos()  # .type_as(tensor_)
-        sin = freqs.sin()  # .type_as(tensor_)
+        cos = freqs.cos().type_as(tensor_)
+        sin = freqs.sin().type_as(tensor_)
         output = apply_rotary_emb(tensor_, cos, sin).type_as(tensor)
         return output
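For context, here is a minimal pure-PyTorch sketch of the patched casting behaviour. The rotary math below stands in for flash_attn's apply_rotary_emb kernel, and the helper name and shapes are hypothetical; the point is that cos and sin are now cast with .type_as(tensor_) so they match the float32 working copy rather than inheriting the dtype of freqs, which could differ under mixed precision.

import torch

def _apply_rotary_pos_emb_sketch(tensor: torch.Tensor, freqs: torch.Tensor) -> torch.Tensor:
    # Hypothetical reference mirroring the patched casting logic.
    tensor_ = tensor.float()  # work in float32 for numerical stability
    # The fix: cast cos/sin to tensor_'s dtype (float32) so the rotary
    # application sees matching dtypes; previously they kept freqs' dtype.
    cos = freqs.cos().type_as(tensor_)  # freqs: (seq_len, head_dim // 2)
    sin = freqs.sin().type_as(tensor_)
    # Pure-PyTorch rotation standing in for flash_attn's apply_rotary_emb
    # (non-interleaved "half" variant, illustrative only).
    x1, x2 = tensor_.chunk(2, dim=-1)
    out = torch.cat((x1 * cos - x2 * sin, x2 * cos + x1 * sin), dim=-1)
    return out.type_as(tensor)  # cast back to the activation dtype

# Usage with bfloat16 activations (hypothetical shapes):
x = torch.randn(16, 64, dtype=torch.bfloat16)  # (seq_len, head_dim)
freqs = torch.randn(16, 32)                    # (seq_len, head_dim // 2), float32
y = _apply_rotary_pos_emb_sketch(x, freqs)
assert y.dtype == torch.bfloat16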