Initialize flash attn flag (#38768)

`_flash_supports_window_size` is used further down in this file and is relied on by external projects, e.g. [ring-flash-attention](https://github.com/zhuzilin/ring-flash-attention/blob/123f924/ring_flash_attn/adapters/hf_adapter.py#L9-L11). Even though the name is unexported, it still makes sense to keep the state of `globals()` in this file consistent.
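
As a rough illustration of why the module-level default matters, a downstream adapter might import the flag roughly like the sketch below (assuming this file is `transformers/modeling_flash_attention_utils.py`); the try/except fallback is an assumption for illustration, not ring-flash-attention's actual code:

```python
# Hypothetical downstream usage (illustrative only): importing the unexported
# module-level flag. Without the `= False` default added by this commit, the
# name would only exist in globals() when flash_attn_func is available, and
# this import could fail with an ImportError.
try:
    from transformers.modeling_flash_attention_utils import (
        _flash_supports_window_size,
    )
except ImportError:
    # Assumed fallback: treat sliding-window support as absent.
    _flash_supports_window_size = False

print(_flash_supports_window_size)
```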
Mohammad Nasirifar 2025-06-12 07:06:13 -07:00 committed by GitHub
parent 910355a010
commit 038a59e2cd


```diff
@@ -46,6 +46,9 @@ if is_torch_npu_available():
     from .integrations.npu_flash_attention import npu_flash_attn_varlen_func as flash_attn_varlen_func
+_flash_supports_window_size = False
 if flash_attn_func:
     _flash_supports_window_size = "window_size" in list(inspect.signature(flash_attn_func).parameters)
```
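
The detection itself is a general pattern: probe an optionally available callable's signature for a keyword argument before forwarding it. A minimal, self-contained sketch (names here are illustrative, not taken from transformers):

```python
import inspect

def toy_attention(q, k, v, window_size=None):
    """Stand-in for an optionally installed backend function."""
    return q

# Check whether the callable accepts `window_size` before passing it.
supports_window_size = "window_size" in inspect.signature(toy_attention).parameters

kwargs = {"window_size": (64, 64)} if supports_window_size else {}
out = toy_attention("q", "k", "v", **kwargs)
print(supports_window_size)  # True for this toy function
```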