mirror of https://github.com/huggingface/transformers.git
synced 2025-07-31 02:02:21 +06:00
parent 3a24ba82ad
commit fd70464fa7
@@ -2214,7 +2214,7 @@ class MllamaForConditionalGeneration(MllamaPreTrainedModel, GenerationMixin):
        # If we're in pre-fill or cacheless decoding step, then we need pixel_values and aspect ratios
        # to compute image hidden states, otherwise they are cached within each cross attn layer
        if (input_ids == self.config.image_token_index).any():
            if cache_position[0] == 0:
                model_inputs["pixel_values"] = pixel_values
                model_inputs["aspect_ratio_ids"] = aspect_ratio_ids
                model_inputs["aspect_ratio_mask"] = aspect_ratio_mask
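The logic in this hunk is worth unpacking: vision tensors are forwarded only when the prompt actually contains image placeholder tokens, and even then only on the pre-fill step (cache position 0), because each cross-attention layer caches the image hidden states for all later decoding steps. Below is a minimal, self-contained sketch of that gating pattern; the helper name `gate_vision_inputs`, the placeholder token id, and the toy tensor shapes are illustrative assumptions, not the actual Mllama implementation.

```python
import torch

IMAGE_TOKEN_INDEX = 128256  # hypothetical placeholder id, not taken from the diff

def gate_vision_inputs(model_inputs, input_ids, cache_position,
                       pixel_values, aspect_ratio_ids, aspect_ratio_mask):
    # Vision tensors are needed only if the prompt contains image tokens...
    if (input_ids == IMAGE_TOKEN_INDEX).any():
        # ...and only on the pre-fill step: afterwards the image hidden
        # states are served from the cross-attention layers' cache.
        if cache_position[0] == 0:
            model_inputs["pixel_values"] = pixel_values
            model_inputs["aspect_ratio_ids"] = aspect_ratio_ids
            model_inputs["aspect_ratio_mask"] = aspect_ratio_mask
    return model_inputs

# Toy usage: pre-fill with an image token attaches the vision tensors,
# a later decoding step does not.
ids = torch.tensor([[IMAGE_TOKEN_INDEX, 1, 2]])
prefill = gate_vision_inputs({}, ids, torch.tensor([0]),
                             torch.rand(1, 1, 4, 3, 32, 32),
                             torch.zeros(1, 1, dtype=torch.long),
                             torch.ones(1, 1, 4))
decode = gate_vision_inputs({}, torch.tensor([[3]]), torch.tensor([5]),
                            None, None, None)
print("pixel_values" in prefill, "pixel_values" in decode)  # True False
```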
@@ -243,6 +243,7 @@ def check_attribute_being_used(config_class, attributes, default_value, source_s
        "pad_index",
        "unk_index",
        "mask_index",
        "image_token_index",  # for VLMs
        "image_size",
        "use_cache",
        "out_features",
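For context, `check_attribute_being_used` scans a config class's modeling sources for literal uses of each config attribute and flags unused ones; the list extended here is an allowlist of attributes that count as used by convention even when no textual match is found. A simplified sketch of that kind of check follows; `attribute_is_used` and its substring-scan heuristic are assumptions for illustration, not the checker's actual implementation.

```python
ATTRIBUTES_TO_ALLOW = [
    "pad_index",
    "unk_index",
    "mask_index",
    "image_token_index",  # for VLMs
    "image_size",
    "use_cache",
    "out_features",
]

def attribute_is_used(attribute: str, modeling_sources: list[str]) -> bool:
    # An attribute counts as used if it is conventionally allowed (the scan
    # cannot detect every usage pattern), or if any modeling file references
    # it as `config.<attribute>` / `self.config.<attribute>`.
    if attribute in ATTRIBUTES_TO_ALLOW:
        return True
    needle = f"config.{attribute}"
    return any(needle in source for source in modeling_sources)

# Toy usage: `image_token_index` passes even without a literal reference.
print(attribute_is_used("image_token_index", ["def forward(self): ..."]))  # True
print(attribute_is_used("hidden_bias", ["def forward(self): ..."]))        # False
```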