Fix beam_scores shape when token scores shape changes after logits_processor (#25980)

2025-07-31 02:02:21 +06:00 · 2023-09-14 02:12:47 +08:00 · 2023-09-14 02:12:47 +08:00 · 0fced06788
commit 0fced06788
parent a796f7eea6
1 changed files with 9 additions and 3 deletions
--- a/src/transformers/generation/utils.py
+++ b/src/transformers/generation/utils.py
@ -3038,7 +3038,9 @@ class GenerationMixin:
            )  # (batch_size * num_beams, vocab_size)

            next_token_scores_processed = logits_processor(input_ids, next_token_scores)
-            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(next_token_scores)
+            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(
+                next_token_scores_processed
+            )

            # Store scores, attentions and hidden_states when required
            if return_dict_in_generate:
@ -3363,7 +3365,9 @@ class GenerationMixin:
            )  # (batch_size * num_beams, vocab_size)

            next_token_scores_processed = logits_processor(input_ids, next_token_scores)
-            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(next_token_scores)
+            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(
+                next_token_scores_processed
+            )
            # Note: logits warpers are intentionally applied after adding running beam scores. On some logits warpers
            # (like top_p) this is indifferent, but on others (like temperature) it is not. For reference, see
            # https://github.com/huggingface/transformers/pull/5420#discussion_r449779867
@ -4080,7 +4084,9 @@ class GenerationMixin:

            next_token_scores_processed = logits_processor(input_ids, next_token_scores)

-            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(next_token_scores)
+            next_token_scores = next_token_scores_processed + beam_scores[:, None].expand_as(
+                next_token_scores_processed
+            )

            scores_for_all_vocab = next_token_scores.clone()