Seq2SeqTrainer: use unwrapped model to retrieve the generation config (#22584)

2025-07-31 02:02:21 +06:00 · 2023-04-06 13:29:58 +01:00 · 2023-04-06 13:29:58 +01:00 · 48706c7178
commit 48706c7178
parent 0aa1153ffb
1 changed file with 1 addition and 1 deletion
--- a/src/transformers/trainer_seq2seq.py
+++ b/src/transformers/trainer_seq2seq.py
@@ -277,7 +277,7 @@ class Seq2SeqTrainer(Trainer):
            self.model.generation_config._from_model_config = False

        # Retrieves GenerationConfig from model.generation_config
-        gen_config = model.generation_config
+        gen_config = self.model.generation_config
        # in case the batch is shorter than max length, the output should be padded
        if generated_tokens.shape[-1] < gen_config.max_length:
            generated_tokens = self._pad_tensors_to_max_len(generated_tokens, gen_config.max_length)