Update bad_words_ids usage (#15641)

* Improve the parameter `bad_word_ids' usage * Update the bad_words_ids strategy
2025-08-02 19:21:31 +06:00 · 2022-02-15 22:44:34 +07:00 · 2022-02-15 22:44:34 +07:00 · 7bc4a01cb5
commit 7bc4a01cb5
parent 67047b86ce
2 changed files with 5 additions and 4 deletions
--- a/src/transformers/generation_logits_process.py
+++ b/src/transformers/generation_logits_process.py
@ -380,8 +380,9 @@ class NoBadWordsLogitsProcessor(LogitsProcessor):

    Args:
        bad_words_ids (`List[List[int]]`):
-            List of list of token ids that are not allowed to be generated. In order to get the tokens of the words
-            that should not appear in the generated text, use `tokenizer(bad_word, add_prefix_space=True).input_ids`.
+            List of list of token ids that are not allowed to be generated. In order to get the token ids of the words
+            that should not appear in the generated text, use `tokenizer(bad_words, add_prefix_space=True, 
+            add_special_tokens=False).input_ids`.
        eos_token_id (`int`):
            The id of the *end-of-sequence* token.
    """
--- a/src/transformers/generation_utils.py
+++ b/src/transformers/generation_utils.py
@ -901,8 +901,8 @@ class GenerationMixin:
                If set to int > 0, all ngrams of that size that occur in the `encoder_input_ids` cannot occur in the
                `decoder_input_ids`.
            bad_words_ids(`List[List[int]]`, *optional*):
-                List of token ids that are not allowed to be generated. In order to get the tokens of the words that
-                should not appear in the generated text, use `tokenizer(bad_word, add_prefix_space=True,
+                List of token ids that are not allowed to be generated. In order to get the token ids of the words that
+                should not appear in the generated text, use `tokenizer(bad_words, add_prefix_space=True,
                add_special_tokens=False).input_ids`.
            num_return_sequences(`int`, *optional*, defaults to 1):
                The number of independently computed returned sequences for each element in the batch.