Rename tokenizer_kwargs to tokenizer_encode_kwargs for text generation pipeline

Joshua-Chin · Joshua-Chin · commit e484dbb80232 · 2025-08-22T10:25:18.000-07:00
diff --git a/src/transformers/pipelines/text_generation.py b/src/transformers/pipelines/text_generation.py
@@ -158,7 +158,7 @@ def _sanitize_parameters(
         max_length=None,
         continue_final_message=None,
         skip_special_tokens=None,
-        tokenizer_kwargs=None,
+        tokenizer_encode_kwargs=None,
         **generate_kwargs,
     ):
         # preprocess kwargs
@@ -196,8 +196,8 @@ def _sanitize_parameters(
         if continue_final_message is not None:
             preprocess_params["continue_final_message"] = continue_final_message
 
-        if tokenizer_kwargs is not None:
-            preprocess_params["tokenizer_kwargs"] = tokenizer_kwargs
+        if tokenizer_encode_kwargs is not None:
+            preprocess_params["tokenizer_encode_kwargs"] = tokenizer_encode_kwargs
 
         preprocess_params.update(generate_kwargs)
 
@@ -293,9 +293,9 @@ def __call__(self, text_inputs, **kwargs):
                 - `None` : default strategy where nothing in particular happens
                 - `"hole"`: Truncates left of input, and leaves a gap wide enough to let generation happen (might
                   truncate a lot of the prompt and not suitable when generation exceed the model capacity)
-            tokenizer_kwargs (`dict`, *optional*):
-                Additional keyword arguments to pass along to the tokenizer. If the text input is a chat, it is passed
-                to `apply_chat_template`. Otherwise, it is passed to `__call__`.
+            tokenizer_encode_kwargs (`dict`, *optional*):
+                Additional keyword arguments to pass along to encoding step of the tokenizer. If the text input is a
+                chat, it is passed to `apply_chat_template`. Otherwise, it is passed to `__call__`.
             generate_kwargs (`dict`, *optional*):
                 Additional keyword arguments to pass along to the generate method of the model (see the generate method
                 corresponding to your framework [here](./text_generation)).
@@ -341,18 +341,18 @@ def preprocess(
         padding=None,
         max_length=None,
         continue_final_message=None,
-        tokenizer_kwargs=None,
+        tokenizer_encode_kwargs=None,
         **generate_kwargs,
     ):
         # Only set non-None tokenizer kwargs, so as to rely on the tokenizer's defaults
-        base_tokenizer_kwargs = {
+        tokenizer_kwargs = {
             "add_special_tokens": add_special_tokens,
             "truncation": truncation,
             "padding": padding,
             "max_length": max_length,  # NOTE: `max_length` is also a `generate` arg. Use `tokenizer_kwargs` to avoid a name clash
         }
-        base_tokenizer_kwargs = {key: value for key, value in base_tokenizer_kwargs.items() if value is not None}
-        tokenizer_kwargs = {**base_tokenizer_kwargs, **(tokenizer_kwargs or {})}
+        tokenizer_kwargs = {key: value for key, value in tokenizer_kwargs.items() if value is not None}
+        tokenizer_kwargs.update(tokenizer_encode_kwargs or {})
 
         if isinstance(prompt_text, Chat):
             tokenizer_kwargs.pop("add_special_tokens", None)  # ignore add_special_tokens on chats
diff --git a/tests/pipelines/test_pipelines_text_generation.py b/tests/pipelines/test_pipelines_text_generation.py
@@ -568,7 +568,7 @@ def test_forward_tokenizer_kwargs(self):
         tokenizer = text_generator.tokenizer
 
         with patch.object(tokenizer, "apply_chat_template", wraps=tokenizer.apply_chat_template) as mock:
-            text_generator(chat, tokenizer_kwargs={"enable_thinking": True})
+            text_generator(chat, tokenizer_encode_kwargs={"enable_thinking": True})
             self.assertGreater(mock.call_count, 0)
             kw_call_args = mock.call_args[1]
             self.assertIn("enable_thinking", kw_call_args)