From 89d7130fdeb8fb5df55e4a311f94191aa5e3768d Mon Sep 17 00:00:00 2001 From: Peter Schneider Date: Fri, 11 Jul 2025 13:08:25 -0700 Subject: [PATCH] fix: ImageTextToTextPipeline handles user-defined generation_config passed to the pipeline --- src/transformers/pipelines/image_text_to_text.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/transformers/pipelines/image_text_to_text.py b/src/transformers/pipelines/image_text_to_text.py index b205e63b05d7..c18378cd0df0 100644 --- a/src/transformers/pipelines/image_text_to_text.py +++ b/src/transformers/pipelines/image_text_to_text.py @@ -422,6 +422,11 @@ def _forward(self, model_inputs, generate_kwargs=None): input_ids = ( model_inputs["input_ids"] if "input_ids" in model_inputs else model_inputs["decoder_input_ids"] ) # for decoder-only models + + # User-defined `generation_config` passed to the pipeline call take precedence + if "generation_config" not in generate_kwargs: + generate_kwargs["generation_config"] = self.generation_config + generated_sequence = self.model.generate(**model_inputs, **generate_kwargs) return {"generated_sequence": generated_sequence, "prompt_text": prompt_text, "input_ids": input_ids}