diff --git a/src/transformers/models/paligemma/configuration_paligemma.py b/src/transformers/models/paligemma/configuration_paligemma.py index fe05f38514a7..918095ce85e0 100644 --- a/src/transformers/models/paligemma/configuration_paligemma.py +++ b/src/transformers/models/paligemma/configuration_paligemma.py @@ -74,6 +74,7 @@ class PaliGemmaConfig(PretrainedConfig): model_type = "paligemma" sub_configs = {"text_config": AutoConfig, "vision_config": AutoConfig} + keys_to_ignore_at_inference = ["past_key_values"] def __init__( self, diff --git a/src/transformers/trainer.py b/src/transformers/trainer.py index 677daa55ee40..23eb3907078d 100755 --- a/src/transformers/trainer.py +++ b/src/transformers/trainer.py @@ -4477,7 +4477,7 @@ def prediction_step( inputs = self._prepare_inputs(inputs) if ignore_keys is None: if hasattr(self.model, "config"): - ignore_keys = getattr(self.model.config, "keys_to_ignore_at_inference", []) + ignore_keys = getattr(self.model.config, "keys_to_ignore_at_inference", ["past_key_values"]) else: ignore_keys = []