From 85980d636c477a307285d008ab5b233a574a6d91 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Xavier=20Dupr=C3=A9?= Date: Wed, 7 Jan 2026 09:07:59 +0100 Subject: [PATCH 1/2] fix patched lazy_initialization for transformers>=5 --- .../patches/_patch_transformers_dynamic_cache.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/onnx_diagnostic/torch_export_patches/patches/_patch_transformers_dynamic_cache.py b/onnx_diagnostic/torch_export_patches/patches/_patch_transformers_dynamic_cache.py index d29f5616..0966d9f6 100644 --- a/onnx_diagnostic/torch_export_patches/patches/_patch_transformers_dynamic_cache.py +++ b/onnx_diagnostic/torch_export_patches/patches/_patch_transformers_dynamic_cache.py @@ -22,7 +22,9 @@ class patched_DynamicLayer: _PATCHES_ = ["lazy_initialization"] _PATCHED_CLASS_ = DynamicLayer - def lazy_initialization(self, key_states: torch.Tensor): + def lazy_initialization( + self, key_states: torch.Tensor, value_states: torch.Tensor = None + ): self.dtype, self.device = key_states.dtype, key_states.device assert ( hasattr(key_states, "shape") and key_states is not None From 67cf7c5488d55450f89e949f68454de086d2baa3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Xavier=20Dupr=C3=A9?= Date: Wed, 7 Jan 2026 09:08:54 +0100 Subject: [PATCH 2/2] doc --- CHANGELOGS.rst | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOGS.rst b/CHANGELOGS.rst index 134c526f..51c85101 100644 --- a/CHANGELOGS.rst +++ b/CHANGELOGS.rst @@ -4,6 +4,7 @@ Change Logs 0.8.8 +++++ +* :pr:`376`: fix patched lazy_initialization for transformers>=5 * :pr:`372`: fix patch on rotary embedding * :pr:`371`: fix make_fake_with_dynamic_dimensions