fix(modeling_utils): Correctly call _init_weights in smart_apply

2025-07-04 21:30:07 +06:00 · 2025-07-01 23:45:21 +08:00 · 2025-07-01 23:45:21 +08:00 · f3d88d70f3
commit f3d88d70f3
parent 8e87adc45f
1 changed files with 7 additions and 3 deletions
--- a/src/transformers/modeling_utils.py
+++ b/src/transformers/modeling_utils.py
@ -2763,10 +2763,14 @@ class PreTrainedModel(nn.Module, ModuleUtilsMixin, PushToHubMixin, PeftAdapterMi
            def smart_apply(self, fn):
                for module in self.children():
                    # We found a sub-model: recursively dispatch its own init function now!
-                    if isinstance(module, PreTrainedModel):
-                        module.smart_apply(module._initialize_weights)
+                    # If a module has its own _init_weights function, that one takes priority.
+                    # The logic is:
+                    # 1. Recursively apply the top-level initialization function (`fn`) to all children.
+                    # 2. Apply the submodule's own custom initializer (`_init_weights`) on top of that.
+                    if hasattr(module, "_init_weights"):
+                        module.init_weights()
                    else:
-                        module.smart_apply(fn)
+                        module.apply(fn)
                fn(self)
                return self