From da3ba3a1672c87f460382c10d3c1572c39117977 Mon Sep 17 00:00:00 2001
From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com>
Date: Thu, 16 Mar 2023 16:18:05 +0100
Subject: [PATCH] [`XGLM`] Add `accelerate` support for XGLM (#22207)

* add `accelerate` support for XGLM

* fix order
---
 src/transformers/models/xglm/modeling_xglm.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/transformers/models/xglm/modeling_xglm.py b/src/transformers/models/xglm/modeling_xglm.py
index b9cef18efc7..8a19557932f 100755
--- a/src/transformers/models/xglm/modeling_xglm.py
+++ b/src/transformers/models/xglm/modeling_xglm.py
@@ -510,6 +510,7 @@ class XGLMPreTrainedModel(PreTrainedModel):
     config_class = XGLMConfig
     base_model_prefix = "model"
     supports_gradient_checkpointing = True
+    _no_split_modules = ["XGLMDecoderLayer"]
 
     def _init_weights(self, module):
         std = self.config.init_std