Merge pull request #1162 from huggingface/xlnet-bias

XLNet bias fix on resize embeddings (cf #1124)
Thomas Wolf, 2019-09-02 23:14:04 +02:00 (committed by GitHub)
commit 0287d264e9


@@ -331,6 +331,14 @@ class PreTrainedModel(nn.Module):
         else:
             first_module.weight = second_module.weight

+        if hasattr(first_module, 'bias') and first_module.bias is not None:
+            first_module.bias.data = torch.nn.functional.pad(
+                first_module.bias.data,
+                (0, first_module.weight.shape[0] - first_module.bias.shape[0]),
+                'constant',
+                0
+            )
+
     def resize_token_embeddings(self, new_num_tokens=None):
         """ Resize input token embeddings matrix of the model if new_num_tokens != config.vocab_size.
             Take care of tying weights embeddings afterwards if the model class has a `tie_weights()` method.
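
For context on what the added call does: torch.nn.functional.pad with a (0, n) pad tuple appends n zeros to the right of a 1-D tensor, so the tied output head's bias grows to match the resized weight's first dimension while keeping its learned values. Below is a minimal, self-contained sketch of that behavior; the names old_vocab, new_vocab and lm_head are illustrative, not from the patch.

import torch
import torch.nn as nn

old_vocab, new_vocab, hidden = 5, 8, 4

# An output head whose weight has already been resized to the new
# vocabulary (e.g. via tied embeddings), while the bias is still old-sized.
lm_head = nn.Linear(hidden, new_vocab)
old_bias = torch.randn(old_vocab)

# Same call as in the patch: right-pad the bias with zeros until
# bias.shape[0] equals weight.shape[0] (the new vocabulary size).
padded_bias = torch.nn.functional.pad(
    old_bias,
    (0, lm_head.weight.shape[0] - old_bias.shape[0]),
    'constant',
    0
)

assert padded_bias.shape[0] == new_vocab
assert torch.equal(padded_bias[:old_vocab], old_bias)          # learned values kept
assert torch.equal(padded_bias[old_vocab:], torch.zeros(3))    # new slots zeroed

Padding with zeros rather than reinitializing means existing tokens keep their trained bias, and only the newly added vocabulary slots start from a neutral value.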