Change attention mask dtype to be bool. Fix #1119

2025-07-25 23:38:59 +06:00 · 2019-08-27 14:19:03 +03:00 · 2019-08-27 14:19:03 +03:00 · 53282b5bd0
commit 53282b5bd0
parent e08c01aa1a
1 changed file with 2 additions and 2 deletions
--- a/pytorch_transformers/modeling_transfo_xl.py
+++ b/pytorch_transformers/modeling_transfo_xl.py
@@ -1142,10 +1142,10 @@ class TransfoXLModel(TransfoXLPreTrainedModel):
            else:
                mask_shift_len = qlen
            dec_attn_mask = (torch.triu(all_ones, 1+mlen)
-                    + torch.tril(all_ones, -mask_shift_len)).byte()[:, :, None] # -1
+                    + torch.tril(all_ones, -mask_shift_len)).bool()[:, :, None] # -1
        else:
            dec_attn_mask = torch.triu(
-                word_emb.new_ones(qlen, klen), diagonal=1+mlen).byte()[:,:,None]
+                word_emb.new_ones(qlen, klen), diagonal=1+mlen).bool()[:,:,None]
        hids = []
        attentions = []