mirror of
https://github.com/huggingface/transformers.git
synced 2025-08-01 02:31:11 +06:00
parent
19919689b2
commit
d1efaf0318
@@ -625,7 +625,7 @@ class RwkvModel(RwkvPreTrainedModel):
|
||||
use_cache = use_cache if use_cache is not None else (self.config.use_cache if not self.training else False)
|
||||
return_dict = return_dict if return_dict is not None else self.config.use_return_dict
|
||||
|
||||
- if attention_mask is None:
|
||||
+ if attention_mask is not None:
|
||||
logger.warning_once("`attention_mask` was passed, but it is unused in this model.")
|
||||
|
||||
if self.training == self.layers_are_rescaled:
|
||||
|
Loading…
Reference in New Issue
Block a user