mirror of
https://github.com/huggingface/transformers.git
synced 2025-08-01 02:31:11 +06:00
[GptNeox] don't gather on pkv when using the trainer (#29892)
don't gather on pkv when using the trainer
This commit is contained in:
parent
b256516a8c
commit
543889f3f6
@@ -103,6 +103,7 @@ class GPTNeoXConfig(PretrainedConfig):
|
||||
```"""
|
||||
|
||||
model_type = "gpt_neox"
|
||||
keys_to_ignore_at_inference = ["past_key_values"]
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
|
Loading…
Reference in New Issue
Block a user