mirror of
https://github.com/huggingface/transformers.git
synced 2025-08-01 02:31:11 +06:00
Fix compute_loss in Trainer failing to shift labels for PEFT models when label smoothing is enabled. (#25044)
* Added PeftModelForCausalLM to the MODEL_FOR_CAUSAL_LM_MAPPING_NAMES dict
* Check for a PEFT model in the compute_loss section

---------

Co-authored-by: Nathan Brake <nbrake3@mmm.com>
This commit is contained in:
parent
a03d13c83d
commit
3611fc90e0
@ -2677,7 +2677,11 @@ class Trainer:
|
||||
self._past = outputs[self.args.past_index]
|
||||
|
||||
if labels is not None:
|
||||
if unwrap_model(model)._get_name() in MODEL_FOR_CAUSAL_LM_MAPPING_NAMES.values():
|
||||
if is_peft_available() and isinstance(model, PeftModel):
|
||||
model_name = unwrap_model(model.base_model)._get_name()
|
||||
else:
|
||||
model_name = unwrap_model(model)._get_name()
|
||||
if model_name in MODEL_FOR_CAUSAL_LM_MAPPING_NAMES.values():
|
||||
loss = self.label_smoother(outputs, labels, shift_labels=True)
|
||||
else:
|
||||
loss = self.label_smoother(outputs, labels)
|
||||
|
Loading…
Reference in New Issue
Block a user