mirror of
https://github.com/huggingface/transformers.git
synced 2025-07-31 02:02:21 +06:00
FIX / OPT: Fix OPT multi-GPU training for OPTForQuestionAnswering (#31092)
Update modeling_opt.py
This commit is contained in:
parent
94d416f018
commit
ab19f907fd
@@ -1427,8 +1427,8 @@ class OPTForQuestionAnswering(OPTPreTrainedModel):
|
||||
end_positions = end_positions.squeeze(-1)
|
||||
# sometimes the start/end positions are outside our model inputs, we ignore these terms
|
||||
ignored_index = start_logits.size(1)
|
||||
- start_positions = start_positions.clamp(0, ignored_index)
|
||||
- end_positions = end_positions.clamp(0, ignored_index)
|
||||
+ start_positions = start_positions.clamp(0, ignored_index).to(logits.device)
|
||||
+ end_positions = end_positions.clamp(0, ignored_index).to(logits.device)
|
||||
|
||||
loss_fct = CrossEntropyLoss(ignore_index=ignored_index)
|
||||
start_loss = loss_fct(start_logits, start_positions)
|
||||
|
Loading…
Reference in New Issue
Block a user