[trainer: distributed_concat] ensure all_gather's inputs are contiguous (#20951)

Stas Bekman 2022-12-30 21:55:12 -08:00 committed by GitHub
parent 17292440c0
commit 9e6da0a7ed

@@ -189,7 +189,7 @@ def distributed_concat(tensor: Any, num_total_examples: Optional[int] = None) ->
     try:
         if isinstance(tensor, (tuple, list)):
             return type(tensor)(distributed_concat(t, num_total_examples) for t in tensor)
-        tensor = atleast_1d(tensor)
+        tensor = atleast_1d(tensor).contiguous()
         output_tensors = [tensor.clone() for _ in range(dist.get_world_size())]
         dist.all_gather(output_tensors, tensor)
         concat = torch.cat(output_tensors, dim=0)
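
For context: torch.distributed.all_gather copies from the input tensor's underlying buffer, so a non-contiguous view (e.g. the result of a slice or transpose) can be gathered incorrectly or rejected by the communication backend. Below is a minimal standalone sketch, not part of the commit, of the property the fix enforces:

import torch

# A column slice is a strided view over the same storage:
# its elements are not packed densely in memory.
t = torch.arange(12).reshape(3, 4)
col = t[:, 0]                             # every 4th element of the storage
print(col.is_contiguous())                # False

# .contiguous() materializes the view into a densely packed copy,
# which is the layout collectives such as dist.all_gather expect.
# On an already contiguous tensor it returns the tensor unchanged,
# so the fix costs nothing in the common case.
print(col.contiguous().is_contiguous())   # True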