add timeout for downloading the librispeech_asr dataset (#38073)

* add timeout

* change 10 to 60
This commit is contained in:
Fanli Lin 2025-05-13 18:50:12 +08:00 committed by GitHub
parent 3ad35d0bca
commit 8fb60bf6be
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -21,6 +21,7 @@ from dataclasses import dataclass
 from pathlib import Path
 from typing import Optional, Union
+import aiohttp
 import datasets
 import torch
 from accelerate import Accelerator
@@ -454,6 +455,7 @@ def main():
 split=train_split_name,
 cache_dir=args.cache_dir,
 trust_remote_code=args.trust_remote_code,
+storage_options={"client_kwargs": {"timeout": aiohttp.ClientTimeout(total=60 * 60)}},
 )
 datasets_splits.append(dataset_split)