add timeout for downloading the librispeech_asr dataset (#38073)

* add timeout

* increase the download timeout from 10 to 60 (final value in the diff: `60 * 60` seconds)
This commit is contained in:
Fanli Lin 2025-05-13 18:50:12 +08:00 committed by GitHub
parent 3ad35d0bca
commit 8fb60bf6be
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -21,6 +21,7 @@ from dataclasses import dataclass
from pathlib import Path
from typing import Optional, Union
import aiohttp
import datasets
import torch
from accelerate import Accelerator
@@ -454,6 +455,7 @@ def main():
split=train_split_name,
cache_dir=args.cache_dir,
trust_remote_code=args.trust_remote_code,
storage_options={"client_kwargs": {"timeout": aiohttp.ClientTimeout(total=60 * 60)}},
)
datasets_splits.append(dataset_split)