From bca0dd5ee3a34d41a54cde3aa598bf8045e36cad Mon Sep 17 00:00:00 2001 From: Suraj Patil Date: Wed, 3 Feb 2021 20:14:42 +0530 Subject: [PATCH] [run_clm.py] fix getting extension --- examples/language-modeling/run_clm.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/examples/language-modeling/run_clm.py b/examples/language-modeling/run_clm.py index 94821a24f04..0c655f08b48 100644 --- a/examples/language-modeling/run_clm.py +++ b/examples/language-modeling/run_clm.py @@ -227,7 +227,11 @@ def main(): data_files["train"] = data_args.train_file if data_args.validation_file is not None: data_files["validation"] = data_args.validation_file - extension = data_args.train_file.split(".")[-1] + extension = ( + data_args.train_file.split(".")[-1] + if data_args.train_file is not None + else data_args.validation_file.split(".")[-1] + ) if extension == "txt": extension = "text" datasets = load_dataset(extension, data_files=data_files)