fix check for hidden size in text model for deepspeed zero3 auto entries (#33829)

* fix check for hidden size in text model for deepspeed zero3 auto entries

* fix typo
This commit is contained in:
Wing Lian 2024-10-01 06:28:26 -04:00 committed by GitHub
parent 808997a634
commit fbde09c8c9
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -228,6 +228,11 @@ class HfTrainerDeepSpeedConfig(HfDeepSpeedConfig):
elif hasattr(model.config, "hidden_sizes"):
# if there are many hidden sizes pick the largest one
hidden_size = max(model.config.hidden_sizes)
elif hasattr(model.config, "text_config") and hasattr(model.config.text_config, "hidden_size"):
hidden_size = model.config.text_config.hidden_size
elif hasattr(model.config, "text_config") and hasattr(model.config.text_config, "hidden_sizes"):
# if there are many hidden sizes pick the largest one
hidden_size = max(model.config.text_config.hidden_sizes)
else:
raise ValueError(
"The model's config file has neither `hidden_size` nor `hidden_sizes` entry, "