fix _no_split_modules for Whisper model (#22486)

This commit is contained in:
Sourab Mangrulkar 2023-04-04 22:31:32 +05:30 committed by GitHub
parent 900677487d
commit 48fbd8fa2e
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -577,7 +577,7 @@ class WhisperPreTrainedModel(PreTrainedModel):
base_model_prefix = "model"
main_input_name = "input_features"
supports_gradient_checkpointing = True
-_no_split_modules = ["WhisperEncoderLayer"]
+_no_split_modules = ["WhisperEncoderLayer", "WhisperDecoderLayer"]
def _init_weights(self, module):
std = self.config.init_std