[Wav2Vec2 - MMS] Correct directly loading adapters weights #24335

Merged 7 commits on Jun 20, 2023

Changes from 1 commit
Correct direct lang loading
patrickvonplaten committed Jun 17, 2023
commit 7c00aed3939e24e07b4463470e791109d9624397
9 changes: 9 additions & 0 deletions src/transformers/modeling_utils.py
@@ -1275,6 +1275,12 @@ def tie_weights(self):
if hasattr(module, "_tie_weights"):
module._tie_weights()

def load_adaptive_weights(self):
"""
Load adaptive weights after the state dict has been loaded. If required, this method should be overridden by the derived class.
"""
pass
Collaborator
I'd raise an exception here if it's called; otherwise it fails silently.

Suggested change
-    pass
+    raise NotImplementedError

Contributor Author
Yeah, not 100% sure about the design here, but it seems much more in line with:

I think something like `if hasattr(self, "load_adaptive_weights")` is also not great.

Also, it's a bit questionable whether `load_adaptive_weights` is general enough to warrant a place in `modeling_utils.py`, but there is really no other way to support the `from_pretrained(..., target_lang="...")` functionality.

@LysandreJik @sgugger wdyt?
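
For illustration, here is a minimal sketch, not the actual transformers code, contrasting the two designs being weighed: a no-op hook defined on the base class and always called, versus no base-class method plus a `hasattr` check at the call site of `from_pretrained`. The class names are hypothetical.

```python
# Minimal sketch of the two designs discussed above; all names are
# hypothetical and only the control flow matters.


class BaseModelHookStyle:
    """Design 1: a no-op hook on the base class that is always called."""

    def load_adaptive_weights(self):
        # Subclasses that support adapters override this; the base
        # implementation intentionally does nothing (or could raise
        # NotImplementedError, as suggested above).
        pass

    @classmethod
    def from_pretrained(cls):
        model = cls()
        # ... state dict loading would happen here ...
        model.load_adaptive_weights()  # always safe to call
        return model


class BaseModelHasattrStyle:
    """Design 2: no hook on the base class; check for it at the call site."""

    @classmethod
    def from_pretrained(cls):
        model = cls()
        # ... state dict loading would happen here ...
        if hasattr(model, "load_adaptive_weights"):
            model.load_adaptive_weights()
        return model
```

Design 1 keeps the call site clean but does nothing for models without adapters, which is the silent-failure concern raised above; design 2 avoids a new base-class method at the cost of an implicit protocol.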

Collaborator
For now I would override the `_tie_encoder_decoder_weights` method in Wav2Vec2 only and not add those changes in `modeling_utils`. If things change and we get lots of models with adapters, we can revisit the decision and do something like this, but I'd wait for it to be necessary.
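
A rough sketch of that suggestion follows, assuming `tie_weights` (which `from_pretrained` already invokes) as the hook being reused; the class and helper names are simplified stand-ins, not the code from this PR.

```python
# Rough sketch: reuse a hook that `from_pretrained` already calls instead of
# adding a new base-class API; `tie_weights` is assumed as that hook and all
# classes here are simplified stand-ins.
from types import SimpleNamespace


class PreTrainedModelSketch:
    def tie_weights(self):
        pass  # existing hook, already called at the end of `from_pretrained`

    @classmethod
    def from_pretrained(cls, **kwargs):
        model = cls(**kwargs)
        # ... state dict loading would happen here ...
        model.tie_weights()  # existing call site, so no new API is needed
        return model


class Wav2Vec2ForCTCSketch(PreTrainedModelSketch):
    def __init__(self, target_lang=None, adapter_attn_dim=16):
        self.target_lang = target_lang
        self.config = SimpleNamespace(adapter_attn_dim=adapter_attn_dim)

    def tie_weights(self):
        # Repurposed so adapter weights are loaded *after* the state dict,
        # which is the "pretty hacky" trade-off acknowledged below.
        if self.target_lang is not None and getattr(self.config, "adapter_attn_dim", None) is None:
            raise ValueError(
                f"Cannot pass `target_lang`: {self.target_lang} if `config.adapter_attn_dim` is not defined."
            )
        elif self.target_lang is not None:
            self.load_adapter(self.target_lang)

    def load_adapter(self, target_lang):
        print(f"loading adapter weights for {target_lang}")  # placeholder
```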

Contributor Author
That's pretty hacky, but yeah, ok for me. Will add a big comment explaining that we do this to avoid introducing a new API.


@staticmethod
def _tie_encoder_decoder_weights(encoder: nn.Module, decoder: nn.Module, base_model_prefix: str):
uninitialized_encoder_weights: List[str] = []
@@ -2897,6 +2903,9 @@ def from_pretrained(cls, pretrained_model_name_or_path: Optional[Union[str, os.P
# make sure token embedding weights are still tied if needed
model.tie_weights()

# make sure adaptive weights can be loaded dynamically
model.load_adaptive_weights()

# Set model in evaluation mode to deactivate DropOut modules by default
model.eval()

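With this hook wired into `from_pretrained`, loading an MMS checkpoint with a specific adapter language would look roughly like the sketch below; the checkpoint name `facebook/mms-1b-all` and the `ignore_mismatched_sizes` flag are assumptions drawn from general MMS usage rather than from this diff.

```python
from transformers import Wav2Vec2ForCTC

# Hypothetical usage sketch: `target_lang` is forwarded to
# `Wav2Vec2ForCTC.__init__`, and the matching adapter weights are pulled in
# right after the state dict via the `load_adaptive_weights()` call added above.
model = Wav2Vec2ForCTC.from_pretrained(
    "facebook/mms-1b-all",         # example MMS checkpoint (assumed)
    target_lang="fra",
    ignore_mismatched_sizes=True,  # the CTC head size varies per language
)
```
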
11 changes: 7 additions & 4 deletions src/transformers/models/wav2vec2/modeling_wav2vec2.py
@@ -1854,11 +1854,12 @@ def forward(
WAV_2_VEC_2_START_DOCSTRING,
)
class Wav2Vec2ForCTC(Wav2Vec2PreTrainedModel):
def __init__(self, config, target_lang=None):
def __init__(self, config, target_lang: Optional[str] = None):
super().__init__(config)

self.wav2vec2 = Wav2Vec2Model(config)
self.dropout = nn.Dropout(config.final_dropout)
self.target_lang = target_lang

if config.vocab_size is None:
raise ValueError(
@@ -1872,16 +1873,18 @@ def __init__(self, config, target_lang=None):
)
self.lm_head = nn.Linear(output_hidden_size, config.vocab_size)

# Initialize weights and apply final processing
self.post_init()

def load_adaptive_weights(self):
target_lang = self.target_lang
if target_lang is not None and getattr(self.config, "adapter_attn_dim", None) is None:
raise ValueError(f"Cannot pass `target_lang`: {target_lang} if `config.adapter_attn_dim` is not defined.")
elif target_lang is None and getattr(self.config, "adapter_attn_dim", None) is not None:
logger.info("By default `target_lang` is set to 'eng'.")
elif target_lang is not None:
self.load_adapter(target_lang)

# Initialize weights and apply final processing
self.post_init()

def freeze_feature_extractor(self):
"""
Calling this function will disable the gradient computation for the feature encoder so that its parameter will