adapter-hub · calpt · Feb 9, 2023 · Jan 28, 2023 · Jan 28, 2023 · Feb 9, 2023
diff --git a/src/transformers/adapters/trainer.py b/src/transformers/adapters/trainer.py
@@ -217,6 +217,28 @@ def _load_heads(self, resume_from_checkpoint):
                 ):
                     self.model.load_head(os.path.join(resume_from_checkpoint, file_name))
 
+    def _load_best_model(self):
+        model = self.model_wrapped if is_sagemaker_mp_enabled() else self.model
+        logger.info(
+            f"Loading best adapter(s) from {self.state.best_model_checkpoint} (score: {self.state.best_metric})."
+        )
+        # attempt to re-load all adapters from checkpoint
+        for adapter in model.config.adapters.adapters:
+            adapter_dir = os.path.join(self.state.best_model_checkpoint, adapter)
+            if os.path.exists(adapter_dir):
+                model.load_adapter(adapter_dir)
+        if self.train_adapter_fusion:
+            logger.info(
+                f"Loading best adapter fusion(s) from {self.state.best_model_checkpoint} (score:"
+                f" {self.state.best_metric})."
+            )
+            # attempt to re-load all adapter fusions from checkpoint
+            for fusion in model.config.adapters.fusions:
+                fusion_dir = os.path.join(self.state.best_model_checkpoint, fusion)
+                if os.path.exists(fusion_dir):
+                    model.load_adapter_fusion(fusion_dir)
+        model.to(self.args.device)
+
 
 class AdapterTrainerCallback(TrainerCallback):
     def __init__(self, trainer):
@@ -232,27 +254,6 @@ def on_train_begin(self, args: TrainingArguments, state: TrainerState, control:
                 " method"
             )
 
-    def on_train_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl, **kwargs):
-        model = kwargs.pop("model")
-        if args.load_best_model_at_end and state.best_model_checkpoint is not None:
-
-            logger.info(f"Loading best adapter(s) from {state.best_model_checkpoint} (score: {state.best_metric}).")
-            # attempt to re-load all adapters from checkpoint
-            for adapter in model.config.adapters.adapters:
-                adapter_dir = os.path.join(state.best_model_checkpoint, adapter)
-                if os.path.exists(adapter_dir):
-                    model.load_adapter(adapter_dir)
-            if self.trainer.train_adapter_fusion:
-                logger.info(
-                    f"Loading best adapter fusion(s) from {state.best_model_checkpoint} (score: {state.best_metric})."
-                )
-                # attempt to re-load all adapter fusions from checkpoint
-                for fusion in model.config.adapters.fusions:
-                    fusion_dir = os.path.join(state.best_model_checkpoint, fusion)
-                    if os.path.exists(fusion_dir):
-                        model.load_adapter_fusion(fusion_dir)
-            model.to(args.device)
-
     def on_step_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl, **kwargs):
         # apply adapter fusion weight regularization on the value matrix
         model = kwargs.pop("model")