Combine multiple (IA)^3 Adapters and delete (IA)^3 adapters #980
Good catch, this is a bug in the existing code base.
I like having a separate method for this, but the name is not quite fitting. This combines different module names, right? So could you please adjust the name to reflect that? Also, please add a sentence to the docstring that explains what happens.
I think this is not correct: When using IA³, the IA³ weights have to be multiplied, not added, right? I.e. they should be initialized as 1.0 and then each IA³ weight is multiplied on top, not added. See how it's accomplished in the forward method of IA³:
peft/src/peft/tuners/ia3/layer.py
Lines 177 to 182 in 0c16918
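The multiplicative behavior can be sketched in isolation (a toy NumPy model of the IA³ forward pass, not the actual peft code):

```python
import numpy as np

# Toy model of the IA³ forward pass: each active adapter holds a learned
# scaling vector that multiplies the activations elementwise.
x = np.array([1.0, 2.0, 4.0])      # input activations
l_a = np.array([2.0, 2.0, 2.0])    # scaling vector of adapter A
l_b = np.array([3.0, 0.5, 1.0])    # scaling vector of adapter B

# With both adapters active, the scalings compose multiplicatively:
out_sequential = x * l_a * l_b

# A merged adapter therefore needs the elementwise *product* ...
l_mul = l_a * l_b
# ... not the sum of the vectors:
l_add = l_a + l_b

assert np.allclose(x * l_mul, out_sequential)      # product reproduces it
assert not np.allclose(x * l_add, out_sequential)  # sum does not
```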
If this is correct, we encounter a second problem, namely that the `weights` argument makes little sense: since we just multiply each IA³ weight with each weight from `weights`, due to commutativity the order in `weights` doesn't matter. Whether a user passes `weights=[2, 3]` or `weights=[3, 2]` makes no difference.

We could still leave it as is for consistency, but I would be afraid that this would confuse many users. Instead, we could also 1) remove the `weights` argument entirely for IA³ or 2) only pass a single scalar to `weights`, which is applied once to all weights (it could be set as the initial value). WDYT?
Thanks for the feedback and review!
This is true in the forward pass. The learned vectors $l$ are multiplied with (in the case of attention) $K^T$ and $V$. However, here we are not considering the key and value matrices, only the learned vectors $l$ (as far as I understand), so my approach here was to compute a linear combination of the vectors (which is what we do in LoRA?).

Let's assume we have two adapters that target $K$ and $V$ with associated vectors $l_K$ and $l_V$, and weights `[0.6, 0.4]`. The way I wanted to combine these adapters into a new adapter was $l_{new} = 0.6 \cdot l_K + 0.4 \cdot l_V$. If we also target the FF layers, we would compute the resulting vector using the same procedure.

If we multiply the vectors, yes. However, that would not result in a linear combination of the vectors, which was my goal.

Let me know if this makes sense!
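A minimal sketch of that linear combination (NumPy; `combine_linear` is a hypothetical helper, not part of peft):

```python
import numpy as np

def combine_linear(vectors, weights):
    """Weighted linear combination of IA³ scaling vectors (the approach
    proposed above, analogous to combination_type='linear' for LoRA)."""
    return sum(w * v for w, v in zip(weights, vectors))

l_k = np.array([1.5, 0.8])   # learned vector of the first adapter
l_v = np.array([0.5, 2.0])   # learned vector of the second adapter

# New adapter vector: 0.6 * l_k + 0.4 * l_v
l_new = combine_linear([l_k, l_v], [0.6, 0.4])
```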
Hmm, not sure. Let's work with scalars for a second. Let's say we have one IA³ weight with value 2 and one with value 3. As they are multiplied consecutively on the input, I would expect that we should multiply by 6, not by their sum 5. Am I missing something?
Anyway, I thought: why not just test whether the results are right or not? For this, I changed the test you added to do this instead:
As you can see, we test the outputs of an IA³ model with the 3 adapters active but unmerged, vs merged, vs merged using `add_weighted_adapter` (your implementation), vs merged using `add_weighted_adapter_mul` (my implementation using multiply). When I run the tests, the multiply version passes but the addition version fails, which makes me think that multiplying is the way to go.

If you want to replicate this result, it will require a few steps, because our code isn't really set up to work with multiple active adapters yet, so I had to make a few ad hoc changes to even get this far. I created a PR on top of your branch containing those changes:
https://github.com/alexrs/peft/pull/1/files
Obviously, it should not be merged, it's just to show you what steps I took. WDYT, is this plausible?
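Stripped of the model plumbing, the comparison in that test reduces to the following check (a toy NumPy version, independent of peft):

```python
import numpy as np

# Three IA³ adapters, each reduced to an elementwise scaling vector.
x = np.array([1.0, 2.0, 3.0, 4.0])
adapters = [np.full(4, 2.0), np.full(4, 3.0), np.full(4, 0.5)]

# Reference: all three adapters active but unmerged (applied in sequence).
out_unmerged = x.copy()
for l in adapters:
    out_unmerged = out_unmerged * l

merged_mul = np.prod(adapters, axis=0)  # "multiply" merge
merged_add = np.sum(adapters, axis=0)   # "addition" merge

assert np.allclose(x * merged_mul, out_unmerged)      # multiply matches
assert not np.allclose(x * merged_add, out_unmerged)  # addition does not
```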
I see your point! However, I'm not sure this is consistent with the LoRA implementation. As far as I understand, there are two different scenarios here:
1. Stacking adapters: When using `set_adapter` with multiple adapters, what we are doing is stacking them. That's how it works right now, and how it works in LoRA (I think!). This is equivalent to using `combination_type="cat"` in LoRA's `add_weighted_adapter` (see `peft/tests/test_custom_models.py`, lines 819 to 827 in e98df91).
2. Linear combination of adapters: In this case, we are not stacking adapters but combining them to create a new adapter that is a linear combination of the input adapters and the input weights. This is equivalent to `combination_type="linear"` in LoRA's `add_weighted_adapter`. If we change the code linked above to use `linear`, the test fails, and the same happens if we give both adapters equal weights that sum to 1.
I guess a solution is to add the different $(IA)^3$ `combination_type`s to `add_weighted_adapter`. Does this sound reasonable? Or do I have the wrong understanding of how this works?
Yes, you're right in the sense that for IA³, it is not quite clear how to interpret the combination of results. Unfortunately, I don't think there is any existing evidence for what the best way of combining IA³ adapters is. I agree that we could offer multiple methods and that hopefully, with time, the best method will emerge. When it comes to choosing a default, I'd argue it's a nice property for the combined adapter to produce the same output as if all adapters were active at once, WDYT?
Another possibility that comes to mind would be the geometric mean, which seems appropriate for a multiplicative operation, but it wouldn't work for negative numbers, so it has to be ruled out.
When it comes to naming the combination types, the analogy to LoRA is a bit difficult, because the mathematical operation is different. I think for IA³ it is necessary to think from first principles.
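The sign problem with the geometric mean mentioned above is easy to see (NumPy sketch):

```python
import numpy as np

# Two IA³ scaling vectors, one with a negative entry.
l_a = np.array([4.0, -2.0])
l_b = np.array([1.0, 8.0])

prod = l_a * l_b  # elementwise product: [4.0, -16.0]

# The geometric mean prod ** (1/2) is undefined for the negative entry:
with np.errstate(invalid="ignore"):
    geo = prod ** 0.5  # second entry comes out as NaN

assert np.isnan(geo[1])
```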
Agreed.
That makes sense! But as discussed above, it is not how it works in LoRA by default, is it?
I guess the way to proceed is to allow both the multiplication and the linear combination methods via different `combination_type`s, and to set the default to multiplication?

All in all, given that there is no evidence for the best way of combining adapters, I will try to run some experiments using both methods to get more clarity on this topic. Let me know if you have any suggestions or ideas for this!
Yes, but we cannot really compare the two as I mentioned. E.g. it would not make sense to have an "svd" method for IA³, so I think we shouldn't put too much stress on consistency here.
That would be fantastic. Loading and combining multiple LoRAs is mostly a thing in image generation AFAIK, so that's probably what I would investigate, but I'm not sure how well IA³ lends itself to image generation in general.
Linear combination for the `get_delta_weight` method. How should we test that the result is correct?