minor change: pass `folding` through to the auto-alpha tuner and skip pruning `absorb_to_layer` when it is set

yintong-lu · yintong-lu · commit cc759f406116 · 2024-02-22T18:41:35.000-08:00
Signed-off-by: Lu, Yintong <yintong.lu@intel.com>
diff --git a/neural_compressor/adaptor/torch_utils/waq/auto_alpha.py b/neural_compressor/adaptor/torch_utils/waq/auto_alpha.py
@@ -56,6 +56,7 @@ def __init__(
         alpha_step=0.1,
         shared_criterion="mean",
         init_alpha=0.5,
+        folding=False,
         do_blockwise=False,
         n_samples=32,
     ):
@@ -75,6 +76,7 @@ def __init__(
         self.absorb_to_layer = absorb_to_layer
         self.weight_scale_dict = {}
         self.q_func = q_func
+        self.folding = folding
         self.example_inputs = example_inputs
         self.max_value_info = {}  # to record max values for alpha tune
         self.weight_clip = weight_clip[0] if isinstance(weight_clip, tuple) else weight_clip
@@ -92,9 +94,10 @@ def tune(self):
         for key in self.input_mins.keys():
             self.input_maxes_abs[key] = torch.max(torch.abs(self.input_mins[key]), torch.abs(self.input_maxes[key]))
 
-        diff_modules = set(self.absorb_to_layer.keys()).difference(self.input_mins.keys())
-        for d in diff_modules:
-            del self.absorb_to_layer[d]
+        if not self.folding:
+            diff_modules = set(self.absorb_to_layer.keys()).difference(self.input_mins.keys())
+            for d in diff_modules:
+                del self.absorb_to_layer[d]
 
         scale_memo_use = 0
         for key in self.absorb_to_layer:
diff --git a/neural_compressor/adaptor/torch_utils/waq/smooth_quant.py b/neural_compressor/adaptor/torch_utils/waq/smooth_quant.py
@@ -452,6 +452,7 @@ def transform(
                 op_types=op_types,
                 device=self.device,
                 q_func=self.q_func,
+                folding=folding,
                 example_inputs=self.example_inputs,
                 **auto_alpha_args,
             )

Original file line number	Diff line number	Diff line change
`@@ -452,6 +452,7 @@ def transform(`
`452`	`452`	`op_types=op_types,`
`453`	`453`	`device=self.device,`
`454`	`454`	`q_func=self.q_func,`
	`455`	`+ folding=folding,`
`455`	`456`	`example_inputs=self.example_inputs,`
`456`	`457`	`**auto_alpha_args,`
`457`	`458`	`)`