
Commit 4624311

refine per review comments
Signed-off-by: xin3he <xin3.he@intel.com>
1 parent: ce10e9c

File tree

3 files changed: +3 −2 lines changed

neural_compressor/torch/quantization/__init__.py (1 addition, 1 deletion)

@@ -25,7 +25,7 @@
 )

 # TODO(Yi): move config to config.py
-from .autotune import autotune, TuningConfig, get_default_tune_config
+from neural_compressor.torch.quantization.autotune import autotune, TuningConfig, get_default_tune_config

 ### Quantization Function Registration ###
 import neural_compressor.torch.quantization.weight_only

neural_compressor/torch/quantization/config.py (1 addition, 0 deletions)

@@ -98,6 +98,7 @@ def __init__(
         use_mse_search (bool): Enables mean squared error (MSE) search, default is False.
         use_layer_wise (bool): Enables quantize model per layer. Defaults to False.
         export_compressed_model (bool): Enables return model in int format or not. Defaults to False.
+        use_double_quant (bool): Enables double quantization, default is False.
         double_quant_dtype (str): Data type for double_quant scale, default is "int".
         double_quant_bits (int): Number of bits used to represent double_quant scale, default is 4.
         double_quant_use_sym (bool): Indicates whether double_quant scale are symmetric, default is True.
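The added docstring line documents `use_double_quant` alongside the existing double-quant parameters and their defaults. As a hedged illustration only, the sketch below mirrors those documented names and defaults in a plain dataclass; `DoubleQuantOptions` is a hypothetical stand-in, not the actual config class from `neural_compressor.torch.quantization.config`.

```python
from dataclasses import dataclass


# Hypothetical stand-in that mirrors the double-quant options and defaults
# documented in the diff above; the real options live on the config class in
# neural_compressor.torch.quantization.config.
@dataclass
class DoubleQuantOptions:
    use_double_quant: bool = False      # enables double quantization
    double_quant_dtype: str = "int"     # data type for the double_quant scale
    double_quant_bits: int = 4          # bits used to represent the double_quant scale
    double_quant_use_sym: bool = True   # whether the double_quant scale is symmetric


# Enabling double quantization while keeping the documented defaults.
opts = DoubleQuantOptions(use_double_quant=True)
print(opts.double_quant_dtype, opts.double_quant_bits, opts.double_quant_use_sym)
# → int 4 True
```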

test/3x/torch/quantization/weight_only/test_rtn.py (1 addition, 1 deletion)

@@ -102,7 +102,7 @@ def test_mse_search(self):
                 atol_false > atol_true
             ), "use_mse_search=True doesn't help accuracy, maybe is reasonable, please double check."
         except:
-            pass  # atol is very close, double checked the logic.
+            assert torch.allclose(atol_false, atol_true, atol=0.012), "atol is very close, double checked the logic."

     def test_layer_wise(self):
         model = copy.deepcopy(self.tiny_gptj)
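The replacement turns a silent `except: pass` into a real check: `torch.allclose(atol_false, atol_true, atol=0.012)` asserts the two accuracy deltas are within tolerance rather than swallowing the failure. For reference, `torch.allclose` applies the elementwise rule |a − b| ≤ atol + rtol·|b| (rtol defaults to 1e-5). A minimal pure-Python sketch of that rule, with illustrative values chosen here (not taken from the test):

```python
def allclose_scalar(a: float, b: float, rtol: float = 1e-5, atol: float = 1e-8) -> bool:
    """Scalar version of the tolerance rule torch.allclose applies
    elementwise: |a - b| <= atol + rtol * |b|."""
    return abs(a - b) <= atol + rtol * abs(b)


# With atol=0.012, as in the updated test, a small gap counts as close
# while a larger one does not (values are illustrative).
print(allclose_scalar(0.305, 0.310, atol=0.012))  # → True  (gap 0.005)
print(allclose_scalar(0.305, 0.360, atol=0.012))  # → False (gap 0.055)
```

The point of the change is that a near-tie between `atol_false` and `atol_true` now passes explicitly through a bounded comparison, while a genuine regression beyond the tolerance fails the test instead of being ignored.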

0 commit comments
