Skip to content

Commit fd06151

Browse files
authored
add Int4TilePackedTo4dTensor subclass to safetensors (#3064)
1 parent d23ed9e commit fd06151

File tree

2 files changed

+12
-2
lines changed

2 files changed

+12
-2
lines changed

test/prototype/safetensors/test_safetensors_support.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,6 +45,7 @@ class TestSafeTensors(TestCase):
4545
(Float8DynamicActivationFloat8WeightConfig(granularity=PerRow()), False),
4646
(Int4WeightOnlyConfig(), False),
4747
(Int4WeightOnlyConfig(), True),
48+
(Int4WeightOnlyConfig(int4_packing_format="tile_packed_to_4d"), False),
4849
],
4950
)
5051
def test_safetensors(self, config, act_pre_scale=False):

torchao/prototype/safetensors/safetensors_utils.py

Lines changed: 11 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,21 +6,30 @@
66
import torch
77

88
import torchao
9-
from torchao.quantization import Float8Tensor, Int4Tensor
9+
from torchao.quantization import (
10+
Float8Tensor,
11+
Int4Tensor,
12+
Int4TilePackedTo4dTensor,
13+
)
1014
from torchao.quantization.quantize_.common import KernelPreference
1115
from torchao.quantization.quantize_.workflows import QuantizeTensorToFloat8Kwargs
1216

1317
ALLOWED_CLASSES = {
1418
"Float8Tensor": Float8Tensor,
1519
"Int4Tensor": Int4Tensor,
20+
"Int4TilePackedTo4dTensor": Int4TilePackedTo4dTensor,
1621
"Float8MMConfig": torchao.float8.inference.Float8MMConfig,
1722
"QuantizeTensorToFloat8Kwargs": QuantizeTensorToFloat8Kwargs,
1823
"PerRow": torchao.quantization.PerRow,
1924
"PerTensor": torchao.quantization.PerTensor,
2025
"KernelPreference": KernelPreference,
2126
}
2227

23-
ALLOWED_TENSORS_SUBCLASSES = ["Float8Tensor", "Int4Tensor"]
28+
ALLOWED_TENSORS_SUBCLASSES = [
29+
"Float8Tensor",
30+
"Int4Tensor",
31+
"Int4TilePackedTo4dTensor",
32+
]
2433

2534
__all__ = [
2635
"TensorSubclassAttributeJSONEncoder",

0 commit comments

Comments (0)