-
Notifications
You must be signed in to change notification settings - Fork 260
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Signed-off-by: xin3he <xin3.he@intel.com>
- Loading branch information
Showing
20 changed files
with
3,669 additions
and
1,263 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
#!/usr/bin/env python | ||
# -*- coding: utf-8 -*- | ||
# | ||
# Copyright (c) 2023 Intel Corporation | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
"""Torch layer-wise quantization module.""" | ||
from .utils import * |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,272 @@ | ||
#!/usr/bin/env python | ||
# -*- coding: utf-8 -*- | ||
# | ||
# Copyright (c) 2023 Intel Corporation | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
"""Load one specify tensor from a bin file.""" | ||
|
||
import io | ||
import os | ||
import warnings | ||
from typing import IO, Any, BinaryIO, Callable, Dict, Optional, Union | ||
|
||
from packaging.version import Version | ||
from torch.serialization import ( | ||
StorageType, | ||
_get_restore_location, | ||
_is_torchscript_zip, | ||
_is_zipfile, | ||
_maybe_decode_ascii, | ||
_open_file_like, | ||
_open_zipfile_reader, | ||
) | ||
|
||
from neural_compressor.adaptor.torch_utils.layer_wise_quant import modified_pickle as pickle | ||
|
||
from .utils import torch | ||
|
||
torch_version = torch.__version__.split("+")[0] | ||
version = Version(torch_version) | ||
|
||
FILE_LIKE = Union[str, os.PathLike, BinaryIO, IO[bytes]] | ||
MAP_LOCATION = Optional[Union[Callable[[torch.Tensor, str], torch.Tensor], torch.device, str, Dict[str, str]]] | ||
|
||
if version.release < Version("1.13.0").release: | ||
UntypedStorage = torch._UntypedStorage | ||
else: | ||
UntypedStorage = torch.UntypedStorage | ||
|
||
|
||
def _load(zip_file, tensor_name, prefix, map_location, pickle_module, pickle_file="data.pkl", **pickle_load_args): | ||
restore_location = _get_restore_location(map_location) | ||
|
||
loaded_storages = {} | ||
|
||
def load_tensor(dtype, numel, key, location): | ||
name = f"data/{key}" | ||
|
||
if version.release < Version("1.13.0").release: | ||
storage = zip_file.get_storage_from_record(name, numel, torch._UntypedStorage).storage()._untyped() | ||
typed_storage = torch.storage._TypedStorage(wrap_storage=restore_location(storage, location), dtype=dtype) | ||
loaded_storages[key] = typed_storage | ||
elif version.release < Version("2.0.0").release: # pragma: no cover | ||
storage = zip_file.get_storage_from_record(name, numel, UntypedStorage).storage().untyped() | ||
typed_storage = torch.storage.TypedStorage(wrap_storage=restore_location(storage, location), dtype=dtype) | ||
loaded_storages[key] = typed_storage | ||
else: | ||
storage = zip_file.get_storage_from_record(name, numel, UntypedStorage)._typed_storage()._untyped_storage | ||
typed_storage = torch.storage.TypedStorage( | ||
wrap_storage=restore_location(storage, location), dtype=dtype, _internal=True | ||
) | ||
|
||
if typed_storage._data_ptr() != 0: | ||
loaded_storages[key] = typed_storage | ||
|
||
return typed_storage | ||
|
||
load_module_mapping: Dict[str, str] = {"torch.tensor": "torch._tensor"} | ||
|
||
# Need to subclass Unpickler instead of directly monkey-patching the find_class method | ||
# because it's marked readonly in pickle. | ||
# The type: ignore is because mypy can't statically determine the type of this class. | ||
class UnpicklerWrapper(pickle_module.Unpickler): # type: ignore[name-defined] | ||
def find_class(self, mod_name, name): | ||
if type(name) is str and "Storage" in name: | ||
try: | ||
return StorageType(name) | ||
except KeyError: # pragma: no cover | ||
pass | ||
mod_name = load_module_mapping.get(mod_name, mod_name) | ||
return super().find_class(mod_name, name) | ||
|
||
def persistent_load(self, saved_id): | ||
assert isinstance(saved_id, tuple) | ||
typename = _maybe_decode_ascii(saved_id[0]) | ||
data = saved_id[1:] | ||
|
||
assert ( | ||
typename == "storage" | ||
), f"Unknown typename for persistent_load, expected 'storage' but got '{typename}'" | ||
storage_type, key, location, numel = data | ||
|
||
if storage_type is UntypedStorage: # pragma: no cover | ||
dtype = torch.uint8 | ||
else: | ||
dtype = storage_type.dtype | ||
|
||
if key in loaded_storages: | ||
typed_storage = loaded_storages[key] | ||
else: | ||
name_list = [self.tensor_name] | ||
if prefix: | ||
no_prefix_name = self.tensor_name.split(".") | ||
if prefix in no_prefix_name: | ||
no_prefix_name.remove(prefix) | ||
no_prefix_name = ".".join(no_prefix_name) | ||
name_list.append(no_prefix_name) | ||
if self.tensor_name and self.metastack[-1][-2] not in name_list: | ||
# typed_storage = None | ||
# loaded_storages[key] = typed_storage | ||
# nbytes = numel * torch._utils._element_size(dtype) | ||
# typed_storage = load_tensor(dtype, nbytes, key, _maybe_decode_ascii(location)) | ||
typed_storage = None | ||
else: | ||
nbytes = numel * torch._utils._element_size(dtype) | ||
typed_storage = load_tensor(dtype, nbytes, key, _maybe_decode_ascii(location)) | ||
|
||
return typed_storage | ||
|
||
# Load the data (which may in turn use `persistent_load` to load tensors) | ||
data_file = io.BytesIO(zip_file.get_record(pickle_file)) | ||
|
||
unpickler = UnpicklerWrapper(data_file, **pickle_load_args) | ||
# unpickler.persistent_load = persistent_load | ||
result = unpickler.load(tensor_name) | ||
|
||
torch._utils._validate_loaded_sparse_tensors() | ||
return result | ||
|
||
|
||
def load( | ||
f: FILE_LIKE, | ||
tensor_name: str = None, | ||
prefix: str = None, | ||
map_location: MAP_LOCATION = None, | ||
pickle_module: Any = None, | ||
*, | ||
weights_only: bool = False, | ||
**pickle_load_args: Any, | ||
) -> Any: | ||
# Reference: https://github.com/pytorch/pytorch/issues/54354 | ||
# The first line of this docstring overrides the one Sphinx generates for the | ||
# documentation. We need it so that Sphinx doesn't leak `pickle`s path from | ||
# the build environment (e.g. `<module 'pickle' from '/leaked/path'). | ||
|
||
"""Load(f, map_location=None, pickle_module=pickle, *, weights_only=False, **pickle_load_args) | ||
Loads an object saved with :func:`torch.save` from a file. | ||
:func:`torch.load` uses Python's unpickling facilities but treats storages, | ||
which underlie tensors, specially. They are first deserialized on the | ||
CPU and are then moved to the device they were saved from. If this fails | ||
(e.g. because the run time system doesn't have certain devices), an exception | ||
is raised. However, storages can be dynamically remapped to an alternative | ||
set of devices using the :attr:`map_location` argument. | ||
If :attr:`map_location` is a callable, it will be called once for each serialized | ||
storage with two arguments: storage and location. The storage argument | ||
will be the initial deserialization of the storage, residing on the CPU. | ||
Each serialized storage has a location tag associated with it which | ||
identifies the device it was saved from, and this tag is the second | ||
argument passed to :attr:`map_location`. The builtin location tags are ``'cpu'`` | ||
for CPU tensors and ``'cuda:device_id'`` (e.g. ``'cuda:2'``) for CUDA tensors. | ||
:attr:`map_location` should return either ``None`` or a storage. If | ||
:attr:`map_location` returns a storage, it will be used as the final deserialized | ||
object, already moved to the right device. Otherwise, :func:`torch.load` will | ||
fall back to the default behavior, as if :attr:`map_location` wasn't specified. | ||
If :attr:`map_location` is a :class:`torch.device` object or a string containing | ||
a device tag, it indicates the location where all tensors should be loaded. | ||
Otherwise, if :attr:`map_location` is a dict, it will be used to remap location tags | ||
appearing in the file (keys), to ones that specify where to put the | ||
storages (values). | ||
User extensions can register their own location tags and tagging and | ||
deserialization methods using :func:`torch.serialization.register_package`. | ||
Args: | ||
f: a file-like object (has to implement :meth:`read`, :meth:`readline`, :meth:`tell`, and :meth:`seek`), | ||
or a string or os.PathLike object containing a file name | ||
map_location: a function, :class:`torch.device`, string or a dict specifying how to remap storage | ||
locations | ||
pickle_module: module used for unpickling metadata and objects (has to | ||
match the :attr:`pickle_module` used to serialize file) | ||
weights_only: Indicates whether unpickler should be restricted to | ||
loading only tensors, primitive types and dictionaries | ||
pickle_load_args: (Python 3 only) optional keyword arguments passed over to | ||
:func:`pickle_module.load` and :func:`pickle_module.Unpickler`, e.g., | ||
:attr:`errors=...`. | ||
.. warning:: | ||
:func:`torch.load()` unless `weights_only` parameter is set to `True`, | ||
uses ``pickle`` module implicitly, which is known to be insecure. | ||
It is possible to construct malicious pickle data which will execute arbitrary code | ||
during unpickling. Never load data that could have come from an untrusted | ||
source in an unsafe mode, or that could have been tampered with. **Only load data you trust**. | ||
.. note:: | ||
When you call :func:`torch.load()` on a file which contains GPU tensors, those tensors | ||
will be loaded to GPU by default. You can call ``torch.load(.., map_location='cpu')`` | ||
and then :meth:`load_state_dict` to avoid GPU RAM surge when loading a model checkpoint. | ||
.. note:: | ||
By default, we decode byte strings as ``utf-8``. This is to avoid a common error | ||
case ``UnicodeDecodeError: 'ascii' codec can't decode byte 0x...`` | ||
when loading files saved by Python 2 in Python 3. If this default | ||
is incorrect, you may use an extra :attr:`encoding` keyword argument to specify how | ||
these objects should be loaded, e.g., :attr:`encoding='latin1'` decodes them | ||
to strings using ``latin1`` encoding, and :attr:`encoding='bytes'` keeps them | ||
as byte arrays which can be decoded later with ``byte_array.decode(...)``. | ||
Example: | ||
>>> # xdoctest: +SKIP("undefined filepaths") | ||
>>> torch.load('tensors.pt') | ||
# Load all tensors onto the CPU | ||
>>> torch.load('tensors.pt', map_location=torch.device('cpu')) | ||
# Load all tensors onto the CPU, using a function | ||
>>> torch.load('tensors.pt', map_location=lambda storage, loc: storage) | ||
# Load all tensors onto GPU 1 | ||
>>> torch.load('tensors.pt', map_location=lambda storage, loc: storage.cuda(1)) | ||
# Map tensors from GPU 1 to GPU 0 | ||
>>> torch.load('tensors.pt', map_location={'cuda:1': 'cuda:0'}) | ||
# Load tensor from io.BytesIO object | ||
>>> with open('tensor.pt', 'rb') as f: | ||
... buffer = io.BytesIO(f.read()) | ||
>>> torch.load(buffer) | ||
# Load a module with 'ascii' encoding for unpickling | ||
>>> torch.load('module.pt', encoding='ascii') | ||
""" | ||
torch._C._log_api_usage_once("torch.load") | ||
# Add ability to force safe only weight loads via environment variable | ||
if os.getenv("TORCH_FORCE_WEIGHTS_ONLY_LOAD", "0").lower() in ["1", "y", "yes", "true"]: # pragma: no cover | ||
weights_only = True | ||
|
||
if weights_only: # pragma: no cover | ||
if pickle_module is not None: | ||
raise RuntimeError("Can not safely load weights when explicit pickle_module is specified") | ||
else: | ||
if pickle_module is None: | ||
pickle_module = pickle | ||
|
||
if "encoding" not in pickle_load_args.keys(): | ||
pickle_load_args["encoding"] = "utf-8" | ||
|
||
with _open_file_like(f, "rb") as opened_file: | ||
if _is_zipfile(opened_file): | ||
# The zipfile reader is going to advance the current file position. | ||
# If we want to actually tail call to torch.jit.load, we need to | ||
# reset back to the original position. | ||
orig_position = opened_file.tell() | ||
with _open_zipfile_reader(opened_file) as opened_zipfile: | ||
if _is_torchscript_zip(opened_zipfile): # pragma: no cover | ||
warnings.warn( | ||
"'torch.load' received a zip file that looks like a TorchScript archive" | ||
" dispatching to 'torch.jit.load' (call 'torch.jit.load' directly to" | ||
" silence this warning)", | ||
UserWarning, | ||
) | ||
opened_file.seek(orig_position) | ||
return torch.jit.load(opened_file, map_location=map_location) | ||
return _load(opened_zipfile, tensor_name, prefix, map_location, pickle_module, **pickle_load_args) |
Oops, something went wrong.