Skip to content

Commit

Permalink
update publish script
Browse files Browse the repository at this point in the history
  • Loading branch information
Tau-J committed Mar 9, 2023
1 parent 31b4b54 commit b7b372b
Showing 1 changed file with 26 additions and 14 deletions.
40 changes: 26 additions & 14 deletions tools/misc/publish_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,35 +4,47 @@
from datetime import date

import torch
from mmengine.logging import print_log
from mmengine.utils import digit_version
from mmengine.utils.dl_utils import TORCH_VERSION


def parse_args():
parser = argparse.ArgumentParser(
description='Process a checkpoint to be published')
parser.add_argument('in_file', help='input checkpoint filename')
parser.add_argument('out_file', help='output checkpoint filename')
parser.add_argument(
'--save-keys',
nargs='+',
type=str,
default=['meta', 'state_dict'],
help='keys to save in published checkpoint (default: meta state_dict)')
args = parser.parse_args()
return args


def process_checkpoint(in_file, out_file):
def process_checkpoint(in_file, out_file, save_keys=['meta', 'state_dict']):
checkpoint = torch.load(in_file, map_location='cpu')

# remove optimizer for smaller file size
if 'optimizer' in checkpoint:
del checkpoint['optimizer']
if 'message_hub' in checkpoint:
del checkpoint['message_hub']
if 'ema_state_dict' in checkpoint:
del checkpoint['ema_state_dict']

for key in list(checkpoint['state_dict']):
if key.startswith('data_preprocessor'):
checkpoint['state_dict'].pop(key)
# only keep `meta` and `state_dict` for smaller file size
ckpt_keys = list(checkpoint.keys())
for k in ckpt_keys:
if k not in save_keys:
print_log(
f'Key `{k}` will be removed because it is not in '
f'save_keys. If you want to keep it, '
f'please set --save-keys.',
logger='current')
checkpoint.pop(k, None)

# if it is necessary to remove some sensitive data in checkpoint['meta'],
# add the code here.
torch.save(checkpoint, out_file)

if digit_version(TORCH_VERSION) >= digit_version('1.6.0'):
torch.save(checkpoint, out_file, _use_new_zipfile_serialization=False)
else:
torch.save(checkpoint, out_file)
sha = subprocess.check_output(['sha256sum', out_file]).decode()
if out_file.endswith('.pth'):
out_file_name = out_file[:-4]
Expand All @@ -46,7 +58,7 @@ def process_checkpoint(in_file, out_file):

def main():
args = parse_args()
process_checkpoint(args.in_file, args.out_file)
process_checkpoint(args.in_file, args.out_file, args.save_keys)


if __name__ == '__main__':
Expand Down

0 comments on commit b7b372b

Please sign in to comment.