import collections  # needed so that ordereddict_eval() can resolve "collections.OrderedDict"
import csv
import logging
import numbers
import os
import subprocess
import time
from functools import reduce
from pathlib import Path
from time import sleep
from typing import Sequence, List, Dict, Union, Optional

from hydra.utils import to_absolute_path
from pandas.io.common import is_url
from pytorch_lightning.utilities.rank_zero import rank_zero_only
import rich.syntax
import rich.tree
from omegaconf import DictConfig, OmegaConf, ListConfig
# torch should be imported early. Unclear issue, mentioned here: https://github.com/pytorch/pytorch/issues/2575
import torch
from torchvision import models
import numpy as np
import requests
from urllib.parse import urlparse
# These two import statements prevent an exception when using eval(metadata) in SegmentationDataset()'s __init__()
from rasterio.crs import CRS
from affine import Affine
from torchvision.datasets.utils import download_url

from utils.logger import get_logger

# Set up the module logger
log = get_logger(__name__)  # needs to be distinct from the root "logging" logger in this case


class Interpolate(torch.nn.Module):
    def __init__(self, mode, scale_factor):
        super(Interpolate, self).__init__()
        self.interp = torch.nn.functional.interpolate
        self.scale_factor = scale_factor
        self.mode = mode

    def forward(self, x):
        x = self.interp(x, scale_factor=self.scale_factor, mode=self.mode, align_corners=False)
        return x


def get_device_ids(
        number_requested: int,
        max_used_ram_perc: int = 25,
        max_used_perc: int = 15):
    """
    Function to check which GPU devices are available and unused.
    :param number_requested: (int) Number of devices requested.
    :param max_used_ram_perc: (int) If RAM usage of a detected GPU exceeds this percentage, it will be ignored.
    :param max_used_perc: (int) If a GPU's utilization exceeds this percentage, it will be ignored.
    :return: (dict) Unused GPU devices, keyed by device index.
    """
    lst_free_devices = {}
    if not number_requested:
        log.warning("No GPUs requested. This process will run on CPU")
        return lst_free_devices
    if not torch.cuda.is_available():
        log.warning(f'\nRequested {number_requested} GPUs, but no CUDA devices found. This process will run on CPU')
        return lst_free_devices
    try:
        torch.cuda.init()
        if number_requested > 0:
            device_count = torch.cuda.device_count()
            for i in range(device_count):
                res, mem = gpu_stats(i)
                used_ram = mem['used'] / (1024 ** 2)
                max_ram = mem['total'] / (1024 ** 2)
                used_ram_perc = used_ram / max_ram * 100
                log.info(f"\nGPU RAM used: {used_ram_perc:.0f}% ({used_ram:.0f}/{max_ram:.0f} MiB)\n"
                         f"GPU % used: {res['gpu']}")
                if used_ram_perc < max_used_ram_perc:
                    if res['gpu'] < max_used_perc:
                        lst_free_devices[i] = {'used_ram_at_init': used_ram, 'max_ram': max_ram}
                    else:
                        log.warning(f"\nGpu #{i} filtered out based on usage % threshold.\n"
                                    f"Current % usage: {res['gpu']}\n"
                                    f"Max % usage allowed by user: {max_used_perc}.")
                else:
                    log.warning(f'\nGpu #{i} filtered out based on RAM threshold.\n'
                                f'Current RAM usage: {used_ram:.0f}/{max_ram:.0f} MiB\n'
                                f'Max used RAM allowed by user: {max_used_ram_perc}%.')
                if len(lst_free_devices.keys()) == number_requested:
                    break
            if len(lst_free_devices.keys()) < number_requested:
                log.warning(f"\nYou requested {number_requested} devices. {device_count} devices are available and "
                            f"other processes are using {device_count - len(lst_free_devices.keys())} device(s).")
        else:
            return lst_free_devices
    except NameError as error:
        # log.critical() returns None, so it cannot be the operand of "raise": log first, then re-raise
        log.critical(f"\n{error}. Make sure that the NVIDIA management library (pynvml) is installed and running.")
        raise
    log.info(f'\nGPU devices available: {lst_free_devices}')
    return lst_free_devices


def gpu_stats(device=0):
    """
    Provides GPU utilization (%) and RAM usage
    :return: (dict, dict) GPU utilization and GPU memory info
    """
    torch.cuda.init()
    res = {'gpu': torch.cuda.utilization(device)}
    free, total = torch.cuda.mem_get_info(device)  # returns (free, total) memory, in bytes
    mem = {
        'used': total - free,
        'total': total
    }
    return res, mem


def set_device(gpu_devices_dict: dict = {}):
    """
    From dictionary of available devices, sets the device to be used
    @param gpu_devices_dict: dictionary containing info on GPU devices as returned by get_device_ids()
    @return: torch.device
    """
    if gpu_devices_dict:
        log.info(f"\nCuda devices available: {gpu_devices_dict}.\nUsing {list(gpu_devices_dict.keys())[0]}\n\n")
        device = torch.device(f'cuda:{list(gpu_devices_dict.keys())[0]}')  # first free device found
    else:
        log.warning("\nNo Cuda device available. This process will only run on CPU")
        device = torch.device('cpu')
    try:
        models.resnet18().to(device)  # test device with a small model
    except (RuntimeError, AssertionError):  # HPC: when device 0 not available. Error: Cuda invalid device ordinal.
        log.warning(f"\nUnable to use device {device}. Trying default device 'cuda' instead")
        device = torch.device('cuda')
    return device
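

# Illustration (not part of the original module): a typical device-selection flow that
# chains get_device_ids() and set_device(). A minimal sketch; only meaningful on a
# machine with a CUDA-enabled build of torch.
def _example_select_device():
    free_gpus = get_device_ids(number_requested=1)  # {} if no free GPU is found
    return set_device(free_gpus)  # torch.device('cuda:N') if a free GPU was found, else cpu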


def get_key_def(key, config, default=None, expected_type=None, to_path: bool = False,
                validate_path_exists: bool = False, wildcard=None):
    """Returns a value given a dictionary key, or the default value if it cannot be found.
    :param key: key in dictionary (e.g. generated from .yaml)
    :param config: (dict) dictionary containing keys corresponding to parameters used in script
    :param default: default value assigned if no value found with provided key
    :param expected_type: (type) type of the expected variable.
    :param to_path: (bool) if True, parameter will be converted to a pathlib.Path object (warns if it cannot be converted)
    :param validate_path_exists: (bool) if True, checks that the path exists
    :param wildcard: suffix wildcard string (ex. '*.pth.tar')
    :return:
    """
    val = default
    if not config:
        pass
    elif isinstance(key, (list, ListConfig)):
        if len(key) <= 1:  # expects a list of length greater than 1 to search a dictionary recursively
            raise ValueError("Must provide at least two valid keys to search recursively in dictionary")
        for k in key:  # iterate through items in list
            if k in config:  # if item is a key in config, go one level deeper if it maps to a dictionary, else set value
                if isinstance(config[k], (dict, DictConfig)):
                    config = config[k]
                else:
                    val = config[k]
    else:
        if key not in config or config[key] is None:  # if config exists, but key is not in it
            pass
        else:
            val = config[key] if config[key] != 'None' else None
    if not val:  # skips the checks below if val is None (or otherwise falsy)
        logging.error(f"The key {key} has a None value.")
        return val
    if is_url(val):
        logging.info(f"\nProvided path is a url. Cannot validate its existence nor convert to a Path object. Got:"
                     f"\n{val}")
        validate_path_exists = False
    elif to_path:
        try:
            val = Path(to_absolute_path(val))
        except TypeError:
            logging.error(f"Couldn't convert value {val} to a pathlib.Path object")
    expected_type = Path if expected_type == str else expected_type  # allows both "str" and "Path" as expected_type
    if validate_path_exists:
        if not isinstance(val, Path):
            val = Path(to_absolute_path(val))
        if val.is_dir() and wildcard:  # globs through directory and picks the first item matching the wildcard
            items = [item for item in val.glob(wildcard)]
            if items:
                val = items[0]
            else:
                logging.critical(f"Couldn't find any item in directory: {val} matching wildcard: {wildcard}")
                raise FileNotFoundError()
        if not val.exists():
            logging.critical(f"Couldn't locate path: {val}.\nProvided key: {key}")
            raise FileNotFoundError()
    if expected_type and val is not False:
        if not isinstance(val, expected_type):
            raise TypeError(f"{val} is of type {type(val)}, expected {expected_type}")
    return val
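

# Illustration (not part of the original module): reading flat and nested keys from an
# OmegaConf config with get_key_def(). A minimal sketch with a hypothetical config.
def _example_get_key_def():
    cfg = OmegaConf.create({'training': {'batch_size': 8}})
    batch_size = get_key_def(['training', 'batch_size'], cfg, default=4, expected_type=int)  # -> 8
    num_workers = get_key_def('num_workers', cfg, default=0)  # key absent -> falls back to 0
    return batch_size, num_workers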


def minmax_scale(img, scale_range=(0, 1), orig_range=(0, 255)):
    """Scale image to desired range
    Args:
        img (tensor or ndarray): Image to be scaled
        scale_range (tuple, optional): Desired range of transformed data, (0, 1) or (-1, 1). Defaults to (0, 1).
        orig_range (tuple, optional): Original range of input data. Defaults to (0, 255).
    Returns:
        np.ndarray or tensor: Scaled image
    """
    assert scale_range in [(0, 1), (-1, 1)], 'expects scale_range as (0, 1) or (-1, 1)'
    assert orig_range[1] > orig_range[0], 'invalid orig_range'
    assert isinstance(img, (np.ndarray, torch.Tensor)), 'img should be a numpy array or a PyTorch tensor'
    if isinstance(img, np.ndarray):
        img = img.astype(np.float32)
    elif isinstance(img, torch.Tensor):
        img = img.float()
    scale_img = (img - orig_range[0]) / (orig_range[1] - orig_range[0])
    if scale_range == (-1, 1):
        scale_img = 2.0 * scale_img - 1.0
    return scale_img


def unscale(img, float_range=(0, 1), orig_range=(0, 255)):
    """Unscale the image from a given float range to the original range.
    Args:
        img (np.ndarray or torch.Tensor): Image to be unscaled.
        float_range (tuple, optional): Float range of the scaled image. Defaults to (0, 1).
        orig_range (tuple, optional): Original range of the image. Defaults to (0, 255).
    Returns:
        np.ndarray or torch.Tensor: Unscaled image.
    """
    f_r = float_range[1] - float_range[0]
    o_r = orig_range[1] - orig_range[0]
    return (o_r * (img - float_range[0]) / f_r) + orig_range[0]
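

# Illustration (not part of the original module): round-tripping an 8-bit image through
# minmax_scale() and unscale(). A minimal sketch on a random uint8 array.
def _example_scale_roundtrip():
    img = np.random.randint(0, 256, size=(64, 64, 3)).astype(np.uint8)
    scaled = minmax_scale(img, scale_range=(-1, 1), orig_range=(0, 255))  # float32 in [-1, 1]
    restored = unscale(scaled, float_range=(-1, 1), orig_range=(0, 255))  # back to [0, 255]
    assert np.allclose(img, restored.round())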


def pad(img, padding, fill=0):
    r"""Pad the given ndarray on all sides with specified padding mode and fill value.
    Adapted from https://github.com/pytorch/vision/blob/master/torchvision/transforms/functional.py#L255
    Args:
        img (ndarray): Image to be padded.
        padding (int or tuple): Padding on each border. If a single int is provided this
            is used to pad all borders. If a tuple of length 2 is provided this is the padding
            on left/right and top/bottom respectively. If a tuple of length 4 is provided
            this is the padding for the left, top, right and bottom borders respectively.
        fill: Pixel fill value for constant fill. Default is 0. If a tuple of
            length 3, it is used to fill R, G, B channels respectively.
            This value is only used when the padding_mode is constant.
    Returns:
        ndarray: Padded image.
    """
    if not isinstance(padding, (numbers.Number, tuple)):
        raise TypeError('Got inappropriate padding arg')
    if not isinstance(fill, (numbers.Number, str, tuple)):
        raise TypeError('Got inappropriate fill arg')
    if isinstance(padding, Sequence) and len(padding) not in [2, 4]:
        raise ValueError(f"Padding must be an int or a 2 or 4 element tuple, not a {len(padding)} element tuple")
    if isinstance(padding, int):
        pad_left = pad_right = pad_top = pad_bottom = padding
    if isinstance(padding, Sequence) and len(padding) == 2:
        pad_left = pad_right = padding[0]
        pad_top = pad_bottom = padding[1]
    if isinstance(padding, Sequence) and len(padding) == 4:
        pad_left = padding[0]
        pad_top = padding[1]
        pad_right = padding[2]
        pad_bottom = padding[3]
    # RGB image
    if len(img.shape) == 3:
        img = np.pad(img, ((pad_top, pad_bottom), (pad_left, pad_right), (0, 0)), mode='constant',
                     constant_values=fill)
    # Grayscale image
    elif len(img.shape) == 2:
        img = np.pad(img, ((pad_top, pad_bottom), (pad_left, pad_right)), mode='constant', constant_values=fill)
    return img


def pad_diff(actual_height, actual_width, desired_height, desired_width):
    """Returns the padding needed to bring an array up to the desired sample size, as (left, top, right, bottom)"""
    h_diff = desired_height - actual_height
    w_diff = desired_width - actual_width
    padding = (0, 0, w_diff, h_diff)  # left, top, right, bottom
    return padding
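

# Illustration (not part of the original module): padding an edge chip up to a fixed
# sample size by combining pad_diff() and pad(). A minimal sketch with hypothetical sizes.
def _example_pad_to_sample_size():
    chip = np.ones((200, 180), dtype=np.uint8)  # smaller than the desired 256x256 sample
    padding = pad_diff(*chip.shape, desired_height=256, desired_width=256)  # (left, top, right, bottom)
    padded = pad(chip, padding, fill=0)
    assert padded.shape == (256, 256)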


def unnormalize(input_img, mean, std):
    """
    :param input_img: (numpy array) Image to be "unnormalized"
    :param mean: (list of mean values) for each channel
    :param std: (list of std values) for each channel
    :return: (numpy array) "Unnormalized" image
    """
    return (input_img * std) + mean


def checkpoint_url_download(url: str):
    mime_type = ('application/tar', 'application/x-tar', 'application/x-gtar',
                 'multipart/x-tar', 'application/x-compress', 'application/x-compressed')
    try:
        response = requests.head(url)
        if response.headers.get('content-type') in mime_type:
            working_folder = Path.cwd().joinpath('inference_out')
            Path.mkdir(working_folder, parents=True, exist_ok=True)
            checkpoint_path = working_folder.joinpath(Path(url).name)
            r = requests.get(url)
            checkpoint_path.write_bytes(r.content)
            log.info(checkpoint_path)
            return checkpoint_path
        else:
            raise SystemExit('Invalid Url, checkpoint content not detected')
    except requests.exceptions.RequestException as e:
        raise SystemExit(e)


def read_csv(csv_file_name: str) -> List:
    """
    Open csv file and parse it, returning a list of dictionaries with keys:
    - "tif": path to a single image
    - "gpkg": path to a single ground truth file
    - "split": (str) "trn" or "tst"
    - "aoi_id": (str) a string id for the area of interest
    @param csv_file_name:
        path to csv file containing list of input data with expected columns
        (without header): imagery, ground truth, dataset[, aoi id]
    """
    list_values = []
    with open(csv_file_name, 'r') as f:
        reader = csv.reader(f)
        row_lengths_set = set()
        for row in reader:
            row_lengths_set.update([len(row)])
            if ";" in row[0]:
                raise TypeError("Elements in rows should be delimited with comma, not semicolon.")
            if not len(row_lengths_set) == 1:
                raise ValueError(f"Rows in csv should be of same length. Got rows with length: {row_lengths_set}")
            row = [str(i) or None for i in row]  # replace empty strings with None
            row.extend([None] * (4 - len(row)))  # fill row with None values to obtain a row of length == 4
            # Convert relative paths to absolute with hydra's util to_absolute_path()
            row[0] = to_absolute_path(row[0]) if not is_url(row[0]) else row[0]
            try:
                row[1] = str(to_absolute_path(row[1]) if not is_url(row[1]) else row[1])
            except TypeError:
                row[1] = None
            # save all values
            list_values.append(
                {'tif': str(row[0]), 'gpkg': row[1], 'split': row[2], 'aoi_id': row[3]})
    try:
        # Try sorting according to dataset name (i.e. group "train", "val" and "test" rows together)
        list_values = sorted(list_values, key=lambda k: k['split'])
    except TypeError:
        log.warning('Unable to sort csv rows')
    return list_values
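

# Illustration (not part of the original module): the headerless 4-column layout that
# read_csv() expects. A minimal sketch that writes and parses a hypothetical csv.
def _example_read_csv(csv_path='inputs.csv'):
    with open(csv_path, 'w', newline='') as f:
        f.write("images/aoi1.tif,labels/aoi1.gpkg,trn,aoi1\n"
                "images/aoi2.tif,labels/aoi2.gpkg,tst,aoi2\n")
    # -> [{'tif': '.../images/aoi1.tif', 'gpkg': '.../labels/aoi1.gpkg', 'split': 'trn', 'aoi_id': 'aoi1'}, ...]
    return read_csv(csv_path)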


def read_csv_change_detection(csv_file_name: str) -> dict:
    """
    Open csv file and parse it, returning, for each epoch (t1 and t2), a list
    of dictionaries with keys:
    - "tif": path to a single image.
    - "gpkg": path to a single ground truth file.
    - "split": (str) "trn" or "tst"
    - "aoi_id": (str) a string id for the area of interest
    Args:
        csv_file_name (str): path to csv file containing list of input data
            with expected columns (imagery_t1, ground_truth_t1,
            imagery_t2, ground_truth_t2, dataset[, aoi id]).
    Raises:
        TypeError: if a semicolon is used instead of a comma as delimiter.
        ValueError: if lines contain different numbers of items.
    Returns:
        dict: dictionary of two lists of dictionaries with the content of the csv.
    """
    list_values = {'t1': [], 't2': []}
    with open(csv_file_name, 'r') as f:
        reader = csv.reader(f)
        row_lengths_set = set()
        for row in reader:
            row_lengths_set.update([len(row)])
            if ";" in row[0]:
                raise TypeError(
                    "Elements in rows should be delimited with comma, "
                    "not semicolon."
                )
            if not len(row_lengths_set) == 1:
                raise ValueError(
                    f"Rows in csv should be of same length. "
                    f"Got rows with length: {row_lengths_set}"
                )
            # replace empty strings with None
            row = [str(i) or None for i in row]
            # fill row with None values to obtain a row of length == 6
            row.extend([None] * (6 - len(row)))
            # Convert relative paths to absolute with hydra's util
            # to_absolute_path() function
            row[0] = to_absolute_path(row[0]) if not is_url(row[0]) else row[0]
            row[2] = to_absolute_path(row[2]) if not is_url(row[2]) else row[2]
            try:
                row[1] = str(
                    to_absolute_path(row[1]) if not is_url(row[1]) else row[1]
                )
            except TypeError:
                row[1] = None
            try:
                row[3] = str(
                    to_absolute_path(row[3]) if not is_url(row[3]) else row[3]
                )
            except TypeError:
                row[3] = None
            # save all values
            list_values['t1'].append({
                'tif': str(row[0]), 'gpkg': row[1],
                'split': row[4], 'aoi_id': row[5]
            })
            list_values['t2'].append({
                'tif': str(row[2]), 'gpkg': row[3],
                'split': row[4], 'aoi_id': row[5]
            })
    try:
        # Try sorting according to dataset name
        # (i.e. group "train", "val" and "test" rows together)
        list_values['t1'] = sorted(list_values['t1'], key=lambda k: k['split'])
        list_values['t2'] = sorted(list_values['t2'], key=lambda k: k['split'])
    except TypeError:
        log.warning('Unable to sort csv rows')
    # TODO add test that verifies the number of images is the same at t1 and t2
    return list_values


def add_metadata_from_raster_to_sample(sat_img_arr: np.ndarray,
                                       raster_handle,
                                       raster_info: dict = None
                                       ) -> dict:
    """
    :param sat_img_arr: source image as array (opened with rasterio.read)
    :param raster_handle: rasterio dataset handle the array was read from
    :param raster_info: info from raster as read with read_csv (except at inference)
    :return: Returns a metadata dictionary populated with info from source raster, including original csv line and
             histogram.
    """
    metadata_dict = {'name': raster_handle.name, 'csv_info': raster_info, 'source_raster_bincount': {}}
    assert 'dtype' in raster_handle.meta.keys(), "\"dtype\" could not be found in source image metadata"
    metadata_dict.update(raster_handle.meta)
    if not metadata_dict['dtype'] in ["uint8", "uint16"]:
        logging.warning(f"Datatype should be \"uint8\" or \"uint16\". Got \"{metadata_dict['dtype']}\". ")
        if sat_img_arr.min() >= 0 and sat_img_arr.max() <= 255:
            metadata_dict['dtype'] = "uint8"
        elif sat_img_arr.min() >= 0 and sat_img_arr.max() <= 65535:
            metadata_dict['dtype'] = "uint16"
        else:
            raise NotImplementedError(f"Min and max values of array ({[sat_img_arr.min(), sat_img_arr.max()]}) "
                                      f"are not contained in 8 bit nor 16 bit range. Datatype cannot be overwritten.")
    # Save bin count (i.e. histogram) to metadata
    assert isinstance(sat_img_arr, np.ndarray) and len(sat_img_arr.shape) == 3, "Array should be 3-dimensional"
    for band_index in range(sat_img_arr.shape[2]):
        band = sat_img_arr[..., band_index]
        # stored as a list so per-value order is preserved (a set would scramble the histogram)
        metadata_dict['source_raster_bincount'][f'band{band_index}'] = list(np.bincount(band.flatten()))
    return metadata_dict
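

# Illustration (not part of the original module): attaching raster metadata to a sample.
# A sketch with a hypothetical GeoTIFF path; requires rasterio and a readable image.
def _example_metadata_from_raster(tif_path='image.tif'):
    import rasterio
    with rasterio.open(tif_path) as raster_handle:
        sat_img_arr = np.transpose(raster_handle.read(), (1, 2, 0))  # CHW -> HWC, as the function expects
        return add_metadata_from_raster_to_sample(sat_img_arr, raster_handle, raster_info=None)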


def get_git_hash():
    """
    Get git hash during execution of python script
    :return: (str) hash code for the current version of geo-deep-learning. If necessary, the code associated with this
             hash can be found with the following url: https://github.com/<owner>/<project>/commit/<hash>, aka
             https://github.com/NRCan/geo-deep-learning/commit/<hash>
    """
    command = 'git rev-parse --short HEAD'
    subproc = subprocess.run(command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    git_hash = str(subproc.stdout, "utf-8").replace("\n", "")
    # when the code is not executed from a git repo, the subprocess returns code 128. This has been tested.
    # Reference: https://stackoverflow.com/questions/58575970/subprocess-call-with-exit-status-128
    if subproc.returncode == 128:
        log.warning('No git repo associated to this code.')
        return None
    return git_hash


def ordereddict_eval(str_to_eval: str):
    """
    Small utility to successfully evaluate an ordereddict object that was converted to str by the repr() function.
    :param str_to_eval: (str) string to prepare for evaluation with eval()
    """
    try:
        if isinstance(str_to_eval, bytes):
            str_to_eval = str_to_eval.decode('UTF-8')
        # Replace the "ordereddict" repr name with the importable "collections.OrderedDict"
        str_to_eval = str_to_eval.replace("ordereddict", "collections.OrderedDict")
        return eval(str_to_eval)
    except Exception:
        log.exception(f'Object of type \"{type(str_to_eval)}\" cannot be evaluated. Problems may occur.')
        return str_to_eval
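

# Illustration (not part of the original module): recovering an OrderedDict serialized
# with repr(), as stored in dataset metadata. A minimal sketch.
def _example_ordereddict_eval():
    serialized = "ordereddict([('driver', 'GTiff'), ('count', 3)])"
    return ordereddict_eval(serialized)  # -> OrderedDict([('driver', 'GTiff'), ('count', 3)])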


def getpath(d, path):
    """
    Fetch a value from a nested dict or DictConfig using a dot-separated path (e.g. 'general.task').
    """
    return reduce(lambda acc, i: acc[i], path.split('.'), d)
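

# Illustration (not part of the original module): dotted-path lookup with getpath(),
# the helper print_config() relies on. A minimal sketch.
def _example_getpath():
    cfg = {'general': {'task': 'segmentation'}}
    return getpath(cfg, 'general.task')  # -> 'segmentation'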


@rank_zero_only
def print_config(
        config: DictConfig,
        fields: Sequence[str] = (
            "general.task",
            "mode",
            "loss",
            "dataset",
            "general.work_dir",
            "general.config_name",
            "general.config_path",
            "general.project_name",
            "general.workspace",
        ),
        resolve: bool = True,
) -> None:
    """
    Prints content of DictConfig using Rich library and its tree structure.
    Args:
        config (DictConfig): Configuration composed by Hydra.
        fields (Sequence[str], optional): Determines which main fields from config will
            be printed and in what order.
        resolve (bool, optional): Whether to resolve reference fields of DictConfig.
    """
    style = "dim"
    tree = rich.tree.Tree("CONFIG", style=style, guide_style=style)
    save_git_hash = tree.add('Git hash', style=style, guide_style=style)
    save_git_hash.add(str(getpath(config, 'general.git_hash')))
    save_dir = tree.add('Saving directory', style=style, guide_style=style)
    save_dir.add(os.getcwd())
    if config.get('mode') == 'tiling':
        fields += (
            "general.raw_data_dir",
            "general.raw_data_csv",
            "general.tiling_data_dir",
        )
    elif config.get('mode') == 'train':
        fields += (
            "model",
            "training",
            "optimizer",
            "callbacks",
            "scheduler",
            "augmentation",
            "general.tiling_data_dir",
            "general.save_weights_dir",
        )
    elif config.get('mode') == 'inference':
        fields += (
            "inference",
            "model",
            "general.tiling_data_dir",
        )
    if config.get('tracker'):
        fields += ("tracker",)
    for field in fields:
        branch = tree.add(field, style=style, guide_style=style)
        config_section = getpath(config, field)
        branch_content = str(config_section)
        if isinstance(config_section, DictConfig):
            branch_content = OmegaConf.to_yaml(config_section, resolve=resolve)
        branch.add(rich.syntax.Syntax(branch_content, "yaml", word_wrap=True))
    if config.get('debug'):
        rich.print(tree, flush=False)
    with open("run_config.config", "w") as fp:
        rich.print(tree, file=fp)


def is_inference_compatible(cfg: Union[dict, DictConfig]):
    """Checks whether a configuration dictionary contains a config structure compatible with current inference script"""
    try:
        # don't update if already a recent checkpoint
        # checks if major keys for current config exist, especially those that have changed over time
        cfg['params']['augmentation']
        cfg['params']['dataset']['classes_dict']
        cfg['params']['dataset']['bands']
        cfg['params']['model']['_target_']
        # model state dicts
        cfg['model_state_dict']
        return True
    except KeyError as e:
        logging.debug(e)
        return False


def update_gdl_checkpoint(checkpoint: Union[dict, DictConfig]) -> Dict:
    """
    Utility to update model checkpoints from older versions of GDL to the current version.
    NB: The purpose of this utility is ONLY to allow the use of "old" models in the current inference script.
    Mostly inference-relevant parameters are updated.
    @param checkpoint:
        Dictionary containing weights, optimizer state and saved configuration params from training
    @return: updated checkpoint dictionary
    """
    # covers gdl checkpoints pre-hydra (<=2.0.0)
    bands = {'red': 'R', 'green': 'G', 'blue': 'B', 'nir': 'N'}
    old2new = {
        'manet_pretrained': {
            '_target_': 'segmentation_models_pytorch.MAnet', 'encoder_name': 'resnext50_32x4d',
            'encoder_weights': 'imagenet'
        },
        'unet_pretrained': {
            '_target_': 'segmentation_models_pytorch.Unet', 'encoder_name': 'resnext50_32x4d',
            'encoder_depth': 4, 'encoder_weights': 'imagenet', 'decoder_channels': [256, 128, 64, 32]
        },
        'unet': {
            '_target_': 'models.unet.UNet', 'dropout': False, 'prob': False
        },
        'unet_small': {
            '_target_': 'models.unet.UNetSmall', 'dropout': False, 'prob': False
        },
        'deeplabv3_pretrained': {
            '_target_': 'segmentation_models_pytorch.DeepLabV3', 'encoder_name': 'resnet101',
            'encoder_weights': 'imagenet'
        },
        'deeplabv3+_pretrained': {
            '_target_': 'segmentation_models_pytorch.DeepLabV3Plus', 'encoder_name': 'resnext50_32x4d',
            'encoder_weights': 'imagenet'
        },
    }
    if not is_inference_compatible(checkpoint):
        # covers gdl checkpoints from version <= 2.0.1
        if 'model' in checkpoint.keys():
            checkpoint['model_state_dict'] = checkpoint['model']
            del checkpoint['model']
        try:
            num_classes_ckpt = get_key_def('num_classes', checkpoint['params']['global'], expected_type=int)
            num_bands_ckpt = get_key_def('number_of_bands', checkpoint['params']['global'], expected_type=int)
            model_name = get_key_def('model_name', checkpoint['params']['global'], expected_type=str)
        except KeyError as e:
            logging.critical(f"\nCouldn't update checkpoint parameters"
                             f"\nError {type(e)}: {e}")
            raise e
        try:
            model_ckpt = old2new[model_name]
        except KeyError as e:
            logging.critical(f"\nCouldn't locate yaml configuration for model architecture {model_name} as found "
                             f"in provided checkpoint. Name of yaml may have changed."
                             f"\nError {type(e)}: {e}")
            raise e
        # For GDL pre-v2.0.2
        # Move transformation/augmentation hyperparameters
        if "augmentation" not in checkpoint["params"].keys():
            checkpoint["params"]["augmentation"] = {
                'normalization': {'mean': [], 'std': []},
                'clahe_enhance_clip_limit': None
            }
        try:
            means_ckpt = checkpoint['params']['training']['normalization']['mean']
            stds_ckpt = checkpoint['params']['training']['normalization']['std']
            scale_ckpt = checkpoint['params']['global']['scale_data']
            # clahe_enhance was never officially added to GDL, so it defaults to None if not present
            clahe_enhance = get_key_def('clahe_enhance', checkpoint['params']['training']['augmentation'],
                                        default=None)
        except KeyError as e:  # if KeyError on old keys, assume the checkpoint is already up to date
            logging.debug(e)
            return checkpoint
        checkpoint["params"]["augmentation"]["normalization"]["mean"] = means_ckpt
        checkpoint["params"]["augmentation"]["normalization"]["std"] = stds_ckpt
        checkpoint["params"]["augmentation"]["scale_data"] = scale_ckpt
        checkpoint["params"]["augmentation"]["clahe_enhance_clip_limit"] = 0.1 if clahe_enhance is True else None
        checkpoint['params'].update({'model': model_ckpt})
        checkpoint['params'].update({
            'dataset': {
                'bands': [list(bands.keys())[i] for i in range(num_bands_ckpt)],
                "classes_dict": {f"class{i + 1}": i + 1 for i in range(num_classes_ckpt)}
                # Some manual updates may be necessary when using old models, e.g.:
                # 'bands': ['nir', 'red', 'green'],
                # "classes_dict": {"FORE": 1},
            }
        })
    return checkpoint
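

# Illustration (not part of the original module): upgrading an old checkpoint before
# inference. A sketch with a hypothetical checkpoint path.
def _example_load_old_checkpoint(ckpt_path='old_model.pth.tar'):
    checkpoint = torch.load(ckpt_path, map_location='cpu')
    if not is_inference_compatible(checkpoint):
        checkpoint = update_gdl_checkpoint(checkpoint)
    return checkpoint['model_state_dict']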


def wait_while_modif(fpath: Union[str, Path], sleep_secs: int = 10, timeout: int = 1800) -> None:
    """Wait until a file's size stops changing (e.g. while another process finishes downloading it).
    fpath (str or Path): Path to file potentially being modified
    sleep_secs (int, optional): Seconds to wait before re-checking the size of file to be downloaded
    timeout (int, optional): Maximum amount of time (seconds) to check if file size has changed
    """
    timeout_time = time.time() + timeout
    if Path(fpath).is_file():
        while True:
            initial_size = os.stat(fpath).st_size
            sleep(sleep_secs)
            final_size = os.stat(fpath).st_size
            if time.time() > timeout_time:
                raise TimeoutError(f"File has been modified for more than {timeout} seconds. \nFile: {fpath}")
            # if the initial size equals the final size, the file has most likely stopped changing
            # (unless both reads returned 0 bytes)
            elif initial_size == final_size:
                logging.debug(f"File has not changed. \nInitial size: {initial_size}\nFinal size: {final_size}")
                break
            logging.debug(f"File has changed. \nInitial size: {initial_size}\nFinal size: {final_size}")
    else:
        logging.debug(f"File doesn't exist: {fpath}")


def download_url_wcheck(
        url: str, root: str, filename: Optional[str] = None, md5: Optional[str] = None, max_redirect_hops: int = 3,
        sleep_secs: int = 10, timeout: int = 1800
) -> None:
    """Download a file from a url and place it in root. If the file to be downloaded exists, but its size varies
    within a certain period, wait for its size to remain stable.
    Args:
        url (str): URL to download file from
        root (str): Directory to place downloaded file in
        filename (str, optional): Name to save the file under. If None, use the basename of the URL
        md5 (str, optional): MD5 checksum of the download. If None, do not check
        max_redirect_hops (int, optional): Maximum number of redirect hops allowed
        sleep_secs (int, optional): Seconds to wait before re-checking the size of file to be downloaded
        timeout (int, optional): Maximum amount of time (seconds) to check if file size has changed
    """
    if not filename:
        filename = os.path.basename(urlparse(url).path)  # basename of the URL, as the docstring promises
    fpath = Path(root) / filename
    if fpath.is_file():
        # pass "timeout" as a duration: wait_while_modif() computes its own absolute deadline
        wait_while_modif(fpath=fpath, sleep_secs=sleep_secs, timeout=timeout)
    else:
        download_url(url=url, root=root, filename=filename, md5=md5, max_redirect_hops=max_redirect_hops)


def map_wrapper(x):
    """For multi-threading/multiprocessing pools: calls x[0] with the remaining items of x as arguments"""
    return x[0](*(x[1:]))
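

# Illustration (not part of the original module): map_wrapper() unpacks a
# (callable, *args) tuple, the single-argument form that pool.map() can dispatch.
# A minimal sketch with a thread-backed pool.
def _example_map_wrapper():
    from multiprocessing.dummy import Pool  # thread pool: keeps the sketch simple and picklable-safe
    tasks = [(pow, 2, 3), (pow, 3, 2)]
    with Pool(2) as pool:
        return pool.map(map_wrapper, tasks)  # -> [8, 9]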