From 1ac3037a8f1ca4e4c00733dd7e799095a7a7070f Mon Sep 17 00:00:00 2001 From: Jinzhe Zeng Date: Tue, 23 Jan 2024 09:37:56 -0500 Subject: [PATCH 1/3] Move model deviation and ase calculator to `deepmd_utils` ..., so they can benefit from multiple-backend DeepPot. Update docs. Signed-off-by: Jinzhe Zeng --- deepmd/calculator.py | 146 +-------- deepmd/infer/model_devi.py | 518 +------------------------------ deepmd_utils/calculator.py | 144 +++++++++ deepmd_utils/infer/__init__.py | 5 +- deepmd_utils/infer/model_devi.py | 510 ++++++++++++++++++++++++++++++ doc/inference/python.md | 10 +- doc/third-party/ase.md | 2 +- 7 files changed, 677 insertions(+), 658 deletions(-) create mode 100644 deepmd_utils/calculator.py create mode 100644 deepmd_utils/infer/model_devi.py diff --git a/deepmd/calculator.py b/deepmd/calculator.py index b9c0a81006..4dbed51fac 100644 --- a/deepmd/calculator.py +++ b/deepmd/calculator.py @@ -1,144 +1,8 @@ # SPDX-License-Identifier: LGPL-3.0-or-later -"""ASE calculator interface module.""" - -from pathlib import ( - Path, -) -from typing import ( - TYPE_CHECKING, - ClassVar, - Dict, - List, - Optional, - Union, -) - -from ase.calculators.calculator import ( - Calculator, - PropertyNotImplementedError, - all_changes, -) - -from deepmd import ( - DeepPotential, +from deepmd_utils.calculator import ( + DP, ) -if TYPE_CHECKING: - from ase import ( - Atoms, - ) - -__all__ = ["DP"] - - -class DP(Calculator): - """Implementation of ASE deepmd calculator. - - Implemented propertie are `energy`, `forces` and `stress` - - Parameters - ---------- - model : Union[str, Path] - path to the model - label : str, optional - calculator label, by default "DP" - type_dict : Dict[str, int], optional - mapping of element types and their numbers, best left None and the calculator - will infer this information from model, by default None - neighbor_list : ase.neighborlist.NeighborList, optional - The neighbor list object. If None, then build the native neighbor list. 
- - Examples - -------- - Compute potential energy - - >>> from ase import Atoms - >>> from deepmd.calculator import DP - >>> water = Atoms('H2O', - >>> positions=[(0.7601, 1.9270, 1), - >>> (1.9575, 1, 1), - >>> (1., 1., 1.)], - >>> cell=[100, 100, 100], - >>> calculator=DP(model="frozen_model.pb")) - >>> print(water.get_potential_energy()) - >>> print(water.get_forces()) - - Run BFGS structure optimization - - >>> from ase.optimize import BFGS - >>> dyn = BFGS(water) - >>> dyn.run(fmax=1e-6) - >>> print(water.get_positions()) - """ - - name = "DP" - implemented_properties: ClassVar[List[str]] = [ - "energy", - "free_energy", - "forces", - "virial", - "stress", - ] - - def __init__( - self, - model: Union[str, "Path"], - label: str = "DP", - type_dict: Optional[Dict[str, int]] = None, - neighbor_list=None, - **kwargs, - ) -> None: - Calculator.__init__(self, label=label, **kwargs) - self.dp = DeepPotential(str(Path(model).resolve()), neighbor_list=neighbor_list) - if type_dict: - self.type_dict = type_dict - else: - self.type_dict = dict( - zip(self.dp.get_type_map(), range(self.dp.get_ntypes())) - ) - - def calculate( - self, - atoms: Optional["Atoms"] = None, - properties: List[str] = ["energy", "forces", "virial"], - system_changes: List[str] = all_changes, - ): - """Run calculation with deepmd model. 
- - Parameters - ---------- - atoms : Optional[Atoms], optional - atoms object to run the calculation on, by default None - properties : List[str], optional - unused, only for function signature compatibility, - by default ["energy", "forces", "stress"] - system_changes : List[str], optional - unused, only for function signature compatibility, by default all_changes - """ - if atoms is not None: - self.atoms = atoms.copy() - - coord = self.atoms.get_positions().reshape([1, -1]) - if sum(self.atoms.get_pbc()) > 0: - cell = self.atoms.get_cell().reshape([1, -1]) - else: - cell = None - symbols = self.atoms.get_chemical_symbols() - atype = [self.type_dict[k] for k in symbols] - e, f, v = self.dp.eval(coords=coord, cells=cell, atom_types=atype) - self.results["energy"] = e[0][0] - # see https://gitlab.com/ase/ase/-/merge_requests/2485 - self.results["free_energy"] = e[0][0] - self.results["forces"] = f[0] - self.results["virial"] = v[0].reshape(3, 3) - - # convert virial into stress for lattice relaxation - if "stress" in properties: - if sum(atoms.get_pbc()) > 0: - # the usual convention (tensile stress is positive) - # stress = -virial / volume - stress = -0.5 * (v[0].copy() + v[0].copy().T) / atoms.get_volume() - # Voigt notation - self.results["stress"] = stress.flat[[0, 4, 8, 5, 2, 1]] - else: - raise PropertyNotImplementedError +__all__ = [ + "DP", +] diff --git a/deepmd/infer/model_devi.py b/deepmd/infer/model_devi.py index 8c329a0845..a45f96805b 100644 --- a/deepmd/infer/model_devi.py +++ b/deepmd/infer/model_devi.py @@ -1,511 +1,9 @@ # SPDX-License-Identifier: LGPL-3.0-or-later -from typing import ( - Optional, - Tuple, - overload, -) - -import numpy as np - -from deepmd.common import ( - expand_sys_str, -) - -from ..utils.batch_size import ( - AutoBatchSize, -) -from ..utils.data import ( - DeepmdData, -) -from .deep_pot import ( - DeepPot, -) - -try: - from typing import Literal # python >=3.8 -except ImportError: - from typing_extensions import Literal # 
type: ignore - - -@overload -def calc_model_devi_f( - fs: np.ndarray, - real_f: Optional[np.ndarray] = None, - relative: Optional[float] = None, - atomic: Literal[False] = False, -) -> Tuple[np.ndarray, np.ndarray, np.ndarray]: - ... - - -@overload -def calc_model_devi_f( - fs: np.ndarray, - real_f: Optional[np.ndarray] = None, - relative: Optional[float] = None, - *, - atomic: Literal[True], -) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]: - ... - - -def calc_model_devi_f( - fs: np.ndarray, - real_f: Optional[np.ndarray] = None, - relative: Optional[float] = None, - atomic: bool = False, -) -> Tuple[np.ndarray, ...]: - """Calculate model deviation of force. - - Parameters - ---------- - fs : numpy.ndarray - size of `n_models x n_frames x n_atoms x 3` - real_f : numpy.ndarray or None - real force, size of `n_frames x n_atoms x 3`. If given, - the RMS real error is calculated instead. - relative : float, default: None - If given, calculate the relative model deviation of force. The - value is the level parameter for computing the relative model - deviation of the force. - atomic : bool, default: False - Whether return deviation of force in all atoms - - Returns - ------- - max_devi_f : numpy.ndarray - maximum deviation of force in all atoms - min_devi_f : numpy.ndarray - minimum deviation of force in all atoms - avg_devi_f : numpy.ndarray - average deviation of force in all atoms - fs_devi : numpy.ndarray - deviation of force in all atoms, returned if atomic=True - """ - if real_f is None: - fs_devi = np.linalg.norm(np.std(fs, axis=0), axis=-1) - else: - fs_devi = np.linalg.norm( - np.sqrt(np.mean(np.square(fs - real_f), axis=0)), axis=-1 - ) - if relative is not None: - if real_f is None: - # if real force is not given, the magnitude is calculated from mean value of four models - # See DeepPotModelDevi::compute_relative_std_f - # See also Eq. 
71 in DeePMD-kit v2 paepr - magnitude = np.linalg.norm(np.mean(fs, axis=0), axis=-1) - else: - # otherwise, the magnitude is calculated from the real force - magnitude = np.linalg.norm(real_f, axis=-1) - fs_devi /= magnitude + relative - max_devi_f = np.max(fs_devi, axis=-1) - min_devi_f = np.min(fs_devi, axis=-1) - avg_devi_f = np.mean(fs_devi, axis=-1) - if atomic: - return max_devi_f, min_devi_f, avg_devi_f, fs_devi - return max_devi_f, min_devi_f, avg_devi_f - - -def calc_model_devi_e( - es: np.ndarray, real_e: Optional[np.ndarray] = None -) -> np.ndarray: - """Calculate model deviation of total energy per atom. - - Here we don't use the atomic energy, as the decomposition - of energy is arbitrary and not unique. There is no fitting - target for atomic energy. - - Parameters - ---------- - es : numpy.ndarray - size of `n_models x n_frames x 1 - real_e : numpy.ndarray - real energy, size of `n_frames x 1`. If given, - the RMS real error is calculated instead. - - Returns - ------- - max_devi_e : numpy.ndarray - maximum deviation of energy - """ - if real_e is None: - es_devi = np.std(es, axis=0) - else: - es_devi = np.sqrt(np.mean(np.square(es - real_e), axis=0)) - es_devi = np.squeeze(es_devi, axis=-1) - return es_devi - - -def calc_model_devi_v( - vs: np.ndarray, - real_v: Optional[np.ndarray] = None, - relative: Optional[float] = None, -) -> Tuple[np.ndarray, np.ndarray, np.ndarray]: - """Calculate model deviation of virial. - - Parameters - ---------- - vs : numpy.ndarray - size of `n_models x n_frames x 9` - real_v : numpy.ndarray - real virial, size of `n_frames x 9`. If given, - the RMS real error is calculated instead. - relative : float, default: None - If given, calculate the relative model deviation of virial. The - value is the level parameter for computing the relative model - deviation of the virial. 
- - Returns - ------- - max_devi_v : numpy.ndarray - maximum deviation of virial in 9 elements - min_devi_v : numpy.ndarray - minimum deviation of virial in 9 elements - avg_devi_v : numpy.ndarray - average deviation of virial in 9 elements - """ - if real_v is None: - vs_devi = np.std(vs, axis=0) - else: - vs_devi = np.sqrt(np.mean(np.square(vs - real_v), axis=0)) - if relative is not None: - if real_v is None: - # if real virial is not given, the magnitude is calculated from mean value of four models - # See DeepPotModelDevi::compute_relative_std_v - # See also Eq. 72 in DeePMD-kit v2 paepr - magnitude = np.linalg.norm(np.mean(vs, axis=0), axis=-1) - else: - # otherwise, the magnitude is calculated from the real virial - magnitude = np.linalg.norm(real_v, axis=-1) - vs_devi /= magnitude + relative - max_devi_v = np.max(vs_devi, axis=-1) - min_devi_v = np.min(vs_devi, axis=-1) - avg_devi_v = np.linalg.norm(vs_devi, axis=-1) / 3 - return max_devi_v, min_devi_v, avg_devi_v - - -def write_model_devi_out( - devi: np.ndarray, fname: str, header: str = "", atomic: bool = False -): - """Write output of model deviation. 
- - Parameters - ---------- - devi : numpy.ndarray - the first column is the steps index - fname : str - the file name to dump - header : str, default="" - the header to dump - atomic : bool, default: False - whether atomic model deviation is printed - """ - if not atomic: - assert devi.shape[1] == 8 - else: - assert devi.shape[1] > 8 - header = "%s\n%10s" % (header, "step") - for item in "vf": - header += "%19s%19s%19s" % ( - f"max_devi_{item}", - f"min_devi_{item}", - f"avg_devi_{item}", - ) - header += "%19s" % "devi_e" - if atomic: - header += "%19s" % "atm_devi_f(N)" - with open(fname, "ab") as fp: - np.savetxt( - fp, - devi, - fmt=["%12d"] + ["%19.6e" for _ in range(devi.shape[1] - 1)], - delimiter="", - header=header, - ) - return devi - - -def _check_tmaps(tmaps, ref_tmap=None): - """Check whether type maps are identical.""" - assert isinstance(tmaps, list) - if ref_tmap is None: - ref_tmap = tmaps[0] - assert isinstance(ref_tmap, list) - - flag = True - for tmap in tmaps: - if tmap != ref_tmap: - flag = False - break - return flag - - -def calc_model_devi( - coord, - box, - atype, - models, - fname=None, - frequency=1, - mixed_type=False, - fparam: Optional[np.ndarray] = None, - aparam: Optional[np.ndarray] = None, - real_data: Optional[dict] = None, - atomic: bool = False, - relative: Optional[float] = None, - relative_v: Optional[float] = None, -): - """Python interface to calculate model deviation. - - Parameters - ---------- - coord : numpy.ndarray, `n_frames x n_atoms x 3` - Coordinates of system to calculate - box : numpy.ndarray or None, `n_frames x 3 x 3` - Box to specify periodic boundary condition. 
If None, no pbc will be used - atype : numpy.ndarray, `n_atoms x 1` - Atom types - models : list of DeepPot models - Models used to evaluate deviation - fname : str or None - File to dump results, default None - frequency : int - Steps between frames (if the system is given by molecular dynamics engine), default 1 - mixed_type : bool - Whether the input atype is in mixed_type format or not - fparam : numpy.ndarray - frame specific parameters - aparam : numpy.ndarray - atomic specific parameters - real_data : dict, optional - real data to calculate RMS real error - atomic : bool, default: False - If True, calculate the force model deviation of each atom. - relative : float, default: None - If given, calculate the relative model deviation of force. The - value is the level parameter for computing the relative model - deviation of the force. - relative_v : float, default: None - If given, calculate the relative model deviation of virial. The - value is the level parameter for computing the relative model - deviation of the virial. - - Returns - ------- - model_devi : numpy.ndarray, `n_frames x 8` - Model deviation results. The first column is index of steps, the other 7 columns are - max_devi_v, min_devi_v, avg_devi_v, max_devi_f, min_devi_f, avg_devi_f, devi_e. 
- - Examples - -------- - >>> from deepmd.infer import calc_model_devi - >>> from deepmd.infer import DeepPot as DP - >>> import numpy as np - >>> coord = np.array([[1,0,0], [0,0,1.5], [1,0,3]]).reshape([1, -1]) - >>> cell = np.diag(10 * np.ones(3)).reshape([1, -1]) - >>> atype = [1,0,1] - >>> graphs = [DP("graph.000.pb"), DP("graph.001.pb")] - >>> model_devi = calc_model_devi(coord, cell, atype, graphs) - """ - energies = [] - forces = [] - virials = [] - natom = atype.shape[-1] - for dp in models: - ret = dp.eval( - coord, - box, - atype, - fparam=fparam, - aparam=aparam, - mixed_type=mixed_type, - ) - energies.append(ret[0] / natom) - forces.append(ret[1]) - virials.append(ret[2] / natom) - - energies = np.array(energies) - forces = np.array(forces) - virials = np.array(virials) - - devi = [np.arange(coord.shape[0]) * frequency] - if real_data is None: - devi += list(calc_model_devi_v(virials, relative=relative_v)) - devi_f = list(calc_model_devi_f(forces, relative=relative, atomic=atomic)) - devi += devi_f[:3] - devi.append(calc_model_devi_e(energies)) - else: - devi += list( - calc_model_devi_v(virials, real_data["virial"], relative=relative_v) - ) - devi_f = list( - calc_model_devi_f( - forces, real_data["force"], relative=relative, atomic=atomic - ) - ) - devi += devi_f[:3] - devi.append(calc_model_devi_e(energies, real_data["energy"])) - devi = np.vstack(devi).T - if atomic: - devi = np.concatenate([devi, devi_f[3]], axis=1) - if fname: - write_model_devi_out(devi, fname, atomic=atomic) - return devi - - -def make_model_devi( - *, - models: list, - system: str, - set_prefix: str, - output: str, - frequency: int, - real_error: bool = False, - atomic: bool = False, - relative: Optional[float] = None, - relative_v: Optional[float] = None, - **kwargs, -): - """Make model deviation calculation. 
- - Parameters - ---------- - models : list - A list of paths of models to use for making model deviation - system : str - The path of system to make model deviation calculation - set_prefix : str - The set prefix of the system - output : str - The output file for model deviation results - frequency : int - The number of steps that elapse between writing coordinates - in a trajectory by a MD engine (such as Gromacs / Lammps). - This paramter is used to determine the index in the output file. - real_error : bool, default: False - If True, calculate the RMS real error instead of model deviation. - atomic : bool, default: False - If True, calculate the force model deviation of each atom. - relative : float, default: None - If given, calculate the relative model deviation of force. The - value is the level parameter for computing the relative model - deviation of the force. - relative_v : float, default: None - If given, calculate the relative model deviation of virial. The - value is the level parameter for computing the relative model - deviation of the virial. - **kwargs - Arbitrary keyword arguments. 
- """ - auto_batch_size = AutoBatchSize() - # init models - dp_models = [DeepPot(model, auto_batch_size=auto_batch_size) for model in models] - - # check type maps - tmaps = [dp.get_type_map() for dp in dp_models] - if _check_tmaps(tmaps): - tmap = tmaps[0] - else: - raise RuntimeError("The models does not have the same type map.") - - all_sys = expand_sys_str(system) - if len(all_sys) == 0: - raise RuntimeError("Did not find valid system") - devis_coll = [] - - first_dp = dp_models[0] - - for system in all_sys: - # create data-system - dp_data = DeepmdData( - system, set_prefix, shuffle_test=False, type_map=tmap, sort_atoms=False - ) - if first_dp.get_dim_fparam() > 0: - dp_data.add( - "fparam", - first_dp.get_dim_fparam(), - atomic=False, - must=True, - high_prec=False, - ) - if first_dp.get_dim_aparam() > 0: - dp_data.add( - "aparam", - first_dp.get_dim_aparam(), - atomic=True, - must=True, - high_prec=False, - ) - if real_error: - dp_data.add( - "energy", - 1, - atomic=False, - must=False, - high_prec=True, - ) - dp_data.add( - "force", - 3, - atomic=True, - must=False, - high_prec=False, - ) - dp_data.add( - "virial", - 9, - atomic=False, - must=False, - high_prec=False, - ) - - mixed_type = dp_data.mixed_type - - data_sets = [dp_data._load_set(set_name) for set_name in dp_data.dirs] - nframes_tot = 0 - devis = [] - for data in data_sets: - coord = data["coord"] - box = data["box"] - if mixed_type: - atype = data["type"] - else: - atype = data["type"][0] - if not dp_data.pbc: - box = None - if first_dp.get_dim_fparam() > 0: - fparam = data["fparam"] - else: - fparam = None - if first_dp.get_dim_aparam() > 0: - aparam = data["aparam"] - else: - aparam = None - if real_error: - natoms = atype.shape[-1] - real_data = { - "energy": data["energy"] / natoms, - "force": data["force"].reshape([-1, natoms, 3]), - "virial": data["virial"] / natoms, - } - else: - real_data = None - devi = calc_model_devi( - coord, - box, - atype, - dp_models, - mixed_type=mixed_type, - 
fparam=fparam, - aparam=aparam, - real_data=real_data, - atomic=atomic, - relative=relative, - relative_v=relative_v, - ) - nframes_tot += coord.shape[0] - devis.append(devi) - devis = np.vstack(devis) - devis[:, 0] = np.arange(nframes_tot) * frequency - write_model_devi_out(devis, output, header=system, atomic=atomic) - devis_coll.append(devis) - return devis_coll +__all_ = [ + "make_model_devi", + "calc_model_devi", + "write_model_devi_out", + "calc_model_devi_e", + "calc_model_devi_f", + "calc_model_devi_v", +] diff --git a/deepmd_utils/calculator.py b/deepmd_utils/calculator.py new file mode 100644 index 0000000000..5b45aa49b3 --- /dev/null +++ b/deepmd_utils/calculator.py @@ -0,0 +1,144 @@ +# SPDX-License-Identifier: LGPL-3.0-or-later +"""ASE calculator interface module.""" + +from pathlib import ( + Path, +) +from typing import ( + TYPE_CHECKING, + ClassVar, + Dict, + List, + Optional, + Union, +) + +from ase.calculators.calculator import ( + Calculator, + PropertyNotImplementedError, + all_changes, +) + +from deepmd_utils.infer import ( + DeepPot, +) + +if TYPE_CHECKING: + from ase import ( + Atoms, + ) + +__all__ = ["DP"] + + +class DP(Calculator): + """Implementation of ASE deepmd calculator. + + Implemented propertie are `energy`, `forces` and `stress` + + Parameters + ---------- + model : Union[str, Path] + path to the model + label : str, optional + calculator label, by default "DP" + type_dict : Dict[str, int], optional + mapping of element types and their numbers, best left None and the calculator + will infer this information from model, by default None + neighbor_list : ase.neighborlist.NeighborList, optional + The neighbor list object. If None, then build the native neighbor list. 
+ + Examples + -------- + Compute potential energy + + >>> from ase import Atoms + >>> from deepmd.calculator import DP + >>> water = Atoms('H2O', + >>> positions=[(0.7601, 1.9270, 1), + >>> (1.9575, 1, 1), + >>> (1., 1., 1.)], + >>> cell=[100, 100, 100], + >>> calculator=DP(model="frozen_model.pb")) + >>> print(water.get_potential_energy()) + >>> print(water.get_forces()) + + Run BFGS structure optimization + + >>> from ase.optimize import BFGS + >>> dyn = BFGS(water) + >>> dyn.run(fmax=1e-6) + >>> print(water.get_positions()) + """ + + name = "DP" + implemented_properties: ClassVar[List[str]] = [ + "energy", + "free_energy", + "forces", + "virial", + "stress", + ] + + def __init__( + self, + model: Union[str, "Path"], + label: str = "DP", + type_dict: Optional[Dict[str, int]] = None, + neighbor_list=None, + **kwargs, + ) -> None: + Calculator.__init__(self, label=label, **kwargs) + self.dp = DeepPot(str(Path(model).resolve()), neighbor_list=neighbor_list) + if type_dict: + self.type_dict = type_dict + else: + self.type_dict = dict( + zip(self.dp.get_type_map(), range(self.dp.get_ntypes())) + ) + + def calculate( + self, + atoms: Optional["Atoms"] = None, + properties: List[str] = ["energy", "forces", "virial"], + system_changes: List[str] = all_changes, + ): + """Run calculation with deepmd model. 
+ + Parameters + ---------- + atoms : Optional[Atoms], optional + atoms object to run the calculation on, by default None + properties : List[str], optional + unused, only for function signature compatibility, + by default ["energy", "forces", "stress"] + system_changes : List[str], optional + unused, only for function signature compatibility, by default all_changes + """ + if atoms is not None: + self.atoms = atoms.copy() + + coord = self.atoms.get_positions().reshape([1, -1]) + if sum(self.atoms.get_pbc()) > 0: + cell = self.atoms.get_cell().reshape([1, -1]) + else: + cell = None + symbols = self.atoms.get_chemical_symbols() + atype = [self.type_dict[k] for k in symbols] + e, f, v = self.dp.eval(coords=coord, cells=cell, atom_types=atype) + self.results["energy"] = e[0][0] + # see https://gitlab.com/ase/ase/-/merge_requests/2485 + self.results["free_energy"] = e[0][0] + self.results["forces"] = f[0] + self.results["virial"] = v[0].reshape(3, 3) + + # convert virial into stress for lattice relaxation + if "stress" in properties: + if sum(atoms.get_pbc()) > 0: + # the usual convention (tensile stress is positive) + # stress = -virial / volume + stress = -0.5 * (v[0].copy() + v[0].copy().T) / atoms.get_volume() + # Voigt notation + self.results["stress"] = stress.flat[[0, 4, 8, 5, 2, 1]] + else: + raise PropertyNotImplementedError diff --git a/deepmd_utils/infer/__init__.py b/deepmd_utils/infer/__init__.py index 644f5e1f43..b76262882e 100644 --- a/deepmd_utils/infer/__init__.py +++ b/deepmd_utils/infer/__init__.py @@ -2,5 +2,8 @@ from .deep_pot import ( DeepPot, ) +from .model_devi import ( + calc_model_devi, +) -__all__ = ["DeepPot"] +__all__ = ["DeepPot", "calc_model_devi"] diff --git a/deepmd_utils/infer/model_devi.py b/deepmd_utils/infer/model_devi.py new file mode 100644 index 0000000000..1cb6c6fca1 --- /dev/null +++ b/deepmd_utils/infer/model_devi.py @@ -0,0 +1,510 @@ +# SPDX-License-Identifier: LGPL-3.0-or-later +from typing import ( + Optional, + Tuple, + 
overload, +) + +import numpy as np + +from deepmd_utils.common import ( + expand_sys_str, +) +from deepmd_utils.infer.deep_pot import ( + DeepPot, +) +from deepmd_utils.utils.batch_size import ( + AutoBatchSize, +) +from deepmd_utils.utils.data import ( + DeepmdData, +) + +try: + from typing import Literal # python >=3.8 +except ImportError: + from typing_extensions import Literal # type: ignore + + +@overload +def calc_model_devi_f( + fs: np.ndarray, + real_f: Optional[np.ndarray] = None, + relative: Optional[float] = None, + atomic: Literal[False] = False, +) -> Tuple[np.ndarray, np.ndarray, np.ndarray]: + ... + + +@overload +def calc_model_devi_f( + fs: np.ndarray, + real_f: Optional[np.ndarray] = None, + relative: Optional[float] = None, + *, + atomic: Literal[True], +) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]: + ... + + +def calc_model_devi_f( + fs: np.ndarray, + real_f: Optional[np.ndarray] = None, + relative: Optional[float] = None, + atomic: bool = False, +) -> Tuple[np.ndarray, ...]: + """Calculate model deviation of force. + + Parameters + ---------- + fs : numpy.ndarray + size of `n_models x n_frames x n_atoms x 3` + real_f : numpy.ndarray or None + real force, size of `n_frames x n_atoms x 3`. If given, + the RMS real error is calculated instead. + relative : float, default: None + If given, calculate the relative model deviation of force. The + value is the level parameter for computing the relative model + deviation of the force. 
+ atomic : bool, default: False + Whether return deviation of force in all atoms + + Returns + ------- + max_devi_f : numpy.ndarray + maximum deviation of force in all atoms + min_devi_f : numpy.ndarray + minimum deviation of force in all atoms + avg_devi_f : numpy.ndarray + average deviation of force in all atoms + fs_devi : numpy.ndarray + deviation of force in all atoms, returned if atomic=True + """ + if real_f is None: + fs_devi = np.linalg.norm(np.std(fs, axis=0), axis=-1) + else: + fs_devi = np.linalg.norm( + np.sqrt(np.mean(np.square(fs - real_f), axis=0)), axis=-1 + ) + if relative is not None: + if real_f is None: + # if real force is not given, the magnitude is calculated from mean value of four models + # See DeepPotModelDevi::compute_relative_std_f + # See also Eq. 71 in DeePMD-kit v2 paepr + magnitude = np.linalg.norm(np.mean(fs, axis=0), axis=-1) + else: + # otherwise, the magnitude is calculated from the real force + magnitude = np.linalg.norm(real_f, axis=-1) + fs_devi /= magnitude + relative + max_devi_f = np.max(fs_devi, axis=-1) + min_devi_f = np.min(fs_devi, axis=-1) + avg_devi_f = np.mean(fs_devi, axis=-1) + if atomic: + return max_devi_f, min_devi_f, avg_devi_f, fs_devi + return max_devi_f, min_devi_f, avg_devi_f + + +def calc_model_devi_e( + es: np.ndarray, real_e: Optional[np.ndarray] = None +) -> np.ndarray: + """Calculate model deviation of total energy per atom. + + Here we don't use the atomic energy, as the decomposition + of energy is arbitrary and not unique. There is no fitting + target for atomic energy. + + Parameters + ---------- + es : numpy.ndarray + size of `n_models x n_frames x 1 + real_e : numpy.ndarray + real energy, size of `n_frames x 1`. If given, + the RMS real error is calculated instead. 
+ + Returns + ------- + max_devi_e : numpy.ndarray + maximum deviation of energy + """ + if real_e is None: + es_devi = np.std(es, axis=0) + else: + es_devi = np.sqrt(np.mean(np.square(es - real_e), axis=0)) + es_devi = np.squeeze(es_devi, axis=-1) + return es_devi + + +def calc_model_devi_v( + vs: np.ndarray, + real_v: Optional[np.ndarray] = None, + relative: Optional[float] = None, +) -> Tuple[np.ndarray, np.ndarray, np.ndarray]: + """Calculate model deviation of virial. + + Parameters + ---------- + vs : numpy.ndarray + size of `n_models x n_frames x 9` + real_v : numpy.ndarray + real virial, size of `n_frames x 9`. If given, + the RMS real error is calculated instead. + relative : float, default: None + If given, calculate the relative model deviation of virial. The + value is the level parameter for computing the relative model + deviation of the virial. + + Returns + ------- + max_devi_v : numpy.ndarray + maximum deviation of virial in 9 elements + min_devi_v : numpy.ndarray + minimum deviation of virial in 9 elements + avg_devi_v : numpy.ndarray + average deviation of virial in 9 elements + """ + if real_v is None: + vs_devi = np.std(vs, axis=0) + else: + vs_devi = np.sqrt(np.mean(np.square(vs - real_v), axis=0)) + if relative is not None: + if real_v is None: + # if real virial is not given, the magnitude is calculated from mean value of four models + # See DeepPotModelDevi::compute_relative_std_v + # See also Eq. 
72 in DeePMD-kit v2 paepr + magnitude = np.linalg.norm(np.mean(vs, axis=0), axis=-1) + else: + # otherwise, the magnitude is calculated from the real virial + magnitude = np.linalg.norm(real_v, axis=-1) + vs_devi /= magnitude + relative + max_devi_v = np.max(vs_devi, axis=-1) + min_devi_v = np.min(vs_devi, axis=-1) + avg_devi_v = np.linalg.norm(vs_devi, axis=-1) / 3 + return max_devi_v, min_devi_v, avg_devi_v + + +def write_model_devi_out( + devi: np.ndarray, fname: str, header: str = "", atomic: bool = False +): + """Write output of model deviation. + + Parameters + ---------- + devi : numpy.ndarray + the first column is the steps index + fname : str + the file name to dump + header : str, default="" + the header to dump + atomic : bool, default: False + whether atomic model deviation is printed + """ + if not atomic: + assert devi.shape[1] == 8 + else: + assert devi.shape[1] > 8 + header = "%s\n%10s" % (header, "step") + for item in "vf": + header += "%19s%19s%19s" % ( + f"max_devi_{item}", + f"min_devi_{item}", + f"avg_devi_{item}", + ) + header += "%19s" % "devi_e" + if atomic: + header += "%19s" % "atm_devi_f(N)" + with open(fname, "ab") as fp: + np.savetxt( + fp, + devi, + fmt=["%12d"] + ["%19.6e" for _ in range(devi.shape[1] - 1)], + delimiter="", + header=header, + ) + return devi + + +def _check_tmaps(tmaps, ref_tmap=None): + """Check whether type maps are identical.""" + assert isinstance(tmaps, list) + if ref_tmap is None: + ref_tmap = tmaps[0] + assert isinstance(ref_tmap, list) + + flag = True + for tmap in tmaps: + if tmap != ref_tmap: + flag = False + break + return flag + + +def calc_model_devi( + coord, + box, + atype, + models, + fname=None, + frequency=1, + mixed_type=False, + fparam: Optional[np.ndarray] = None, + aparam: Optional[np.ndarray] = None, + real_data: Optional[dict] = None, + atomic: bool = False, + relative: Optional[float] = None, + relative_v: Optional[float] = None, +): + """Python interface to calculate model deviation. 
+ + Parameters + ---------- + coord : numpy.ndarray, `n_frames x n_atoms x 3` + Coordinates of system to calculate + box : numpy.ndarray or None, `n_frames x 3 x 3` + Box to specify periodic boundary condition. If None, no pbc will be used + atype : numpy.ndarray, `n_atoms x 1` + Atom types + models : list of DeepPot models + Models used to evaluate deviation + fname : str or None + File to dump results, default None + frequency : int + Steps between frames (if the system is given by molecular dynamics engine), default 1 + mixed_type : bool + Whether the input atype is in mixed_type format or not + fparam : numpy.ndarray + frame specific parameters + aparam : numpy.ndarray + atomic specific parameters + real_data : dict, optional + real data to calculate RMS real error + atomic : bool, default: False + If True, calculate the force model deviation of each atom. + relative : float, default: None + If given, calculate the relative model deviation of force. The + value is the level parameter for computing the relative model + deviation of the force. + relative_v : float, default: None + If given, calculate the relative model deviation of virial. The + value is the level parameter for computing the relative model + deviation of the virial. + + Returns + ------- + model_devi : numpy.ndarray, `n_frames x 8` + Model deviation results. The first column is index of steps, the other 7 columns are + max_devi_v, min_devi_v, avg_devi_v, max_devi_f, min_devi_f, avg_devi_f, devi_e. 
+ + Examples + -------- + >>> from deepmd.infer import calc_model_devi + >>> from deepmd.infer import DeepPot as DP + >>> import numpy as np + >>> coord = np.array([[1,0,0], [0,0,1.5], [1,0,3]]).reshape([1, -1]) + >>> cell = np.diag(10 * np.ones(3)).reshape([1, -1]) + >>> atype = [1,0,1] + >>> graphs = [DP("graph.000.pb"), DP("graph.001.pb")] + >>> model_devi = calc_model_devi(coord, cell, atype, graphs) + """ + energies = [] + forces = [] + virials = [] + natom = atype.shape[-1] + for dp in models: + ret = dp.eval( + coord, + box, + atype, + fparam=fparam, + aparam=aparam, + mixed_type=mixed_type, + ) + energies.append(ret[0] / natom) + forces.append(ret[1]) + virials.append(ret[2] / natom) + + energies = np.array(energies) + forces = np.array(forces) + virials = np.array(virials) + + devi = [np.arange(coord.shape[0]) * frequency] + if real_data is None: + devi += list(calc_model_devi_v(virials, relative=relative_v)) + devi_f = list(calc_model_devi_f(forces, relative=relative, atomic=atomic)) + devi += devi_f[:3] + devi.append(calc_model_devi_e(energies)) + else: + devi += list( + calc_model_devi_v(virials, real_data["virial"], relative=relative_v) + ) + devi_f = list( + calc_model_devi_f( + forces, real_data["force"], relative=relative, atomic=atomic + ) + ) + devi += devi_f[:3] + devi.append(calc_model_devi_e(energies, real_data["energy"])) + devi = np.vstack(devi).T + if atomic: + devi = np.concatenate([devi, devi_f[3]], axis=1) + if fname: + write_model_devi_out(devi, fname, atomic=atomic) + return devi + + +def make_model_devi( + *, + models: list, + system: str, + set_prefix: str, + output: str, + frequency: int, + real_error: bool = False, + atomic: bool = False, + relative: Optional[float] = None, + relative_v: Optional[float] = None, + **kwargs, +): + """Make model deviation calculation. 
+ + Parameters + ---------- + models : list + A list of paths of models to use for making model deviation + system : str + The path of system to make model deviation calculation + set_prefix : str + The set prefix of the system + output : str + The output file for model deviation results + frequency : int + The number of steps that elapse between writing coordinates + in a trajectory by an MD engine (such as Gromacs / Lammps). + This parameter is used to determine the index in the output file. + real_error : bool, default: False + If True, calculate the RMS real error instead of model deviation. + atomic : bool, default: False + If True, calculate the force model deviation of each atom. + relative : float, default: None + If given, calculate the relative model deviation of force. The + value is the level parameter for computing the relative model + deviation of the force. + relative_v : float, default: None + If given, calculate the relative model deviation of virial. The + value is the level parameter for computing the relative model + deviation of the virial. + **kwargs + Arbitrary keyword arguments. 
+ """ + auto_batch_size = AutoBatchSize() + # init models + dp_models = [DeepPot(model, auto_batch_size=auto_batch_size) for model in models] + + # check type maps + tmaps = [dp.get_type_map() for dp in dp_models] + if _check_tmaps(tmaps): + tmap = tmaps[0] + else: + raise RuntimeError("The models does not have the same type map.") + + all_sys = expand_sys_str(system) + if len(all_sys) == 0: + raise RuntimeError("Did not find valid system") + devis_coll = [] + + first_dp = dp_models[0] + + for system in all_sys: + # create data-system + dp_data = DeepmdData( + system, set_prefix, shuffle_test=False, type_map=tmap, sort_atoms=False + ) + if first_dp.get_dim_fparam() > 0: + dp_data.add( + "fparam", + first_dp.get_dim_fparam(), + atomic=False, + must=True, + high_prec=False, + ) + if first_dp.get_dim_aparam() > 0: + dp_data.add( + "aparam", + first_dp.get_dim_aparam(), + atomic=True, + must=True, + high_prec=False, + ) + if real_error: + dp_data.add( + "energy", + 1, + atomic=False, + must=False, + high_prec=True, + ) + dp_data.add( + "force", + 3, + atomic=True, + must=False, + high_prec=False, + ) + dp_data.add( + "virial", + 9, + atomic=False, + must=False, + high_prec=False, + ) + + mixed_type = dp_data.mixed_type + + data_sets = [dp_data._load_set(set_name) for set_name in dp_data.dirs] + nframes_tot = 0 + devis = [] + for data in data_sets: + coord = data["coord"] + box = data["box"] + if mixed_type: + atype = data["type"] + else: + atype = data["type"][0] + if not dp_data.pbc: + box = None + if first_dp.get_dim_fparam() > 0: + fparam = data["fparam"] + else: + fparam = None + if first_dp.get_dim_aparam() > 0: + aparam = data["aparam"] + else: + aparam = None + if real_error: + natoms = atype.shape[-1] + real_data = { + "energy": data["energy"] / natoms, + "force": data["force"].reshape([-1, natoms, 3]), + "virial": data["virial"] / natoms, + } + else: + real_data = None + devi = calc_model_devi( + coord, + box, + atype, + dp_models, + mixed_type=mixed_type, + 
fparam=fparam, + aparam=aparam, + real_data=real_data, + atomic=atomic, + relative=relative, + relative_v=relative_v, + ) + nframes_tot += coord.shape[0] + devis.append(devi) + devis = np.vstack(devis) + devis[:, 0] = np.arange(nframes_tot) * frequency + write_model_devi_out(devis, output, header=system, atomic=atomic) + devis_coll.append(devis) + return devis_coll diff --git a/doc/inference/python.md b/doc/inference/python.md index b5d3ca1efc..b01f371356 100644 --- a/doc/inference/python.md +++ b/doc/inference/python.md @@ -2,7 +2,7 @@ One may use the python interface of DeePMD-kit for model inference, an example is given as follows ```python -from deepmd.infer import DeepPot +from deepmd_utils.infer import DeepPot import numpy as np dp = DeepPot("graph.pb") @@ -15,8 +15,8 @@ where `e`, `f` and `v` are predicted energy, force and virial of the system, res Furthermore, one can use the python interface to calculate model deviation. ```python -from deepmd.infer import calc_model_devi -from deepmd.infer import DeepPot as DP +from deepmd_utils.infer import calc_model_devi +from deepmd_utils.infer import DeepPot as DP import numpy as np coord = np.array([[1, 0, 0], [0, 0, 1.5], [1, 0, 3]]).reshape([1, -1]) @@ -32,7 +32,7 @@ Note that if the model inference or model deviation is performed cyclically, one The native neighbor list algorithm of the DeePMD-kit is in $O(N^2)$ complexity ($N$ is the number of atoms). While this is not a problem for small systems that quantum methods can afford, the large systems for molecular dynamics have slow performance. -In this case, one may pass an external neighbor list that has lower complexity to {class}`DeepPot `, once it is compatible with {class}`ase.neighborlist.NewPrimitiveNeighborList`. +In this case, one may pass an external neighbor list that has lower complexity to {class}`DeepPot `, once it is compatible with {class}`ase.neighborlist.NewPrimitiveNeighborList`. 
```py import ase.neighborlist @@ -43,4 +43,4 @@ neighbor_list = ase.neighborlist.NewPrimitiveNeighborList( dp = DeepPot("graph.pb", neighbor_list=neighbor_list) ``` -The `update` and `build` methods will be called by {class}`DeepPot <deepmd.infer.DeepPot>`, and `first_neigh`, `pair_second`, and `offset_vec` properties will be used. +The `update` and `build` methods will be called by {class}`DeepPot <deepmd_utils.infer.DeepPot>`, and `first_neigh`, `pair_second`, and `offset_vec` properties will be used. diff --git a/doc/third-party/ase.md b/doc/third-party/ase.md index ac65fc926e..d9ab67ae3d 100644 --- a/doc/third-party/ase.md +++ b/doc/third-party/ase.md @@ -3,7 +3,7 @@ Deep potential can be set up as a calculator with ASE to obtain potential energies and forces. ```python from ase import Atoms -from deepmd.calculator import DP +from deepmd_utils.calculator import DP water = Atoms( "H2O", From c2c9e72b740d62d11639b231b52ad4847ff7ecc6 Mon Sep 17 00:00:00 2001 From: Jinzhe Zeng Date: Tue, 23 Jan 2024 23:03:50 -0500 Subject: [PATCH 2/3] fix deepmd.infer.model_devi Signed-off-by: Jinzhe Zeng --- deepmd/infer/model_devi.py | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/deepmd/infer/model_devi.py b/deepmd/infer/model_devi.py index a45f96805b..802e0ae401 100644 --- a/deepmd/infer/model_devi.py +++ b/deepmd/infer/model_devi.py @@ -1,5 +1,14 @@ # SPDX-License-Identifier: LGPL-3.0-or-later -__all_ = [ +from deepmd_utils.infer.model_devi import ( + calc_model_devi, + calc_model_devi_e, + calc_model_devi_f, + calc_model_devi_v, + make_model_devi, + write_model_devi_out, +) + +__all__ = [ "make_model_devi", "calc_model_devi", "write_model_devi_out", From 60e44b4771fe38a08d946d397ebde0d4a7629cb4 Mon Sep 17 00:00:00 2001 From: Jinzhe Zeng Date: Tue, 23 Jan 2024 23:32:44 -0500 Subject: [PATCH 3/3] set auto_batch_size to True Signed-off-by: Jinzhe Zeng --- deepmd_utils/infer/model_devi.py | 6 +----- 1 file changed, 1 insertion(+), 5 deletions(-) diff --git a/deepmd_utils/infer/model_devi.py 
b/deepmd_utils/infer/model_devi.py index 1cb6c6fca1..b0693f5823 100644 --- a/deepmd_utils/infer/model_devi.py +++ b/deepmd_utils/infer/model_devi.py @@ -13,9 +13,6 @@ from deepmd_utils.infer.deep_pot import ( DeepPot, ) -from deepmd_utils.utils.batch_size import ( - AutoBatchSize, -) from deepmd_utils.utils.data import ( DeepmdData, ) @@ -395,9 +392,8 @@ def make_model_devi( **kwargs Arbitrary keyword arguments. """ - auto_batch_size = AutoBatchSize() # init models - dp_models = [DeepPot(model, auto_batch_size=auto_batch_size) for model in models] + dp_models = [DeepPot(model, auto_batch_size=True) for model in models] # check type maps tmaps = [dp.get_type_map() for dp in dp_models]