Source code for deepmd.dpmodel.descriptor.se_t

# SPDX-License-Identifier: LGPL-3.0-or-later
import itertools
from collections.abc import (
    Callable,
)
from typing import (
    Any,
    NoReturn,
)

import array_api_compat
import numpy as np

from deepmd.dpmodel import (
    DEFAULT_PRECISION,
    PRECISION_DICT,
    NativeOP,
)
from deepmd.dpmodel.array_api import (
    Array,
)
from deepmd.dpmodel.common import (
    cast_precision,
    get_xp_precision,
    to_numpy_array,
)
from deepmd.dpmodel.utils import (
    EmbeddingNet,
    EnvMat,
    NetworkCollection,
    PairExcludeMask,
)
from deepmd.dpmodel.utils.env_mat_stat import (
    EnvMatStatSe,
)
from deepmd.dpmodel.utils.seed import (
    child_seed,
)
from deepmd.dpmodel.utils.update_sel import (
    UpdateSel,
)
from deepmd.utils.data_system import (
    DeepmdDataSystem,
)
from deepmd.utils.path import (
    DPPath,
)
from deepmd.utils.version import (
    check_version_compatibility,
)

from .base_descriptor import (
    BaseDescriptor,
)


@BaseDescriptor.register("se_e3")
@BaseDescriptor.register("se_at")
@BaseDescriptor.register("se_a_3be")

[docs]
class DescrptSeT(NativeOP, BaseDescriptor):
    r"""DeepPot-SE constructed from all information (both angular and radial) of atomic
    configurations.

    The embedding takes angles between two neighboring atoms as input.

    The descriptor :math:`\mathcal{D}^i \in \mathbb{R}^{M}` is given by

    .. math::
        \mathcal{D}^i = \sum_{t_j, t_k} \frac{1}{N_{t_j} N_{t_k}} \sum_{j \in t_j, k \in t_k} \tilde{g}_{jk} \, \mathcal{N}_{t_j, t_k}(\tilde{g}_{jk}),

    where :math:`\tilde{g}_{jk} = \boldsymbol{rr}_j \cdot \boldsymbol{rr}_k` is the dot product
    of the smoothed directional vectors from the environment matrix, :math:`N_{t_j}` and
    :math:`N_{t_k}` are the numbers of neighbors of types :math:`t_j` and :math:`t_k`,
    and :math:`\mathcal{N}_{t_j, t_k}` is the embedding network that depends only on the
    types of neighbor atoms :math:`j` and :math:`k`.

    The smoothed directional vector :math:`\boldsymbol{rr}_j` is computed as:

    .. math::
        \boldsymbol{rr}_j = s(r_{ji}) \frac{\boldsymbol{R}_j - \boldsymbol{R}_i}{r_{ji}},

    where :math:`s(r)` is the switching function.

    Parameters
    ----------
    rcut : float
            The cut-off radius
    rcut_smth : float
            From where the environment matrix should be smoothed
    sel : list[int]
            sel[i] specifies the maxmum number of type i atoms in the cut-off radius
    neuron : list[int]
            Number of neurons in each hidden layers of the embedding net
    resnet_dt : bool
            Time-step `dt` in the resnet construction:
            y = x + dt * \phi (Wx + b)
    set_davg_zero : bool
            Set the shift of embedding net input to zero.
    activation_function : str
            The activation function in the embedding net. Supported options are |ACTIVATION_FN|
    env_protection : float
            Protection parameter to prevent division by zero errors during environment matrix calculations.
    exclude_types : list[list[int]]
            The excluded pairs of types which have no interaction with each other.
            For example, `[[0, 1]]` means no interaction between type 0 and type 1.
    precision : str
            The precision of the embedding net parameters. Supported options are |PRECISION|
    trainable : bool
            If the weights of embedding net are trainable.
    seed : int, Optional
            Random seed for initializing the network parameters.
    type_map: list[str], Optional
            A list of strings. Give the name to each type of atoms.
    ntypes : int
            Number of element types.
            Not used in this descriptor, only to be compat with input.
    """


[docs]
    _update_sel_cls = UpdateSel


    def __init__(
        self,
        rcut: float,
        rcut_smth: float,
        sel: list[int],
        neuron: list[int] = [24, 48, 96],
        resnet_dt: bool = False,
        set_davg_zero: bool = False,
        activation_function: str = "tanh",
        env_protection: float = 0.0,
        exclude_types: list[tuple[int, int]] = [],
        precision: str = DEFAULT_PRECISION,
        trainable: bool = True,
        seed: int | list[int] | None = None,
        type_map: list[str] | None = None,
        ntypes: int | None = None,  # to be compat with input
    ) -> None:
        del ntypes

[docs]
        self.rcut = rcut


[docs]
        self.rcut_smth = rcut_smth


[docs]
        self.sel = sel


[docs]
        self.neuron = neuron


[docs]
        self.filter_neuron = self.neuron


[docs]
        self.set_davg_zero = set_davg_zero


[docs]
        self.activation_function = activation_function


[docs]
        self.precision = precision


[docs]
        self.prec = PRECISION_DICT[self.precision]


[docs]
        self.resnet_dt = resnet_dt


[docs]
        self.env_protection = env_protection


[docs]
        self.ntypes = len(sel)


[docs]
        self.seed = seed


[docs]
        self.type_map = type_map

        # order matters, placed after the assignment of self.ntypes
        self.reinit_exclude(exclude_types)

[docs]
        self.trainable = trainable


[docs]
        self.sel_cumsum = [0, *np.cumsum(self.sel).tolist()]


[docs]
        self.compress = False


        in_dim = 1  # not considiering type embedding
        embeddings = NetworkCollection(
            ntypes=self.ntypes,
            ndim=2,
            network_type="embedding_network",
        )
        for ii, embedding_idx in enumerate(
            itertools.product(range(self.ntypes), repeat=embeddings.ndim)
        ):
            embeddings[embedding_idx] = EmbeddingNet(
                in_dim,
                self.neuron,
                self.activation_function,
                self.resnet_dt,
                self.precision,
                seed=child_seed(self.seed, ii),
                trainable=trainable,
            )

[docs]
        self.embeddings = embeddings


[docs]
        self.env_mat = EnvMat(self.rcut, self.rcut_smth, protection=self.env_protection)


[docs]
        self.nnei = sum(self.sel)


[docs]
        self.davg = np.zeros(
            [self.ntypes, self.nnei, 4], dtype=PRECISION_DICT[self.precision]
        )


[docs]
        self.dstd = np.ones(
            [self.ntypes, self.nnei, 4], dtype=PRECISION_DICT[self.precision]
        )


[docs]
        self.orig_sel = self.sel


[docs]
        self.ndescrpt = self.nnei * 4



[docs]
    def __setitem__(self, key: str, value: Array) -> None:
        if key in ("avg", "data_avg", "davg"):
            self.davg = value
        elif key in ("std", "data_std", "dstd"):
            self.dstd = value
        else:
            raise KeyError(key)



[docs]
    def __getitem__(self, key: str) -> Array:
        if key in ("avg", "data_avg", "davg"):
            return self.davg
        elif key in ("std", "data_std", "dstd"):
            return self.dstd
        else:
            raise KeyError(key)


    @property

[docs]
    def dim_out(self) -> int:
        """Returns the output dimension of this descriptor."""
        return self.get_dim_out()



[docs]
    def change_type_map(
        self, type_map: list[str], model_with_new_type_stat: Any = None
    ) -> None:
        """Change the type related params to new ones, according to `type_map` and the original one in the model.
        If there are new types in `type_map`, statistics will be updated accordingly to `model_with_new_type_stat` for these new types.
        """
        raise NotImplementedError(
            "Descriptor se_e3 does not support changing for type related params!"
            "This feature is currently not implemented because it would require additional work to support the non-mixed-types case. "
            "We may consider adding this support in the future if there is a clear demand for it."
        )



[docs]
    def get_dim_out(self) -> int:
        """Returns the output dimension of this descriptor."""
        return self.neuron[-1]



[docs]
    def get_dim_emb(self) -> int:
        """Returns the embedding (g2) dimension of this descriptor."""
        return self.neuron[-1]



[docs]
    def get_rcut(self) -> float:
        """Returns cutoff radius."""
        return self.rcut



[docs]
    def get_rcut_smth(self) -> float:
        """Returns the radius where the neighbor information starts to smoothly decay to 0."""
        return self.rcut_smth



[docs]
    def get_sel(self) -> list:
        """Returns cutoff radius."""
        return self.sel



[docs]
    def mixed_types(self) -> bool:
        """Returns if the descriptor requires a neighbor list that distinguish different
        atomic types or not.
        """
        return False



[docs]
    def has_message_passing(self) -> bool:
        """Returns whether the descriptor has message passing."""
        return False



[docs]
    def has_message_passing_across_ranks(self) -> bool:
        """Returns whether per-layer node embeddings need MPI ghost exchange."""
        return False



[docs]
    def need_sorted_nlist_for_lower(self) -> bool:
        """Returns whether the descriptor needs sorted nlist when using `forward_lower`."""
        return False



[docs]
    def get_env_protection(self) -> float:
        """Returns the protection of building environment matrix."""
        return self.env_protection



[docs]
    def share_params(
        self, base_class: Any, shared_level: int, resume: bool = False
    ) -> NoReturn:
        """
        Share the parameters of self to the base_class with shared_level during multitask training.
        If not start from checkpoint (resume is False),
        some separated parameters (e.g. mean and stddev) will be re-calculated across different classes.
        """
        raise NotImplementedError



[docs]
    def get_ntypes(self) -> int:
        """Returns the number of element types."""
        return self.ntypes



[docs]
    def get_type_map(self) -> list[str]:
        """Get the name to each type of atoms."""
        return self.type_map



[docs]
    def compute_input_stats(
        self,
        merged: Callable[[], list[dict]] | list[dict],
        path: DPPath | None = None,
    ) -> None:
        """
        Compute the input statistics (e.g. mean and stddev) for the descriptors from packed data.

        Parameters
        ----------
        merged : Union[Callable[[], list[dict]], list[dict]]
            - list[dict]: A list of data samples from various data systems.
                Each element, `merged[i]`, is a data dictionary containing `keys`: `paddle.Tensor`
                originating from the `i`-th data system.
            - Callable[[], list[dict]]: A lazy function that returns data samples in the above format
                only when needed. Since the sampling process can be slow and memory-intensive,
                the lazy function helps by only sampling once.
        path : Optional[DPPath]
            The path to the stat file.

        """
        env_mat_stat = EnvMatStatSe(self)
        if path is not None:
            path = path / env_mat_stat.get_hash()
        if path is None or not path.is_dir():
            if callable(merged):
                # only get data for once
                sampled = merged()
            else:
                sampled = merged
        else:
            sampled = []
        env_mat_stat.load_or_compute_stats(sampled, path)
        self.stats = env_mat_stat.stats
        mean, stddev = env_mat_stat()
        xp = array_api_compat.array_namespace(self.dstd)
        device = array_api_compat.device(self.dstd)
        if not self.set_davg_zero:
            self.davg = xp.asarray(
                mean, dtype=self.davg.dtype, copy=True, device=device
            )
        self.dstd = xp.asarray(stddev, dtype=self.dstd.dtype, copy=True, device=device)



[docs]
    def set_stat_mean_and_stddev(
        self,
        mean: Array,
        stddev: Array,
    ) -> None:
        """Update mean and stddev for descriptor."""
        self.davg = mean
        self.dstd = stddev



[docs]
    def get_stat_mean_and_stddev(self) -> tuple[Array, Array]:
        """Get mean and stddev for descriptor."""
        return self.davg, self.dstd



[docs]
    def reinit_exclude(
        self,
        exclude_types: list[tuple[int, int]] = [],
    ) -> None:
        self.exclude_types = exclude_types
        self.emask = PairExcludeMask(self.ntypes, exclude_types=exclude_types)


    @cast_precision

[docs]
    def call(
        self,
        coord_ext: Array,
        atype_ext: Array,
        nlist: Array,
        mapping: Array | None = None,
        fparam: Array | None = None,
        comm_dict: dict | None = None,
        charge_spin: Array | None = None,
    ) -> tuple[Array, Array]:
        """Compute the descriptor.

        Parameters
        ----------
        coord_ext
            The extended coordinates of atoms. shape: nf x (nallx3)
        atype_ext
            The extended aotm types. shape: nf x nall
        nlist
            The neighbor list. shape: nf x nloc x nnei
        mapping
            The index mapping from extended to local region. not used by this descriptor.

        Returns
        -------
        descriptor
            The descriptor. shape: nf x nloc x ng
        gr
            The rotationally equivariant and permutationally invariant single particle
            representation.
            This descriptor returns None.
        g2
            The rotationally invariant pair-partical representation.
            This descriptor returns None.
        h2
            The rotationally equivariant pair-partical representation.
            This descriptor returns None.
        sw
            The smooth switch function.
        """
        del mapping
        xp = array_api_compat.array_namespace(coord_ext, atype_ext, nlist)
        # nf x nloc x nnei x 4
        rr, diff, ww = self.env_mat.call(
            coord_ext,
            atype_ext,
            nlist,
            self.davg[...],
            self.dstd[...],
        )
        nf, nloc, nnei, _ = rr.shape
        sec = self.sel_cumsum

        ng = self.neuron[-1]
        result = xp.zeros(
            [nf * nloc, ng],
            dtype=get_xp_precision(xp, self.precision),
            device=array_api_compat.device(coord_ext),
        )
        exclude_mask = self.emask.build_type_exclude_mask(nlist, atype_ext)
        # merge nf and nloc axis, so for type_one_side == False,
        # we don't require atype is the same in all frames
        exclude_mask = xp.reshape(exclude_mask, (nf * nloc, nnei))
        rr = xp.reshape(rr, (nf * nloc, nnei, 4))

        for embedding_idx in itertools.product(
            range(self.ntypes), repeat=self.embeddings.ndim
        ):
            ti, tj = embedding_idx
            nei_type_i = self.sel[ti]
            nei_type_j = self.sel[tj]
            if ti <= tj:
                # avoid repeat calculation
                # nfnl x nt_i x 3
                rr_i = rr[:, sec[ti] : sec[ti + 1], 1:]
                mm_i = exclude_mask[:, sec[ti] : sec[ti + 1]]
                rr_i = rr_i * xp.astype(mm_i[:, :, None], rr_i.dtype)
                # nfnl x nt_j x 3
                rr_j = rr[:, sec[tj] : sec[tj + 1], 1:]
                mm_j = exclude_mask[:, sec[tj] : sec[tj + 1]]
                rr_j = rr_j * xp.astype(mm_j[:, :, None], rr_j.dtype)
                # nfnl x nt_i x nt_j
                # env_ij = np.einsum("ijm,ikm->ijk", rr_i, rr_j)
                env_ij = xp.sum(rr_i[:, :, None, :] * rr_j[:, None, :, :], axis=-1)
                # nfnl x nt_i x nt_j x 1
                env_ij_reshape = env_ij[:, :, :, None]
                # nfnl x nt_i x nt_j x ng
                gg = self.embeddings[embedding_idx].call(env_ij_reshape)
                # nfnl x nt_i x nt_j x ng
                # res_ij = np.einsum("ijk,ijkm->im", env_ij, gg)
                res_ij = xp.sum(env_ij[:, :, :, None] * gg, axis=(1, 2))
                res_ij = res_ij * (1.0 / float(nei_type_i) / float(nei_type_j))
                result += res_ij
        # nf x nloc x ng
        result = xp.reshape(result, (nf, nloc, ng))
        return result, None, None, None, ww



[docs]
    def serialize(self) -> dict:
        """Serialize the descriptor to dict."""
        for embedding_idx in itertools.product(range(self.ntypes), repeat=2):
            # not actually used; to match serilization data from TF to pass the test
            ti, tj = embedding_idx
            if (self.exclude_types and embedding_idx in self.emask) or tj < ti:
                self.embeddings[embedding_idx].clear()

        data = {
            "@class": "Descriptor",
            "type": "se_e3",
            "@version": 3 if self.compress else 2,
            "rcut": self.rcut,
            "rcut_smth": self.rcut_smth,
            "sel": self.sel,
            "neuron": self.neuron,
            "resnet_dt": self.resnet_dt,
            "set_davg_zero": self.set_davg_zero,
            "activation_function": self.activation_function,
            "precision": np.dtype(PRECISION_DICT[self.precision]).name,
            "embeddings": self.embeddings.serialize(),
            "env_mat": self.env_mat.serialize(),
            "exclude_types": self.exclude_types,
            "env_protection": self.env_protection,
            "@variables": {
                "davg": to_numpy_array(self.davg),
                "dstd": to_numpy_array(self.dstd),
            },
            "type_map": self.type_map,
            "trainable": self.trainable,
        }
        if self.compress:
            data["compress"] = {
                "@variables": {
                    "compress_data": [to_numpy_array(d) for d in self.compress_data],
                    "compress_info": [to_numpy_array(i) for i in self.compress_info],
                },
            }
        return data


    @classmethod

[docs]
    def deserialize(cls, data: dict) -> "DescrptSeT":
        """Deserialize from dict."""
        data = data.copy()
        check_version_compatibility(data.pop("@version", 1), 3, 1)
        data.pop("@class", None)
        data.pop("type", None)
        variables = data.pop("@variables")
        embeddings = data.pop("embeddings")
        env_mat = data.pop("env_mat")
        compress = data.pop("compress", None)
        obj = cls(**data)

        obj["davg"] = variables["davg"]
        obj["dstd"] = variables["dstd"]
        obj.embeddings = NetworkCollection.deserialize(embeddings)
        if compress is not None:
            obj._load_compress_data(compress)
        return obj



[docs]
    def _load_compress_data(self, compress: dict) -> None:
        """Load compression state from serialized data."""
        variables = compress["@variables"]
        self.compress_data = variables["compress_data"]
        self.compress_info = variables["compress_info"]
        self.compress = True


    @classmethod

[docs]
    def update_sel(
        cls,
        train_data: DeepmdDataSystem,
        type_map: list[str] | None,
        local_jdata: dict,
    ) -> tuple[Array, Array]:
        """Update the selection and perform neighbor statistics.

        Parameters
        ----------
        train_data : DeepmdDataSystem
            data used to do neighbor statistics
        type_map : list[str], optional
            The name of each type of atoms
        local_jdata : dict
            The local data refer to the current class

        Returns
        -------
        dict
            The updated local data
        float
            The minimum distance between two atoms
        """
        local_jdata_cpy = local_jdata.copy()
        min_nbor_dist, local_jdata_cpy["sel"] = cls._update_sel_cls().update_one_sel(
            train_data, type_map, local_jdata_cpy["rcut"], local_jdata_cpy["sel"], False
        )
        return local_jdata_cpy, min_nbor_dist