Source code for mattertune.backbones.m3gnet.model

from __future__ import annotations

import contextlib
import importlib.util
import logging
from dataclasses import dataclass
from pathlib import Path
from typing import TYPE_CHECKING, Literal

import nshconfig as C
import torch
import torch.nn.functional as F
from ase import Atoms
from torch.autograd import grad
from typing_extensions import final, override

from ...finetune import properties as props
from ...finetune.base import FinetuneModuleBase, FinetuneModuleBaseConfig, ModelOutput
from ...normalization import NormalizationContext
from ...registry import backbone_registry
from ...util import optional_import_error_message

if TYPE_CHECKING:
    from dgl import DGLGraph  # type: ignore[reportMissingImports] # noqa

log = logging.getLogger(__name__)


@dataclass
class MatGLData:
    g: DGLGraph
    """The DGL node graph for pairwise interactions."""
    lg: DGLGraph | None
    """The DGL edge graph for three-body interactions."""
    state_attr: torch.Tensor
    """The global state attributes"""
    lattice: torch.Tensor  # (1, 3, 3)
    """The atomic lattice vectors"""
    labels: dict[str, torch.Tensor]
    """The ground truth labels"""


@dataclass
class MatGLBatch:
    g: DGLGraph
    """The DGL node graph for pairwise interactions."""
    lg: DGLGraph | None
    """The DGL edge graph for three-body interactions."""
    state_attr: torch.Tensor
    """The global state attributes"""
    lattice: torch.Tensor  # (batch_size, 3, 3)
    """The atomic lattice vectors"""
    strain: torch.Tensor  # (batch_size, 3, 3)
    """The strain tensor"""
    labels: dict[str, torch.Tensor]
    """The ground truth labels"""


def _default_elements():
    with optional_import_error_message("matgl"):
        from matgl.config import DEFAULT_ELEMENTS  # type: ignore[reportMissingImports] # noqa

    return DEFAULT_ELEMENTS


class M3GNetGraphComputerConfig(C.Config):
    """Configuration for initializing a MatGL Atoms2Graph converter."""

    element_types: tuple[str, ...] = C.Field(default_factory=_default_elements)
    """The element types to consider, default is all elements."""
    cutoff: float | None = None
    """The cutoff distance for the neighbor list. If None, the cutoff is loaded from the checkpoint."""
    threebody_cutoff: float | None = None
    """The cutoff distance for the three-body interactions. If None, the cutoff is loaded from the checkpoint."""
    pre_compute_line_graph: bool = False
    """Whether to pre-compute the line graph for three-body interactions in data preparation."""
    graph_labels: list[int | float] | None = None
    """The graph labels to consider, default is None."""


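# A note on the defaults (illustrative sketch, not part of the API surface): leaving
# `cutoff` and `threebody_cutoff` as None defers to the values stored in the loaded
# checkpoint (see M3GNetBackboneModule.create_model below), e.g.
#
#     graph_computer = M3GNetGraphComputerConfig(pre_compute_line_graph=False)

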
@backbone_registry.register
class M3GNetBackboneConfig(FinetuneModuleBaseConfig):
    name: Literal["m3gnet"] = "m3gnet"
    """The type of the backbone."""
    ckpt_path: str | Path
    """The path to the pre-trained model checkpoint."""
    graph_computer: M3GNetGraphComputerConfig
    """Configuration for the graph computer."""

    @override
    def create_model(self):
        return M3GNetBackboneModule(self)

    @override
    @classmethod
    def ensure_dependencies(cls):
        if importlib.util.find_spec("matgl") is None:
            raise ImportError(
                "The `matgl` module is not installed. Please install it by running"
                " `pip install matgl`."
            )
        if importlib.util.find_spec("dgl") is None:
            raise ImportError(
                "The `dgl` module is not installed. Please install it by running"
                " `pip install dgl`."
            )


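# Example usage (a minimal sketch: the checkpoint path is a placeholder, and the
# `properties` field plus any other required fields are inherited from
# FinetuneModuleBaseConfig, so check the base config for the exact signature):
#
#     config = M3GNetBackboneConfig(
#         ckpt_path="path/to/m3gnet-checkpoint",
#         graph_computer=M3GNetGraphComputerConfig(),
#         properties=[...],
#     )
#     module = config.create_model()  # -> M3GNetBackboneModule

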
@final
class M3GNetBackboneModule(
    FinetuneModuleBase[MatGLData, MatGLBatch, M3GNetBackboneConfig]
):
    """
    Implementation of the M3GNet backbone that fits into the MatterTune framework.

    Follows the MatGL implementation of M3GNet.

    Paper: https://www.nature.com/articles/s43588-022-00349-3
    MatGL repo: https://github.com/materialsvirtuallab/matgl
    """

    @override
    @classmethod
    def hparams_cls(cls):
        return M3GNetBackboneConfig

    def _should_enable_grad(self):
        return self.calc_forces or self.calc_stress

    @override
    def requires_disabled_inference_mode(self):
        return self._should_enable_grad()

    @override
    def setup(self, stage: str):
        super().setup(stage)

        if self._should_enable_grad():
            for loop in (
                self.trainer.validate_loop,
                self.trainer.test_loop,
                self.trainer.predict_loop,
            ):
                if loop.inference_mode:
                    raise ValueError(
                        "Cannot run inference mode with forces or stress calculation. "
                        "Please set `inference_mode` to False in the trainer configuration."
                    )

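    # Context for the check above (an assumption about the surrounding setup, not
    # enforced here): when forces or stress are trained on, autograd must stay enabled
    # during evaluation, so the Lightning trainer should be constructed with inference
    # mode disabled, e.g. `lightning.Trainer(inference_mode=False, ...)`.
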
    @override
    def create_model(self):
        with optional_import_error_message("matgl"):
            from matgl.ext.ase import Atoms2Graph  # type: ignore[reportMissingImports] # noqa
            from matgl.models import M3GNet  # type: ignore[reportMissingImports] # noqa
            from matgl.utils.io import _get_file_paths  # type: ignore[reportMissingImports] # noqa

        ## Load the backbone from the checkpoint
        path = Path(self.hparams.ckpt_path)
        fpaths = _get_file_paths(path)
        self.backbone = M3GNet.load(fpaths)

        ## Build the graph computer
        if isinstance(self.hparams.graph_computer, dict):
            self.hparams.graph_computer = M3GNetGraphComputerConfig(
                **self.hparams.graph_computer
            )
        if self.hparams.graph_computer.cutoff is None:
            self.hparams.graph_computer.cutoff = self.backbone.cutoff
        if self.hparams.graph_computer.threebody_cutoff is None:
            self.hparams.graph_computer.threebody_cutoff = (
                self.backbone.threebody_cutoff
            )
        self.graph_computer = Atoms2Graph(
            element_types=self.hparams.graph_computer.element_types,
            cutoff=self.hparams.graph_computer.cutoff,
        )

        ## Check properties
        ## For now we only support energy, forces, and stress
        self.energy_prop_name = "energy"
        self.forces_prop_name = "forces"
        self.stress_prop_name = "stress"
        self.calc_forces = False
        self.calc_stress = False
        for prop in self.hparams.properties:
            match prop:
                case props.EnergyPropertyConfig():
                    self.energy_prop_name = prop.name
                case props.ForcesPropertyConfig():
                    assert (
                        prop.conservative
                    ), "Only conservative forces are supported for M3GNet"
                    self.forces_prop_name = prop.name
                    self.calc_forces = True
                case props.StressesPropertyConfig():
                    assert (
                        prop.conservative
                    ), "Only conservative stress is supported for M3GNet"
                    self.stress_prop_name = prop.name
                    self.calc_stress = True
                case _:
                    raise ValueError(
                        f"Unsupported property config: {prop} for M3GNet. "
                        "Please ask the maintainers of MatterTune or MatGL for support."
                    )
        if not self.calc_forces and self.calc_stress:
            raise ValueError(
                "Stress calculation requires force calculation; cannot calculate stress without forces."
            )

    @override
    @contextlib.contextmanager
    def model_forward_context(self, data):
        with contextlib.ExitStack() as stack:
            if self.calc_forces or self.calc_stress:
                stack.enter_context(torch.enable_grad())
            yield

    @override
    def model_forward(
        self,
        batch: MatGLBatch,
        return_backbone_output: bool = False,
    ):
        with optional_import_error_message("matgl"):
            import matgl  # type: ignore[reportMissingImports] # noqa

        g, lg, state_attr, lattice, strain = (
            batch.g,
            batch.lg,
            batch.state_attr,
            batch.lattice,
            batch.strain,
        )
        if return_backbone_output:
            backbone_output = self.backbone(
                g, state_attr, lg, return_all_layer_output=True
            )
            energy: torch.Tensor = torch.squeeze(backbone_output["final"])
        else:
            backbone_output = self.backbone(
                g, state_attr, lg, return_all_layer_output=False
            )
            energy: torch.Tensor = backbone_output
        output_pred: dict[str, torch.Tensor] = {self.energy_prop_name: energy}

        grad_vars = [g.ndata["pos"], strain] if self.calc_stress else [g.ndata["pos"]]
        grads = None
        if self.calc_forces:
            grads = grad(
                energy,
                grad_vars,
                grad_outputs=torch.ones_like(energy),
                create_graph=True,
                retain_graph=True,
                allow_unused=True,
            )
            forces: torch.Tensor = -grads[0]
            output_pred[self.forces_prop_name] = forces
        if self.calc_stress:
            volume = (
                torch.abs(torch.det(lattice.float())).half()
                if matgl.float_th == torch.float16
                else torch.abs(torch.det(lattice))
            )
            assert grads is not None, "Forces must be calculated to compute stress"
            sts = -grads[1]
            scale = 1.0 / volume * -160.21766208
            sts = (
                [i * j for i, j in zip(sts, scale)]
                if sts.dim() == 3
                else [sts * scale]
            )
            stress: torch.Tensor = torch.cat(sts)
            output_pred[self.stress_prop_name] = stress.reshape(-1, 3, 3)

        pred: ModelOutput = {"predicted_properties": output_pred}
        if return_backbone_output:
            pred["backbone_output"] = backbone_output

        return pred

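    # Unit bookkeeping for the stress branch of `model_forward` above: `grads[1]` is
    # dE/d(strain) in eV, and dividing by the cell volume |det(lattice)| (in A^3)
    # yields eV/A^3. The constant 160.21766208 converts eV/A^3 to GPa, and the two
    # explicit minus signs (on `sts` and inside `scale`) cancel, so the returned
    # stress follows the sigma = (1/V) * dE/d(strain) convention, in GPa.
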
    @override
    def pretrained_backbone_parameters(self):
        return self.backbone.parameters()

    @override
    def output_head_parameters(self):
        return []

    @override
    def cpu_data_transform(self, data):
        return data

    @override
    def collate_fn(self, data_list):
        with optional_import_error_message("dgl"):
            import dgl  # type: ignore[reportMissingImports] # noqa

        g = dgl.batch([data.g for data in data_list])
        if self.hparams.graph_computer.pre_compute_line_graph:
            lg = dgl.batch([data.lg for data in data_list if data.lg is not None])
        else:
            lg = None
        if self.hparams.graph_computer.graph_labels is not None:
            state_attr = torch.tensor(self.hparams.graph_computer.graph_labels).long()
        else:
            state_attr = torch.stack([data.state_attr for data in data_list])
        lattice = torch.concat([data.lattice for data in data_list], dim=0)
        strain = lattice.new_zeros([g.batch_size, 3, 3])
        labels = {}
        for key in data_list[0].labels:
            try:
                labels[key] = torch.cat([data.labels[key] for data in data_list], dim=0)
            except Exception:
                labels[key] = torch.stack([data.labels[key] for data in data_list])
        return MatGLBatch(g, lg, state_attr, lattice, strain, labels)

    @override
    def gpu_batch_transform(self, batch: MatGLBatch) -> MatGLBatch:
        if self.calc_stress:
            batch.strain.requires_grad_(True)
            batch.lattice = batch.lattice @ (
                torch.eye(3, device=batch.lattice.device) + batch.strain
            )
        batch.g.edata["lattice"] = torch.repeat_interleave(
            batch.lattice, batch.g.batch_num_edges(), dim=0
        )
        batch.g.edata["pbc_offshift"] = (
            batch.g.edata["pbc_offset"].unsqueeze(dim=-1) * batch.g.edata["lattice"]
        ).sum(dim=1)
        batch.g.ndata["pos"] = (
            batch.g.ndata["frac_coords"].unsqueeze(dim=-1)
            * torch.repeat_interleave(batch.lattice, batch.g.batch_num_nodes(), dim=0)
        ).sum(dim=1)
        if self.calc_forces:
            batch.g.ndata["pos"].requires_grad_(True)
        return batch

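    # How the strain enters: `gpu_batch_transform` multiplies the lattice by
    # (I + strain) with strain initialized to zero and, when stress is requested,
    # marked as requiring grad. Cartesian positions are then rebuilt from fractional
    # coordinates against this (possibly strained) lattice, so the energy depends on
    # `strain` through the geometry and the dE/d(strain) taken in `model_forward` is
    # the strain derivative evaluated at zero strain.
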
    @override
    def batch_to_labels(self, batch):
        return batch.labels

    @override
    def atoms_to_data(self, atoms: Atoms, has_labels: bool) -> MatGLData:
        with optional_import_error_message("matgl"):
            import matgl  # type: ignore[reportMissingImports] # noqa
            from matgl.graph.compute import (  # type: ignore[reportMissingImports] # noqa
                compute_pair_vector_and_distance,
                create_line_graph,
            )

        graph, lattice, state_attr = self.graph_computer.get_graph(atoms)
        graph.ndata["pos"] = torch.tensor(atoms.get_positions(), dtype=matgl.float_th)
        graph.edata["pbc_offshift"] = torch.matmul(
            graph.edata["pbc_offset"], lattice[0]
        )
        bond_vec, bond_dist = compute_pair_vector_and_distance(graph)
        graph.edata["bond_vec"] = bond_vec
        graph.edata["bond_dist"] = bond_dist
        if self.hparams.graph_computer.pre_compute_line_graph:
            line_graph = create_line_graph(
                graph, self.hparams.graph_computer.threebody_cutoff, directed=False
            )  # type: ignore
            for name in ["bond_vec", "bond_dist", "pbc_offset"]:
                line_graph.ndata.pop(name)
        else:
            line_graph = None
        graph.ndata.pop("pos")
        graph.edata.pop("pbc_offshift")
        state_attr = torch.tensor(state_attr).long()

        labels = {}
        if has_labels:
            for prop in self.hparams.properties:
                value = prop._from_ase_atoms_to_torch(atoms)
                # For stress, we should make sure it is (3, 3), not the flattened (6,)
                # that ASE returns.
                if isinstance(prop, props.StressesPropertyConfig):
                    from ase.constraints import voigt_6_to_full_3x3_stress

                    value = voigt_6_to_full_3x3_stress(value.float().numpy())
                    value = torch.from_numpy(value).float().reshape(1, 3, 3)
                labels[prop.name] = value

        return MatGLData(graph, line_graph, state_attr, lattice, labels)

    @override
    def create_normalization_context_from_batch(self, batch):
        with optional_import_error_message("dgl"):
            import dgl  # type: ignore[reportMissingImports] # noqa

        with optional_import_error_message("matgl"):
            from matgl.config import DEFAULT_ELEMENTS  # type: ignore[reportMissingImports] # noqa

        g = batch.g
        atomic_numbers: torch.Tensor = g.ndata["node_type"].long()  # (n_atoms,)

        # Convert atomic numbers to one-hot encoding
        g.ndata["atom_types_onehot"] = F.one_hot(
            atomic_numbers, num_classes=len(DEFAULT_ELEMENTS)
        ).float()
        # Sum the one-hot encoded atom types for each graph in the batch
        compositions = dgl.readout_nodes(g, feat="atom_types_onehot", op="sum")
        return NormalizationContext(compositions=compositions)


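# Example round trip (a minimal sketch: assumes `config` is an M3GNetBackboneConfig
# like the one sketched earlier, whose `properties` only requests energy so no
# gradients are needed; `bulk("Si")` is just an illustrative structure):
#
#     from ase.build import bulk
#
#     module = config.create_model()
#     data = module.atoms_to_data(bulk("Si"), has_labels=False)
#     batch = module.collate_fn([data])
#     batch = module.gpu_batch_transform(batch)
#     out = module.model_forward(batch)
#     energy = out["predicted_properties"]["energy"]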