Source code for torch_sim.models.fairchem_legacy

"""Wrapper for Legacy FairChem ecosystem models in TorchSim.

This module provides a TorchSim wrapper of the FairChem models for computing
energies, forces, and stresses of atomistic systems. It serves as a wrapper around
the FairChem library, integrating it with the torch_sim framework to enable seamless
simulation of atomistic systems with machine learning potentials.

The FairChemV1Model class adapts FairChem models to the ModelInterface protocol,
allowing them to be used within the broader torch_sim simulation framework.

Notes:
    This implementation requires FairChem < 2.0.0 to be installed and accessible.
    It supports various model configurations through configuration files or
    pretrained model checkpoints.
"""

# ruff: noqa: T201

from __future__ import annotations

import copy
import os
import traceback
import typing
import warnings
from pathlib import Path
from types import MappingProxyType
from typing import Any

import torch

from torch_sim.models.interface import ModelInterface


if typing.TYPE_CHECKING:
    from torch_sim.state import SimState


def _validate_fairchem_version() -> None:
    """Check for a compatible legacy FairChem version."""
    from importlib.metadata import version

    from packaging.version import parse

    fairchem_version = parse(version("fairchem-core"))
    if fairchem_version >= parse("2.0.0"):
        raise ImportError("FairChem v1.10.0 or lower is required")


try:
    _validate_fairchem_version()
    from fairchem.core.common.registry import registry
    from fairchem.core.common.utils import (
        load_config,
        setup_imports,
        setup_logging,
        update_config,
    )
    from fairchem.core.models.model_registry import model_name_to_local_file
    from torch_geometric.data import Batch, Data

except ImportError as exc:
    warnings.warn(f"FairChem import failed: {traceback.format_exc()}", stacklevel=2)

    class FairChemV1Model(ModelInterface):
        """FairChem model wrapper for torch_sim.

        This class is a placeholder for the FairChemV1Model class.
        It raises an ImportError if FairChem is not installed.
        """

        def __init__(self, err: ImportError = exc, *_args: Any, **_kwargs: Any) -> None:
            """Dummy init for type checking."""
            raise err


if typing.TYPE_CHECKING:
    from collections.abc import Callable


_DTYPE_DICT = {
    torch.float16: "float16",
    torch.float32: "float32",
    torch.float64: "float64",
}



[docs]
class FairChemV1Model(ModelInterface):
    """Computes atomistic energies, forces and stresses using a FairChem model.

    This class wraps a FairChem model to compute energies, forces, and stresses for
    atomistic systems. It handles model initialization, checkpoint loading, and
    provides a forward pass that accepts a SimState object and returns model
    predictions.

    The model can be initialized either with a configuration file or a pretrained
    checkpoint. It supports various model architectures and configurations supported by
    FairChem.

    Attributes:
        neighbor_list_fn (Callable | None): Function to compute neighbor lists
        config (dict): Complete model configuration dictionary
        trainer: FairChem trainer object that contains the model
        data_object (Batch): Data object containing system information
        implemented_properties (list): Model outputs the model can compute
        pbc (bool): Whether periodic boundary conditions are used
        _dtype (torch.dtype): Data type used for computation
        _compute_stress (bool): Whether to compute stress tensor
        _compute_forces (bool): Whether to compute forces
        _device (torch.device): Device where computation is performed
        _reshaped_props (dict): Properties that need reshaping after computation

    Examples:
        >>> model = FairChemV1Model(model="path/to/checkpoint.pt", compute_stress=True)
        >>> results = model(state)

    """

    _reshaped_props = MappingProxyType(
        {"stress": (-1, 3, 3), "dielectric_tensor": (-1, 3, 3)}
    )

    def __init__(  # noqa: C901, PLR0915
        self,
        model: str | Path | None = None,
        neighbor_list_fn: Callable | None = None,
        *,  # force remaining arguments to be keyword-only
        config_yml: str | None = None,
        local_cache: str | None = None,
        trainer: str | None = None,
        device: torch.device | None = None,
        seed: int | None = None,
        dtype: torch.dtype | None = None,
        compute_stress: bool = False,
        pbc: torch.Tensor | bool = True,
        disable_amp: bool = True,
    ) -> None:
        """Initialize the FairChemV1Model with specified configuration.

        Loads a FairChem model from either a checkpoint path or a configuration file.
        Sets up the model parameters, trainer, and configuration for subsequent use
        in energy and force calculations.

        Args:
            model (str | Path | None): Either a pretrained model name or path to model
                checkpoint file. The function will first check if it's a valid file
                path, and if not, will attempt to load it as a pretrained model name
                (requires local_cache to be set). If None, config_yml must be provided.
            neighbor_list_fn (Callable | None): Function to compute neighbor lists
                (not currently supported)
            config_yml (str | None): Path to configuration YAML file
            local_cache (str | None): Path to local model cache directory (required
                when using pretrained model names)
            trainer (str | None): Name of trainer class to use
            device (torch.device | None): Device to use for computation. If None,
                defaults to CUDA if available, otherwise CPU.
            seed (int | None): Random seed for reproducibility
            dtype (torch.dtype | None): Data type to use for computation
            compute_stress (bool): Whether to compute stress tensor
            pbc (torch.Tensor | bool): Whether to use periodic boundary conditions
            disable_amp (bool): Whether to disable AMP
        Raises:
            NotImplementedError: If custom neighbor list function is provided
            ValueError: If stress computation is requested but not supported by model
            ValueError: If neither config_yml nor model is provided
            ValueError: If model cannot be loaded as file or pretrained model

        Notes:
            Either config_yml or model must be provided. The model loads configuration
            from the checkpoint if config_yml is not specified.
        """
        setup_imports()
        setup_logging()
        super().__init__()

        self._dtype = dtype or torch.float32
        self._compute_stress = compute_stress
        self._compute_forces = True
        self._memory_scales_with = "n_atoms"
        if isinstance(pbc, bool):
            pbc = torch.tensor([pbc] * 3, dtype=torch.bool)
        elif not torch.all(pbc == pbc[0]):
            raise ValueError(
                f"FairChemV1Model does not support mixed PBC (got pbc={pbc.tolist()})"
            )
        self.pbc = pbc

        # Process model parameter if provided
        if model is not None:
            # Convert Path to string for consistency
            if isinstance(model, Path):
                model = str(model)

            # Determine if model is a file path or a pretrained model name
            # First check if it's a valid file path
            if not os.path.isfile(model):
                # If not a file, try to load as pretrained model name
                if local_cache is None:
                    raise ValueError(
                        f"Model '{model}' is not a valid file path. "
                        "If using a pretrained model name, local_cache must be set."
                    )
                # Attempt to load as pretrained model name
                model = model_name_to_local_file(
                    model_name=model, local_cache=local_cache
                )

        # Either the config path or the checkpoint path needs to be provided
        if not config_yml and model is None:
            raise ValueError("Either config_yml or model must be provided")

        checkpoint = None
        if config_yml is not None:
            if isinstance(config_yml, str):
                config, duplicates_warning, duplicates_error = load_config(config_yml)
                if len(duplicates_warning) > 0:
                    print(
                        "Overwritten config parameters from included configs "
                        f"(non-included parameters take precedence): {duplicates_warning}"
                    )
                if len(duplicates_error) > 0:
                    raise ValueError(
                        "Conflicting (duplicate) parameters in simultaneously "
                        f"included configs: {duplicates_error}"
                    )
            else:
                config = config_yml

            # Only keeps the train data that might have normalizer values
            if isinstance(config["dataset"], list):
                config["dataset"] = config["dataset"][0]
            elif isinstance(config["dataset"], dict):
                config["dataset"] = config["dataset"].get("train", None)
        else:
            # Loads the config from the checkpoint directly (always on CPU).
            if model is None:
                raise ValueError("model must be provided when config_yml is not set")
            checkpoint = torch.load(model, map_location=torch.device("cpu"))
            config = checkpoint["config"]

        if trainer is not None:
            config["trainer"] = trainer
        else:
            config["trainer"] = config.get("trainer", "ocp")

        if "model_attributes" in config:
            config["model_attributes"]["name"] = config.pop("model")
            config["model"] = config["model_attributes"]

        self.neighbor_list_fn = neighbor_list_fn

        if neighbor_list_fn is None:
            # Calculate the edge indices on the fly
            config["model"]["otf_graph"] = True
        else:
            raise NotImplementedError(
                "Custom neighbor list is not supported for FairChemV1Model."
            )

        pbc_bool = bool(self.pbc[0].item())

        if "backbone" in config["model"]:
            config["model"]["backbone"]["use_pbc"] = pbc_bool
            config["model"]["backbone"]["use_pbc_single"] = False
            if dtype is not None:
                try:
                    config["model"]["backbone"].update({"dtype": _DTYPE_DICT[dtype]})
                    for key in config["model"]["heads"]:
                        config["model"]["heads"][key].update(
                            {"dtype": _DTYPE_DICT[dtype]}
                        )
                except KeyError:
                    print(
                        "WARNING: dtype not found in backbone, using default model dtype"
                    )
        else:
            config["model"]["use_pbc"] = pbc_bool
            config["model"]["use_pbc_single"] = False
            if dtype is not None:
                try:
                    config["model"].update({"dtype": _DTYPE_DICT[dtype]})
                except KeyError:
                    print(
                        "WARNING: dtype not found in backbone, using default model dtype"
                    )

        ### backwards compatibility with OCP v<2.0
        config = update_config(config)

        self.config = copy.deepcopy(config)
        self.config["checkpoint"] = str(model)
        del config["dataset"]["src"]

        # Determine if CPU should be used (for the legacy trainer API)
        cpu = device is not None and device.type == "cpu"
        if device is None:
            cpu = not torch.cuda.is_available()

        self.trainer = registry.get_trainer_class(config["trainer"])(
            task=config.get("task", {}),
            model=config["model"],
            dataset=[config["dataset"]],
            outputs=config["outputs"],
            loss_functions=config["loss_functions"],
            evaluation_metrics=config["evaluation_metrics"],
            optimizer=config["optim"],
            identifier="",
            slurm=config.get("slurm", {}),
            local_rank=config.get("local_rank", 0),
            is_debug=config.get("is_debug", True),
            cpu=cpu,
            amp=False if dtype is not None else config.get("amp", False),
            inference_only=True,
        )

        if dtype is not None:
            # Convert model parameters to specified dtype
            self.trainer.model = self.trainer.model.to(dtype=self.dtype)

        if model is not None:
            self.load_checkpoint(checkpoint_path=model, checkpoint=checkpoint)

        seed = seed if seed is not None else self.trainer.config["cmd"]["seed"]
        if seed is None:
            print(
                "No seed has been set in model checkpoint or OCPCalculator! Results may "
                "not be reproducible on re-run"
            )
        else:
            self.trainer.set_seed(seed)

        if disable_amp:
            self.trainer.scaler = None

        self.implemented_properties = list(self.config["outputs"])

        self._device = self.trainer.device

        stress_output = "stress" in self.implemented_properties
        if not stress_output and compute_stress:
            raise NotImplementedError("Stress output not implemented for this model")


[docs]
    def load_checkpoint(
        self, checkpoint_path: str, checkpoint: dict | None = None
    ) -> None:
        """Load an existing trained model checkpoint.

        Loads model parameters from a checkpoint file or dictionary,
        setting the model to inference mode.

        Args:
            checkpoint_path (str): Path to the trained model checkpoint file
            checkpoint (dict | None): A pretrained checkpoint dictionary. If provided,
                this dictionary is used instead of loading from checkpoint_path.

        Notes:
            If loading fails, a message is printed but no exception is raised.
        """
        try:
            self.trainer.load_checkpoint(checkpoint_path, checkpoint, inference_only=True)
        except NotImplementedError:
            print("Unable to load checkpoint!")



[docs]
    def forward(  # noqa: C901
        self, state: SimState, **_kwargs: object
    ) -> dict[str, torch.Tensor]:
        """Perform forward pass to compute energies, forces, and other properties.

        Takes a simulation state and computes the properties implemented by the model,
        such as energy, forces, and stresses.

        Args:
            state (SimState): State object containing positions, cells, atomic numbers,
                and other system information.
            **_kwargs: Unused; accepted for interface compatibility.

        Returns:
            dict: Dictionary of model predictions, which may include:
                - energy (torch.Tensor): Energy with shape [batch_size]
                - forces (torch.Tensor): Forces with shape [n_atoms, 3]
                - stress (torch.Tensor): Stress tensor with shape [batch_size, 3, 3],
                    if compute_stress is True

        Notes:
            The state is automatically transferred to the model's device if needed.
            All output tensors are detached from the computation graph.
        """
        sim_state = state

        if sim_state.device != self._device:
            sim_state = sim_state.to(self._device)

        if sim_state.system_idx is None:
            sim_state.system_idx = torch.zeros(
                sim_state.positions.shape[0], dtype=torch.int
            )

        # Extract uniform PBC value from state (validate it's uniform)
        if isinstance(sim_state.pbc, torch.Tensor):
            if not torch.all(sim_state.pbc == sim_state.pbc[0]):
                raise ValueError(
                    "FairChemV1Model does not support mixed PBC "
                    f"(got state.pbc={sim_state.pbc.tolist()})"
                )
            state_pbc_bool = bool(sim_state.pbc[0].item())
        else:
            state_pbc_bool = bool(sim_state.pbc)

        model_pbc_bool = bool(self.pbc[0].item())

        if model_pbc_bool != state_pbc_bool:
            raise ValueError(
                f"PBC mismatch: model has pbc={model_pbc_bool}, "
                f"but state has pbc={state_pbc_bool}. "
                "FairChemV1Model requires model and state PBC to match."
            )

        natoms = torch.bincount(sim_state.system_idx)
        fixed = torch.zeros(
            (sim_state.system_idx.size(0), int(natoms.sum().item())), dtype=torch.int
        )
        data_list = []
        for idx, (n, c) in enumerate(
            zip(natoms, torch.cumsum(natoms, dim=0), strict=False)
        ):
            data_list.append(
                Data(
                    pos=sim_state.positions[c - n : c].detach().clone(),
                    cell=sim_state.row_vector_cell[idx, None].detach().clone(),
                    atomic_numbers=sim_state.atomic_numbers[c - n : c].detach().clone(),
                    fixed=fixed[c - n : c].detach().clone(),
                    natoms=n,
                    pbc=sim_state.pbc,
                )
            )
        self.data_object = Batch.from_data_list(data_list)

        if self.dtype is not None:
            self.data_object.pos = self.data_object.pos.to(self.dtype)
            self.data_object.cell = self.data_object.cell.to(self.dtype)

        predictions = self.trainer.predict(
            self.data_object, per_image=False, disable_tqdm=True
        )

        results = {}

        for key in predictions:
            _pred = predictions[key]
            if key in self._reshaped_props:
                _pred = _pred.reshape(self._reshaped_props.get(key)).squeeze()
            results[key] = _pred

        results["energy"] = results["energy"].squeeze(dim=1)
        if results.get("stress") is not None and len(results["stress"].shape) == 2:
            results["stress"] = results["stress"].unsqueeze(dim=0)
        return {k: v.detach() for k, v in results.items()}