From 4e7f91e0764961c9671ec7b6a36cde70886b4058 Mon Sep 17 00:00:00 2001
From: Rhys Goodall <rhys.goodall@outlook.com>
Date: Tue, 17 Feb 2026 18:08:27 -0500
Subject: [PATCH] fea: use first-party implementation

---
 pyproject.toml           |   2 +-
 tests/models/test_orb.py |  39 ++--
 torch_sim/models/orb.py  | 456 ++-------------------------------------
 3 files changed, 30 insertions(+), 467 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 1428e67b3..152abebbf 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -52,7 +52,7 @@ symmetry = ["moyopy>=0.3"]
 mace = ["mace-torch>=0.3.14"]
 mattersim = ["mattersim>=0.1.2"]
 metatomic = ["metatomic-torch>=0.1.3", "metatrain[pet]>=2025.12"]
-orb = ["orb-models>=0.5.2"]
+orb = ["orb-models[torchsim] @ git+https://github.com/orbital-materials/orb-models.git"]
 sevenn = ["sevenn>=0.11.0"]
 graphpes = ["graph-pes>=0.1", "mace-torch>=0.3.12"]
 nequip = ["nequip>=0.16.2"]
diff --git a/tests/models/test_orb.py b/tests/models/test_orb.py
index 118f6d307..a7bc4d1c9 100644
--- a/tests/models/test_orb.py
+++ b/tests/models/test_orb.py
@@ -1,22 +1,18 @@
 import traceback
 
-import numpy as np
 import pytest
-from ase.geometry.cell import cell_to_cellpar as ase_c2p
 
 from tests.conftest import DEVICE
 from tests.models.conftest import (
     make_model_calculator_consistency_test,
     make_validate_model_outputs_test,
 )
-from torch_sim import SimState
-from torch_sim.models.orb import cell_to_cellpar
 from torch_sim.testing import SIMSTATE_GENERATORS
 
 
 try:
     from orb_models.forcefield import pretrained
-    from orb_models.forcefield.calculator import ORBCalculator
+    from orb_models.forcefield.inference.calculator import ORBCalculator
 
     from torch_sim.models.orb import OrbModel
 except ImportError:
@@ -25,32 +21,36 @@
 
 @pytest.fixture
 def orbv3_conservative_inf_omat_model() -> OrbModel:
-    orb_ff = pretrained.orb_v3_conservative_inf_omat(
+    orb_ff, atoms_adapter = pretrained.orb_v3_conservative_inf_omat(
         device=DEVICE, precision="float32-high"
     )
-    return OrbModel(model=orb_ff, device=DEVICE)
+    return OrbModel(orb_ff, atoms_adapter, device=DEVICE)
 
 
 @pytest.fixture
 def orbv3_direct_20_omat_model() -> OrbModel:
-    orb_ff = pretrained.orb_v3_direct_20_omat(device=DEVICE, precision="float32-high")
-    return OrbModel(model=orb_ff, device=DEVICE)
+    orb_ff, atoms_adapter = pretrained.orb_v3_direct_20_omat(
+        device=DEVICE, precision="float32-high"
+    )
+    return OrbModel(orb_ff, atoms_adapter, device=DEVICE)
 
 
 @pytest.fixture
 def orbv3_conservative_inf_omat_calculator() -> ORBCalculator:
     """Create an ORBCalculator for the pretrained model."""
-    orb_ff = pretrained.orb_v3_conservative_inf_omat(
+    orb_ff, atoms_adapter = pretrained.orb_v3_conservative_inf_omat(
         device=DEVICE, precision="float32-high"
     )
-    return ORBCalculator(model=orb_ff, device=DEVICE)
+    return ORBCalculator(model=orb_ff, atoms_adapter=atoms_adapter, device=DEVICE)
 
 
 @pytest.fixture
 def orbv3_direct_20_omat_calculator() -> ORBCalculator:
     """Create an ORBCalculator for the pretrained model."""
-    orb_ff = pretrained.orb_v3_direct_20_omat(device=DEVICE, precision="float32-high")
-    return ORBCalculator(model=orb_ff, device=DEVICE)
+    orb_ff, atoms_adapter = pretrained.orb_v3_direct_20_omat(
+        device=DEVICE, precision="float32-high"
+    )
+    return ORBCalculator(model=orb_ff, atoms_adapter=atoms_adapter, device=DEVICE)
 
 
 test_orb_conservative_consistency = make_model_calculator_consistency_test(
@@ -78,16 +78,3 @@ def orbv3_direct_20_omat_calculator() -> ORBCalculator:
 test_validate_direct_model_outputs = make_validate_model_outputs_test(
     model_fixture_name="orbv3_direct_20_omat_model",
 )
-
-
-def test_cell_to_cellpar(ti_sim_state: SimState) -> None:
-    assert np.allclose(
-        ase_c2p(ti_sim_state.row_vector_cell.squeeze()),
-        cell_to_cellpar(ti_sim_state.row_vector_cell.squeeze(0)).cpu().numpy(),
-    )
-    assert np.allclose(
-        ase_c2p(ti_sim_state.row_vector_cell.squeeze(), radians=True),
-        cell_to_cellpar(ti_sim_state.row_vector_cell.squeeze(0), radians=True)
-        .cpu()
-        .numpy(),
-    )
diff --git a/torch_sim/models/orb.py b/torch_sim/models/orb.py
index f667b5c85..1a1d1157b 100644
--- a/torch_sim/models/orb.py
+++ b/torch_sim/models/orb.py
@@ -1,46 +1,34 @@
-"""ORB: PyTorch implementation of ORB models for atomistic simulations.
+"""Wrapper for ORB models in TorchSim.
 
-This module provides a TorchSim wrapper of the ORB models for computing
-energies, forces, and stresses of atomistic systems. It serves as a wrapper around
-the ORB models library, integrating it with the torch-sim framework to enable seamless
-simulation of atomistic systems with machine learning potentials.
+This module re-exports the ORB package's torch-sim integration for convenient
+importing. The actual implementation is maintained in the orb-models package.
 
-The OrbModel class adapts ORB models to the ModelInterface protocol,
-allowing them to be used within the broader torch-sim simulation framework.
-
-Notes:
-    This implementation requires orb_models to be installed and accessible.
-    It supports various model configurations through model instances or model paths.
+References:
+    - ORB Models Package: https://github.com/orbital-materials/orb-models
 """
 
-from __future__ import annotations
-
 import traceback
-import typing
 import warnings
-from pathlib import Path
 from typing import Any
 
-import torch
-
-import torch_sim as ts
-from torch_sim.elastic import voigt_6_to_full_3x3_stress
-from torch_sim.models.interface import ModelInterface
-
 
 try:
-    from orb_models.forcefield import featurization_utilities as feat_util
-    from orb_models.forcefield.atomic_system import SystemConfig
-    from orb_models.forcefield.base import AtomGraphs, _map_concat
+    from orb_models.forcefield.inference.orb_torchsim import OrbTorchSimModel
+
+    # Re-export with backward-compatible name
+    class OrbModel(OrbTorchSimModel):
+        """ORB model wrapper for torch-sim."""
 
 except ImportError as exc:
     warnings.warn(f"Orb import failed: {traceback.format_exc()}", stacklevel=2)
 
-    class OrbModel(ModelInterface):
+    from torch_sim.models.interface import ModelInterface
+
+    class OrbModel(ModelInterface):  # type: ignore[no-redef]
         """ORB model wrapper for torch-sim.
 
-        This class is a placeholder for the OrbModel class.
-        It raises an ImportError if orb_models is not installed.
+        NOTE: This class is a placeholder when orb-models is not installed.
+        It raises an ImportError if accessed.
         """
 
         def __init__(self, err: ImportError = exc, *_args: Any, **_kwargs: Any) -> None:
@@ -48,416 +36,4 @@ def __init__(self, err: ImportError = exc, *_args: Any, **_kwargs: Any) -> None:
             raise err
 
 
-if typing.TYPE_CHECKING:
-    from orb_models.forcefield.conservative_regressor import (
-        ConservativeForcefieldRegressor,
-    )
-    from orb_models.forcefield.direct_regressor import DirectForcefieldRegressor
-    from orb_models.forcefield.featurization_utilities import EdgeCreationMethod
-
-    from torch_sim.typing import StateDict
-
-
-def cell_to_cellpar(
-    cell: torch.Tensor,
-    radians: bool = False,  # noqa: FBT001, FBT002
-) -> torch.Tensor:
-    """Returns the cell parameters [a, b, c, alpha, beta, gamma].
-    torch version of ase's cell_to_cellpar.
-
-    Args:
-        cell:  lattice vector in row vector convention, same as ase
-        radians: If True, return angles in radians. Otherwise, return degrees (default).
-
-    Returns:
-        Tensor with [a, b, c, alpha, beta, gamma].
-    """
-    lengths = torch.linalg.norm(cell, dim=1)
-    angles = []
-    for i in range(3):
-        j = i - 1
-        k = i - 2
-        ll = lengths[j] * lengths[k]
-        if ll.item() > 1e-16:
-            x = torch.dot(cell[j], cell[k]) / ll
-            angle = 180.0 / torch.pi * torch.arccos(x)
-        else:
-            angle = torch.tensor(90.0, device=cell.device, dtype=cell.dtype)
-        angles.append(angle)
-    if radians:
-        angles = [angle * torch.pi / 180 for angle in angles]
-    return torch.concat((lengths, torch.stack(angles)))
-
-
-def state_to_atom_graphs(  # noqa: PLR0915
-    state: ts.SimState,
-    *,
-    wrap: bool = True,
-    edge_method: EdgeCreationMethod | None = None,
-    system_config: SystemConfig | None = None,
-    max_num_neighbors: int | None = None,
-    system_id: int | None = None,  # noqa: ARG001
-    half_supercell: bool | torch.Tensor = False,
-    device: torch.device | None = None,
-    output_dtype: torch.dtype | None = None,
-    graph_construction_dtype: torch.dtype | None = None,
-) -> AtomGraphs:
-    """Convert a SimState object into AtomGraphs format, ready for use in an ORB model.
-
-    Args:
-        state: SimState object containing atomic positions, cell, and atomic numbers
-        wrap: Whether to wrap atomic positions into the central unit cell (if there is
-        one).
-        edge_method (EdgeCreationMethod, optional): The method to use for graph edge
-            construction. If None, the edge method is chosen automatically based on
-            device and system size.
-        system_config: The system configuration to use for graph construction.
-        max_num_neighbors: Maximum number of neighbors each node can send messages to.
-            If None, will use system_config.max_num_neighbors.
-        system_id: Optional index that is relative to a particular dataset.
-        half_supercell (bool): Whether to use half the supercell for graph construction.
-            This can improve performance for large systems.
-        device: The device to put the tensors on.
-        output_dtype: The dtype to use for all floating point tensors stored on the
-            AtomGraphs object.
-        graph_construction_dtype: The dtype to use for floating point tensors in the
-            graph construction.
-
-    Returns:
-        AtomGraphs object containing the graph representation of the atomic system
-    """
-    if system_config is None:
-        system_config = SystemConfig(radius=6.0, max_num_neighbors=20)
-
-    # Handle batch information if present
-    n_node = torch.bincount(state.system_idx)
-
-    # Set default dtype if not provided
-    output_dtype = torch.get_default_dtype() if output_dtype is None else output_dtype
-    graph_construction_dtype = (
-        torch.get_default_dtype()
-        if graph_construction_dtype is None
-        else graph_construction_dtype
-    )
-
-    # Extract data from SimState
-    positions = state.positions
-    row_vector_cell = (
-        state.row_vector_cell
-    )  # Orb uses row vector cell convention for neighbor list
-    atomic_numbers = state.atomic_numbers.long()
-
-    max_num_neighbors = max_num_neighbors or system_config.max_num_neighbors
-
-    # Get atom embeddings for the model
-    n_atoms = len(atomic_numbers)
-    k_hot = (
-        system_config.diffuse_atom_types
-        if hasattr(system_config, "diffuse_atom_types")
-        else False
-    )
-
-    if k_hot:
-        atom_type_embedding = torch.ones(n_atoms, 118) * -feat_util.ATOM_TYPE_K
-        atom_type_embedding[torch.arange(n_atoms), atomic_numbers] = feat_util.ATOM_TYPE_K
-    else:
-        atom_type_embedding = torch.nn.functional.one_hot(atomic_numbers, num_classes=118)
-    atomic_numbers_embedding = atom_type_embedding.to(output_dtype)
-
-    # Wrap positions into the central cell if needed
-    if wrap and (torch.any(row_vector_cell != 0) and torch.any(state.pbc)):
-        positions = feat_util.batch_map_to_pbc_cell(positions, row_vector_cell, n_node)
-
-    n_systems = state.system_idx.max().item() + 1
-
-    # Prepare lists to collect data from each system
-    all_edges: list[torch.Tensor] = []
-    all_vectors: list[torch.Tensor] = []
-    all_unit_shifts: list[torch.Tensor] = []
-    num_edges: list[torch.Tensor] = []
-    node_feats_list: list[dict[str, torch.Tensor]] = []
-    edge_feats_list: list[dict[str, torch.Tensor]] = []
-    graph_feats_list: list[dict[str, torch.Tensor]] = []
-
-    # Process each system in a single loop
-    offset = 0
-    for sys_idx in range(n_systems):
-        system_mask = state.system_idx == sys_idx
-        positions_per_system = positions[system_mask]
-        atomic_numbers_per_system = atomic_numbers[system_mask]
-        atomic_numbers_embedding_per_system = atomic_numbers_embedding[system_mask]
-        cell_per_system = row_vector_cell[sys_idx]
-        pbc = state.pbc
-
-        # Compute edges directly for this system
-        edges, vectors, unit_shifts = feat_util.compute_pbc_radius_graph(
-            positions=positions_per_system,
-            cell=cell_per_system,
-            pbc=pbc,
-            radius=system_config.radius,
-            max_number_neighbors=max_num_neighbors,
-            edge_method=edge_method,
-            half_supercell=bool(half_supercell),
-            device=device,
-        )
-
-        # Adjust indices for the global batch
-        all_edges.append(edges + offset)
-        all_vectors.append(vectors)
-        all_unit_shifts.append(unit_shifts)
-        num_edges.append(len(edges[0]))
-
-        # Calculate lattice parameters
-        lattice_per_system = cell_to_cellpar(cell_per_system.squeeze(0))
-
-        # Create features dictionaries
-        node_feats = {
-            "positions": positions_per_system,
-            "atomic_numbers": atomic_numbers_per_system.to(torch.long),
-            "atomic_numbers_embedding": atomic_numbers_embedding_per_system,
-            "atom_identity": torch.arange(
-                len(positions_per_system), device=positions_per_system.device
-            ).to(torch.long),
-        }
-
-        edge_feats = {
-            "vectors": vectors,
-            "unit_shifts": unit_shifts,
-        }
-
-        graph_feats = {
-            "cell": cell_per_system,
-            "pbc": pbc,
-            "lattice": lattice_per_system.to(device=positions_per_system.device),
-        }
-
-        # Add batch dimension to non-scalar graph features
-        graph_feats = {
-            k: v.unsqueeze(0) if v.numel() > 1 else v for k, v in graph_feats.items()
-        }
-
-        node_feats_list.append(node_feats)
-        edge_feats_list.append(edge_feats)
-        graph_feats_list.append(graph_feats)
-
-        # Update offset for next system
-        offset += len(positions_per_system)
-
-    # Concatenate all the edge data
-    edge_index = torch.cat(all_edges, dim=1)
-    unit_shifts = torch.cat(all_unit_shifts, dim=0)
-    system_num_edges = torch.tensor(num_edges, dtype=torch.int64, device=device)
-
-    senders, receivers = edge_index[0], edge_index[1]
-
-    # Create and return AtomGraphs object
-    return AtomGraphs(
-        senders=senders,
-        receivers=receivers,
-        n_node=n_node,
-        n_edge=system_num_edges,
-        node_features=_map_concat(node_feats_list),
-        edge_features=_map_concat(edge_feats_list),
-        system_features=_map_concat(graph_feats_list),
-        node_targets={},  # No targets since we're using for inference
-        edge_targets={},
-        system_targets={},
-        fix_atoms=None,  # No fixed atoms in SimState
-        tags=None,  # No tags in SimState
-        radius=system_config.radius,
-        max_num_neighbors=torch.tensor([max_num_neighbors] * len(n_node)),
-        system_id=None,
-    ).to(device=device, dtype=output_dtype)
-
-
-class OrbModel(ModelInterface):
-    """Computes atomistic energies, forces and stresses using an ORB model.
-
-    This class wraps an ORB model to compute energies, forces, and stresses for
-    atomistic systems. It handles model initialization, configuration, and
-    provides a forward pass that accepts a SimState object and returns model
-    predictions.
-
-    Attributes:
-        model (Union[DirectForcefieldRegressor, ConservativeForcefieldRegressor]):
-            The ORB model
-        system_config (SystemConfig): Configuration for the atomic system
-        conservative (bool): Whether to use conservative forces/stresses calculation
-        implemented_properties (list): Properties the model can compute
-        _dtype (torch.dtype): Data type used for computation
-        _device (torch.device): Device where computation is performed
-        _edge_method (EdgeCreationMethod): Method for creating edges in the graph
-        _max_num_neighbors (int): Maximum number of neighbors for each atom
-        _half_supercell (bool): Whether to use half supercell optimization
-        _memory_scales_with (str): What the memory usage scales with
-
-    Examples:
-        >>> model = OrbModel(model=loaded_orb_model, compute_stress=True)
-        >>> results = model(state)
-    """
-
-    def __init__(
-        self,
-        model: DirectForcefieldRegressor | ConservativeForcefieldRegressor | str | Path,
-        *,  # force remaining arguments to be keyword-only
-        conservative: bool | None = None,
-        compute_stress: bool = True,
-        compute_forces: bool = True,
-        system_config: SystemConfig | None = None,
-        max_num_neighbors: int | None = None,
-        edge_method: EdgeCreationMethod | None = None,
-        half_supercell: bool | None = None,
-        device: torch.device | str | None = None,
-        dtype: torch.dtype = torch.float32,
-    ) -> None:
-        """Initialize the OrbModel with specified configuration.
-
-        Loads an ORB model from either a model object or a model path.
-        Sets up the model parameters for subsequent use in energy and force calculations.
-
-        Args:
-            model (DirectForcefieldRegressor|ConservativeForcefieldRegressor|str|Path):
-                Either a model object or a path to a saved model
-            conservative (bool | None): Whether to use conservative forces/stresses
-                If None, determined based on model type
-            compute_stress (bool): Whether to compute stress tensor
-            compute_forces (bool): Whether to compute forces
-            system_config (SystemConfig | None): Configuration for the atomic system
-                If None, defaults to SystemConfig(radius=6.0, max_num_neighbors=20)
-            max_num_neighbors (int | None): Maximum number of neighbors for each atom
-            edge_method (EdgeCreationMethod | None): Method for creating edges
-            half_supercell (bool | None): Whether to use half supercell optimization
-                If None, determined based on system size
-            device (torch.device | str | None): Device to run the model on
-            dtype (torch.dtype | None): Data type for computation
-
-        Raises:
-            ValueError: If conservative mode is requested but model doesn't support it
-            ImportError: If orb_models is not installed
-        """
-        super().__init__()
-
-        self._device = device or torch.device(
-            "cuda" if torch.cuda.is_available() else "cpu"
-        )
-        if isinstance(self._device, str):
-            self._device = torch.device(self._device)
-
-        self._dtype = dtype
-        self._compute_stress = compute_stress
-        self._compute_forces = compute_forces
-
-        # Load model if path is provided
-        if isinstance(model, str | Path):
-            loaded_model = torch.load(model, map_location=self._device)
-        elif isinstance(model, torch.nn.Module):
-            loaded_model = model
-        else:
-            raise TypeError("Model must be a path or torch.nn.Module")
-
-        # Set up system configuration
-        self.system_config = system_config or loaded_model.system_config
-        self._max_num_neighbors = max_num_neighbors
-        self._edge_method = edge_method
-        self._half_supercell = half_supercell
-        self.conservative = conservative
-
-        self.model = loaded_model.to(self._device)
-        self.model = self.model.eval()
-
-        if self.dtype is not None:
-            self.model = self.model.to(dtype=self.dtype)
-
-        # Determine if the model is conservative
-        model_is_conservative = hasattr(self.model, "grad_forces_name")
-        if self.conservative is None:
-            self.conservative = model_is_conservative
-
-        if self.conservative and not model_is_conservative:
-            raise ValueError(
-                "Conservative mode requested, but model is not a "
-                "ConservativeForcefieldRegressor."
-            )
-
-        # Set up implemented properties
-        self.implemented_properties = self.model.properties
-
-        # Add forces and stress to implemented properties if conservative model
-        if self.conservative:
-            self.implemented_properties.extend(["forces", "stress"])
-
-    def forward(self, state: ts.SimState | StateDict) -> dict[str, torch.Tensor]:
-        """Perform forward pass to compute energies, forces, and other properties.
-
-        Takes a simulation state and computes the properties implemented by the model,
-        such as energy, forces, and stresses.
-
-        Args:
-            state (SimState | StateDict): State object containing positions, cells,
-                atomic numbers, and other system information. If a dictionary is provided,
-                it will be converted to a SimState.
-
-        Returns:
-            dict: Model predictions, which may include:
-                - energy (torch.Tensor): Energy with shape [batch_size]
-                - forces (torch.Tensor): Forces with shape [n_atoms, 3]
-                - stress (torch.Tensor): Stress tensor with shape [batch_size, 3, 3],
-                    if compute_stress is True
-
-        Notes:
-            The state is automatically transferred to the model's device if needed.
-            All output tensors are detached from the computation graph.
-        """
-        sim_state = (
-            state
-            if isinstance(state, ts.SimState)
-            else ts.SimState(**state, masses=torch.ones_like(state["positions"]))
-        )
-
-        if sim_state.device != self._device:
-            sim_state = sim_state.to(self._device)
-
-        half_supercell = (
-            torch.min(sim_state.volume) > 1000
-            if self._half_supercell is None
-            else self._half_supercell
-        )
-
-        # Convert state to atom graphs
-        batch = state_to_atom_graphs(
-            sim_state,
-            system_config=self.system_config,
-            max_num_neighbors=self._max_num_neighbors,
-            edge_method=self._edge_method,
-            half_supercell=half_supercell,
-            device=self.device,
-        )
-
-        # Run forward pass
-        predictions = self.model.predict(batch)
-
-        results: dict[str, torch.Tensor] = {}
-        model_has_direct_heads = (
-            "forces" in self.model.heads and "stress" in self.model.heads
-        )
-        for prop in self.implemented_properties:
-            # The model has no direct heads for forces/stress, so we skip these props.
-            if not model_has_direct_heads and prop == "forces":
-                continue
-            if not model_has_direct_heads and prop == "stress":
-                continue
-            _property = "energy" if prop == "free_energy" else prop
-            results[prop] = predictions[_property]
-
-        if self.conservative:
-            results["forces"] = results[self.model.grad_forces_name]
-            results["stress"] = results[self.model.grad_stress_name]
-
-        if "stress" in results and results["stress"].shape[-1] == 6:
-            # NOTE: atleast_2d needed because orb internally gets rid of the batch
-            # dimension of the stress if it is 1.
-            results["stress"] = voigt_6_to_full_3x3_stress(
-                torch.atleast_2d(results["stress"])
-            )
-
-        return results
+__all__ = ["OrbModel"]