"""The core state representation.
The main SimState class represents atomistic systems with support for batched
operations and conversion to/from various atomistic formats.
"""
import copy
import importlib
import typing
import warnings
from collections import defaultdict
from collections.abc import Generator
from dataclasses import dataclass
from typing import TYPE_CHECKING, Any, ClassVar, Literal, Self, cast
import torch
import torch_sim as ts
from torch_sim.typing import SimStateVar, StateLike
if TYPE_CHECKING:
from ase import Atoms
from phonopy.structure.atoms import PhonopyAtoms
from pymatgen.core import Structure
@dataclass(init=False)
class SimState:
"""State representation for atomistic systems with batched operations support.
Contains the fundamental properties needed to describe an atomistic system:
positions, masses, unit cell, periodic boundary conditions, and atomic numbers.
Supports batched operations where multiple atomistic systems can be processed
simultaneously, managed through system indices.
States support slicing, cloning, splitting, popping, and movement to other
data structures or devices. Slicing is supported through fancy indexing,
e.g. `state[[0, 1, 2]]` will return a new state containing only the first three
systems. The other operations are available through the `pop`, `split`, `clone`,
and `to` methods.
Attributes:
positions (torch.Tensor): Atomic positions with shape (n_atoms, 3)
masses (torch.Tensor): Atomic masses with shape (n_atoms,)
cell (torch.Tensor): Unit cell vectors with shape (n_systems, 3, 3).
Note that we use a column vector convention, i.e. the cell vectors are
stored as `[[a1, b1, c1], [a2, b2, c2], [a3, b3, c3]]` as opposed to
the row vector convention `[[a1, a2, a3], [b1, b2, b3], [c1, c2, c3]]`
used by ASE.
pbc (bool): Boolean indicating whether to use periodic boundary conditions
atomic_numbers (torch.Tensor): Atomic numbers with shape (n_atoms,)
system_idx (torch.Tensor): Maps each atom index to its system index.
Has shape (n_atoms,); values must be consecutive integers starting from 0,
with atoms belonging to the same system grouped together.
Properties:
wrap_positions (torch.Tensor): Positions wrapped according to periodic boundary
conditions
device (torch.device): Device of the positions tensor
dtype (torch.dtype): Data type of the positions tensor
n_atoms (int): Total number of atoms across all systems
n_systems (int): Number of systems in the state
Notes:
- positions must have shape (n_atoms, 3); masses and atomic_numbers must
have shape (n_atoms,).
- cell must use the column vector convention with shape (n_systems, 3, 3).
- system indices must be consecutive integers starting from 0.
Examples:
>>> state = initialize_state(
... [ase_atoms_1, ase_atoms_2, ase_atoms_3], device, dtype
... )
>>> state.n_systems
3
>>> new_state = state[[0, 1]]
>>> new_state.n_systems
2
>>> cloned_state = state.clone()
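>>> # row_vector_cell is the ASE-style transpose of the stored cell
>>> torch.allclose(cloned_state.row_vector_cell, cloned_state.cell.mT)
True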
"""
positions: torch.Tensor
masses: torch.Tensor
cell: torch.Tensor
pbc: bool # TODO: do all calculators support mixed pbc?
atomic_numbers: torch.Tensor
system_idx: torch.Tensor
_atom_attributes: ClassVar[set[str]] = {
"positions",
"masses",
"atomic_numbers",
"system_idx",
}
_system_attributes: ClassVar[set[str]] = {"cell"}
_global_attributes: ClassVar[set[str]] = {"pbc"}
def __init__(
self,
positions: torch.Tensor,
masses: torch.Tensor,
cell: torch.Tensor,
pbc: bool, # noqa: FBT001 # TODO(curtis): maybe make the constructor be keyword-only (it can be easy to confuse positions vs masses, etc.)
atomic_numbers: torch.Tensor,
system_idx: torch.Tensor | None = None,
) -> None:
"""Initialize the SimState and validate the arguments.
Args:
positions (torch.Tensor): Atomic positions with shape (n_atoms, 3)
masses (torch.Tensor): Atomic masses with shape (n_atoms,)
cell (torch.Tensor): Unit cell vectors with shape (n_systems, 3, 3).
pbc (bool): Boolean indicating whether to use periodic boundary conditions
atomic_numbers (torch.Tensor): Atomic numbers with shape (n_atoms,)
system_idx (torch.Tensor | None): Maps each atom index to its system index.
Has shape (n_atoms,); values must be consecutive integers starting from 0.
If not provided, it is initialized to zeros.
"""
self.positions = positions
self.masses = masses
self.cell = cell
self.pbc = pbc
self.atomic_numbers = atomic_numbers
# Validate and process the state after initialization: check shapes and
# devices, and fill in system_idx if it was not provided.
# TODO: pbc should probably become a tensor here.
# Raise a clean error if the tensors are not all on the same device.
devices = {
attr: getattr(self, attr).device
for attr in ("positions", "masses", "cell", "atomic_numbers")
}
if len(set(devices.values())) > 1:
raise ValueError("All tensors must be on the same device")
# Check that positions, masses and atomic numbers have compatible shapes
shapes = [
getattr(self, attr).shape[0]
for attr in ("positions", "masses", "atomic_numbers")
]
if len(set(shapes)) > 1:
raise ValueError(
f"Incompatible shapes: positions {shapes[0]}, "
f"masses {shapes[1]}, atomic_numbers {shapes[2]}"
)
if system_idx is None:
self.system_idx = torch.zeros(
self.n_atoms, device=self.device, dtype=torch.int64
)
else:
# assert that system indices are unique consecutive integers
# TODO(curtis): I feel like this logic is not reliable.
# I'll come up with something better later.
_, counts = torch.unique_consecutive(system_idx, return_counts=True)
if not torch.all(counts == torch.bincount(system_idx)):
raise ValueError("System indices must be unique consecutive integers")
self.system_idx = system_idx
if self.cell.ndim != 3 and system_idx is None:
self.cell = self.cell.unsqueeze(0)
if self.cell.shape[-2:] != (3, 3):
raise ValueError("Cell must have shape (n_systems, 3, 3)")
if self.cell.shape[0] != self.n_systems:
raise ValueError(
f"Cell must have shape (n_systems, 3, 3), got {self.cell.shape}"
)
@property
def wrap_positions(self) -> torch.Tensor:
"""Atomic positions wrapped according to periodic boundary conditions if pbc=True,
otherwise returns unwrapped positions with shape (n_atoms, 3).
"""
# TODO: implement a wrapping method
return self.positions
@property
def device(self) -> torch.device:
"""The device where the tensor data is located."""
return self.positions.device
@property
def dtype(self) -> torch.dtype:
"""The data type of the positions tensor."""
return self.positions.dtype
@property
def n_atoms(self) -> int:
"""Total number of atoms in the system across all systems."""
return self.positions.shape[0]
@property
def n_atoms_per_system(self) -> torch.Tensor:
"""Number of atoms per system."""
return (
self.system_idx.bincount()
if self.system_idx is not None
else torch.tensor([self.n_atoms], device=self.device)
)
@property
def n_atoms_per_batch(self) -> torch.Tensor:
"""Number of atoms per batch.
.. deprecated::
Use :attr:`n_atoms_per_system` instead.
"""
warnings.warn(
"n_atoms_per_batch is deprecated, use n_atoms_per_system instead",
DeprecationWarning,
stacklevel=2,
)
return self.n_atoms_per_system
@property
def batch(self) -> torch.Tensor:
"""System indices.
.. deprecated::
Use :attr:`system_idx` instead.
"""
warnings.warn(
"batch is deprecated, use system_idx instead",
DeprecationWarning,
stacklevel=2,
)
return self.system_idx
@batch.setter
def batch(self, system_idx: torch.Tensor) -> None:
"""Set the system indices from a batch index.
.. deprecated::
Use :attr:`system_idx` instead.
"""
warnings.warn(
"Setting batch is deprecated, use system_idx instead",
DeprecationWarning,
stacklevel=2,
)
self.system_idx = system_idx
@property
def n_batches(self) -> int:
"""Number of batches in the system.
.. deprecated::
Use :attr:`n_systems` instead.
"""
warnings.warn(
"n_batches is deprecated, use n_systems instead",
DeprecationWarning,
stacklevel=2,
)
return self.n_systems
@property
def n_systems(self) -> int:
"""Number of systems in the system."""
return torch.unique(self.system_idx).shape[0]
@property
def volume(self) -> torch.Tensor:
"""Volume of the system."""
if not self.pbc:
raise ValueError("Volume is only defined for periodic systems")
return torch.det(self.cell)
@property
def column_vector_cell(self) -> torch.Tensor:
"""Unit cell following the column vector convention."""
return self.cell
@column_vector_cell.setter
def column_vector_cell(self, value: torch.Tensor) -> None:
"""Set the unit cell from value following the column vector convention.
Args:
value: The unit cell as a column vector
"""
self.cell = value
@property
def row_vector_cell(self) -> torch.Tensor:
"""Unit cell following the row vector convention."""
return self.cell.mT
@row_vector_cell.setter
def row_vector_cell(self, value: torch.Tensor) -> None:
"""Set the unit cell from value following the row vector convention.
Args:
value: The unit cell as a row vector
"""
self.cell = value.mT
def clone(self) -> Self:
"""Create a deep copy of the SimState.
Creates a new SimState object with identical but independent tensors,
allowing modification without affecting the original.
Returns:
SimState: A new SimState object with the same properties as the original
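Examples:
A minimal sketch, assuming `state` is an existing SimState:
>>> cloned = state.clone()
>>> cloned.positions is state.positions
False
>>> torch.equal(cloned.positions, state.positions)
True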
"""
attrs = {}
for attr_name, attr_value in vars(self).items():
if isinstance(attr_value, torch.Tensor):
attrs[attr_name] = attr_value.clone()
else:
attrs[attr_name] = copy.deepcopy(attr_value)
return self.__class__(**attrs)
def to_atoms(self) -> list["Atoms"]:
"""Convert the SimState to a list of ASE Atoms objects.
Returns:
list[Atoms]: A list of ASE Atoms objects, one per system
"""
return ts.io.state_to_atoms(self)
def to_structures(self) -> list["Structure"]:
"""Convert the SimState to a list of pymatgen Structure objects.
Returns:
list[Structure]: A list of pymatgen Structure objects, one per system
"""
return ts.io.state_to_structures(self)
def to_phonopy(self) -> list["PhonopyAtoms"]:
"""Convert the SimState to a list of PhonopyAtoms objects.
Returns:
list[PhonopyAtoms]: A list of PhonopyAtoms objects, one per system
"""
return ts.io.state_to_phonopy(self)
def split(self) -> list[Self]:
"""Split the SimState into a list of single-system SimStates.
Divides the current state into separate states, each containing a single system,
preserving all properties appropriately for each system.
Returns:
list[SimState]: A list of SimState objects, one per system
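Examples:
A sketch, assuming `state` holds several systems:
>>> substates = state.split()
>>> len(substates) == state.n_systems
True
>>> all(s.n_systems == 1 for s in substates)
True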
"""
return _split_state(self)
def pop(self, system_indices: int | list[int] | slice | torch.Tensor) -> list[Self]:
"""Pop off states with the specified system indices.
This method modifies the original state object by removing the specified
systems and returns the removed systems as separate SimState objects.
Args:
system_indices (int | list[int] | slice | torch.Tensor): The system indices
to pop
Returns:
list[SimState]: Popped SimState objects, one per system index
Notes:
This method modifies the original SimState in-place.
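Examples:
A sketch, assuming `state` initially holds three systems:
>>> popped = state.pop([1])
>>> [s.n_systems for s in popped]
[1]
>>> state.n_systems  # the original state was modified in place
2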
"""
system_indices = _normalize_system_indices(
system_indices, self.n_systems, self.device
)
# Get the modified state and popped states
modified_state, popped_states = _pop_states(self, system_indices)
# Update all attributes of self with the modified state's attributes
for attr_name, attr_value in vars(modified_state).items():
setattr(self, attr_name, attr_value)
return cast("list[Self]", popped_states)
def to(
self, device: torch.device | None = None, dtype: torch.dtype | None = None
) -> Self:
"""Convert the SimState to a new device and/or data type.
Args:
device (torch.device, optional): The target device.
Defaults to current device.
dtype (torch.dtype, optional): The target data type.
Defaults to current dtype.
Returns:
SimState: A new SimState with tensors on the specified device and dtype
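Examples:
A sketch, assuming `state` is a float32 SimState:
>>> state64 = state.to(dtype=torch.float64)
>>> state64.dtype
torch.float64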
"""
return state_to_device(self, device, dtype)
def __getitem__(self, system_indices: int | list[int] | slice | torch.Tensor) -> Self:
"""Enable standard Python indexing syntax for slicing batches.
Args:
system_indices (int | list[int] | slice | torch.Tensor): The system indices
to include
Returns:
SimState: A new SimState containing only the specified systems
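Examples:
A sketch, assuming `state` holds three systems:
>>> state[0].n_systems
1
>>> state[[0, -1]].n_systems  # negative indices count from the end
2
>>> state[1:].n_systems  # slices are also supported
2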
"""
# TODO: need to document that slicing is supported
# Reuse the existing slice method
system_indices = _normalize_system_indices(
system_indices, self.n_systems, self.device
)
return _slice_state(self, system_indices)
def __init_subclass__(cls, **kwargs) -> None:
"""Enforce that all derived states cannot have tensor attributes that can also be
None. This is because torch.concatenate cannot concat between a tensor and a None.
See https://github.com/Radical-AI/torch-sim/pull/219 for more details.
Also enforce all of child classes's attributes are specified in _atom_attributes,
_system_attributes, or _global_attributes.
"""
cls._assert_no_tensor_attributes_can_be_none()
cls._assert_all_attributes_have_defined_scope()
super().__init_subclass__(**kwargs)
@classmethod
def _assert_no_tensor_attributes_can_be_none(cls) -> None:
# We need to use get_type_hints to correctly inspect the types
type_hints = typing.get_type_hints(cls)
for attr_name, attr_typehint in type_hints.items():
origin = typing.get_origin(attr_typehint)
is_union = origin is typing.Union
if not is_union and origin is not None:
# For Python 3.10+ `|` syntax, origin is types.UnionType
# We check by name to be robust against module reloading/patching issues
is_union = origin.__module__ == "types" and origin.__name__ == "UnionType"
if is_union:
args = typing.get_args(attr_typehint)
if torch.Tensor in args and type(None) in args:
raise TypeError(
f"Attribute '{attr_name}' in class '{cls.__name__}' is not "
"allowed to be of type 'torch.Tensor | None' because torch.cat "
"cannot concatenate between a tensor and a None. Please default "
"the tensor with dummy values and track the 'None' case."
)
@classmethod
def _assert_all_attributes_have_defined_scope(cls) -> None:
all_defined_attributes = (
cls._atom_attributes | cls._system_attributes | cls._global_attributes
)
# 1) assert that no attribute is defined twice in all_defined_attributes
duplicates = (
(cls._atom_attributes & cls._system_attributes)
| (cls._atom_attributes & cls._global_attributes)
| (cls._system_attributes & cls._global_attributes)
)
if duplicates:
raise TypeError(
f"Attributes {duplicates} are declared in more than one of "
f"{cls.__name__}'s _atom_attributes, _system_attributes, and "
"_global_attributes"
)
# 2) assert that all attributes are defined in all_defined_attributes
all_annotations = {}
for c in cls.mro():
if hasattr(c, "__annotations__"):
all_annotations.update(c.__annotations__)
attributes_to_check = set(vars(cls).keys()) | set(all_annotations.keys())
for attr_name in attributes_to_check:
is_special_attribute = attr_name.startswith("__")
is_property = attr_name in vars(cls) and isinstance(
vars(cls).get(attr_name), property
)
is_method = hasattr(cls, attr_name) and callable(getattr(cls, attr_name))
is_class_variable = (
# Note: _atom_attributes, _system_attributes, and _global_attributes
# are all class variables
typing.get_origin(all_annotations.get(attr_name)) is typing.ClassVar
)
if is_special_attribute or is_property or is_method or is_class_variable:
continue
if attr_name not in all_defined_attributes:
raise TypeError(
f"Attribute '{attr_name}' is not defined in {cls.__name__} in any "
"of _atom_attributes, _system_attributes, or _global_attributes"
)
def _normalize_system_indices(
system_indices: int | list[int] | slice | torch.Tensor,
n_systems: int,
device: torch.device,
) -> torch.Tensor:
"""Normalize system indices to handle negative indices and different input types.
Converts various system index representations to a consistent tensor format,
handling negative indices in the Python style (counting from the end).
Args:
system_indices (int | list[int] | slice | torch.Tensor): The system indices to
normalize
n_systems (int): Total number of systems in the state
device (torch.device): Device to place the output tensor on
Returns:
torch.Tensor: Normalized system indices as a tensor
Raises:
TypeError: If system_indices is of an unsupported type
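Examples:
>>> _normalize_system_indices(-1, n_systems=3, device=torch.device("cpu"))
tensor([2])
>>> _normalize_system_indices(slice(1, None), 3, torch.device("cpu"))
tensor([1, 2])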
"""
if isinstance(system_indices, int):
# Handle negative integer indexing
if system_indices < 0:
system_indices = n_systems + system_indices
return torch.tensor([system_indices], device=device)
if isinstance(system_indices, list):
# Handle negative indices in lists
normalized = [idx if idx >= 0 else n_systems + idx for idx in system_indices]
return torch.tensor(normalized, device=device)
if isinstance(system_indices, slice):
# Let PyTorch handle the slice conversion with negative indices
return torch.arange(n_systems, device=device)[system_indices]
if isinstance(system_indices, torch.Tensor):
# Handle negative indices in tensors
return torch.where(system_indices < 0, n_systems + system_indices, system_indices)
raise TypeError(f"Unsupported index type: {type(system_indices)}")
def state_to_device(
state: SimStateVar,
device: torch.device | None = None,
dtype: torch.dtype | None = None,
) -> SimStateVar:
"""Convert the SimState to a new device and dtype.
Creates a new SimState with all tensors moved to the specified device and
with the specified data type.
Args:
state (SimState): The state to convert
device (torch.device, optional): The target device. Defaults to current device.
dtype (torch.dtype, optional): The target data type. Defaults to current dtype.
Returns:
SimState: A new SimState with tensors on the specified device and dtype
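Examples:
A sketch, assuming `state` is a float32 SimState:
>>> state64 = state_to_device(state, dtype=torch.float64)
>>> state64.positions.dtype
torch.float64
>>> state64.atomic_numbers.dtype  # atomic numbers remain integral
torch.int32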
"""
if device is None:
device = state.device
if dtype is None:
dtype = state.dtype
# Copy the attribute dict so the input state is not mutated in place
attrs = vars(state).copy()
for attr_name, attr_value in attrs.items():
if isinstance(attr_value, torch.Tensor):
attrs[attr_name] = attr_value.to(device=device)
attrs["positions"] = attrs["positions"].to(dtype=dtype)
attrs["masses"] = attrs["masses"].to(dtype=dtype)
attrs["cell"] = attrs["cell"].to(dtype=dtype)
attrs["atomic_numbers"] = attrs["atomic_numbers"].to(dtype=torch.int)
return type(state)(**attrs)
def get_attrs_for_scope(
state: SimState, scope: Literal["per-atom", "per-system", "global"]
) -> Generator[tuple[str, Any], None, None]:
"""Get attributes for a given scope.
Args:
state (SimState): The state to get attributes for
scope (Literal["per-atom", "per-system", "global"]): The scope to get
attributes for
Returns:
Generator[tuple[str, Any], None, None]: A generator of attribute names and values
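Examples:
A sketch, assuming `state` is a plain periodic SimState:
>>> dict(get_attrs_for_scope(state, "global"))
{'pbc': True}
>>> sorted(name for name, _ in get_attrs_for_scope(state, "per-atom"))
['atomic_numbers', 'masses', 'positions', 'system_idx']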
"""
match scope:
case "per-atom":
attr_names = state._atom_attributes # noqa: SLF001
case "per-system":
attr_names = state._system_attributes # noqa: SLF001
case "global":
attr_names = state._global_attributes # noqa: SLF001
case _:
raise ValueError(f"Unknown scope: {scope!r}")
for attr_name in attr_names:
yield attr_name, getattr(state, attr_name)
def _filter_attrs_by_mask(
state: SimState,
atom_mask: torch.Tensor,
system_mask: torch.Tensor,
) -> dict:
"""Filter attributes by atom and system masks.
Selects subsets of attributes based on boolean masks for atoms and systems.
Args:
state (SimState): The state to filter
atom_mask (torch.Tensor): Boolean mask for atoms to include with shape
(n_atoms,)
system_mask (torch.Tensor): Boolean mask for systems to include with shape
(n_systems,)
Returns:
dict: Filtered attributes with appropriate handling for each scope
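Examples:
A sketch, assuming `state` holds two systems and we keep only the first:
>>> attrs = _filter_attrs_by_mask(
...     state, state.system_idx == 0, torch.tensor([True, False])
... )
>>> attrs["system_idx"].unique()
tensor([0])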
"""
# Copy global attributes directly
filtered_attrs = dict(get_attrs_for_scope(state, "global"))
# Filter per-atom attributes
for attr_name, attr_value in get_attrs_for_scope(state, "per-atom"):
if attr_name == "system_idx":
# Get the old system indices for the selected atoms
old_system_idxs = attr_value[atom_mask]
# Get the system indices that are kept
kept_indices = torch.arange(attr_value.max() + 1, device=attr_value.device)[
system_mask
]
# Create a mapping from old system indices to new consecutive indices
system_idx_map = {idx.item(): i for i, idx in enumerate(kept_indices)}
# Create new system tensor with remapped indices
new_system_idxs = torch.tensor(
[system_idx_map[b.item()] for b in old_system_idxs],
device=attr_value.device,
dtype=attr_value.dtype,
)
filtered_attrs[attr_name] = new_system_idxs
else:
filtered_attrs[attr_name] = attr_value[atom_mask]
# Filter per-system attributes
for attr_name, attr_value in get_attrs_for_scope(state, "per-system"):
filtered_attrs[attr_name] = attr_value[system_mask]
return filtered_attrs
def _split_state(
state: SimStateVar,
) -> list[SimStateVar]:
"""Split a SimState into a list of states, each containing a single system.
Divides a multi-system state into individual single-system states, preserving
appropriate properties for each system.
Args:
state (SimState): The SimState to split
Returns:
list[SimState]: A list of SimState objects, each containing a single
system
"""
system_sizes = torch.bincount(state.system_idx).tolist()
split_per_atom = {}
for attr_name, attr_value in get_attrs_for_scope(state, "per-atom"):
if attr_name != "system_idx":
split_per_atom[attr_name] = torch.split(attr_value, system_sizes, dim=0)
split_per_system = {}
for attr_name, attr_value in get_attrs_for_scope(state, "per-system"):
split_per_system[attr_name] = torch.split(attr_value, 1, dim=0)
global_attrs = dict(get_attrs_for_scope(state, "global"))
# Create a state for each system
states = []
n_systems = len(system_sizes)
for i in range(n_systems):
system_attrs = {
# Create a system tensor with all zeros for this system
"system_idx": torch.zeros(
system_sizes[i], device=state.device, dtype=torch.int64
),
# Add the split per-atom attributes
**{attr_name: split_per_atom[attr_name][i] for attr_name in split_per_atom},
# Add the split per-system attributes
**{
attr_name: split_per_system[attr_name][i]
for attr_name in split_per_system
},
# Add the global attributes
**global_attrs,
}
states.append(type(state)(**system_attrs))
return states
def _pop_states(
state: SimState,
pop_indices: list[int] | torch.Tensor,
) -> tuple[SimState, list[SimState]]:
"""Pop off the states with the specified indices.
Extracts and removes the specified system indices from the state.
Args:
state (SimState): The SimState to modify
pop_indices (list[int] | torch.Tensor): The system indices to extract and remove
Returns:
tuple[SimState, list[SimState]]: A tuple containing:
- The modified original state with specified systems removed
- A list of the extracted SimStates, one per popped system
Notes:
Unlike the pop method, this function does not modify the input state.
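Examples:
A sketch, assuming `state` holds three systems:
>>> kept, popped = _pop_states(state, [0])
>>> kept.n_systems
2
>>> len(popped)
1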
"""
if len(pop_indices) == 0:
return state, []
if isinstance(pop_indices, list):
pop_indices = torch.tensor(pop_indices, device=state.device, dtype=torch.int64)
# Create masks for the atoms and systems to keep and pop
system_range = torch.arange(state.n_systems, device=state.device)
pop_system_mask = torch.isin(system_range, pop_indices)
keep_system_mask = ~pop_system_mask
pop_atom_mask = torch.isin(state.system_idx, pop_indices)
keep_atom_mask = ~pop_atom_mask
# Filter attributes for keep and pop states
keep_attrs = _filter_attrs_by_mask(state, keep_atom_mask, keep_system_mask)
pop_attrs = _filter_attrs_by_mask(state, pop_atom_mask, pop_system_mask)
# Create the keep state
keep_state = type(state)(**keep_attrs)
# Create and split the pop state
pop_state = type(state)(**pop_attrs)
pop_states = _split_state(pop_state)
return keep_state, pop_states
def _slice_state(
state: SimStateVar,
system_indices: list[int] | torch.Tensor,
) -> SimStateVar:
"""Slice a substate from the SimState containing only the specified system indices.
Creates a new SimState containing only the specified systems, preserving
all relevant properties.
Args:
state (SimState): The state to slice
system_indices (list[int] | torch.Tensor): System indices to include in the
sliced state
Returns:
SimState: A new SimState object containing only the specified systems
Raises:
ValueError: If system_indices is empty
"""
if isinstance(system_indices, list):
system_indices = torch.tensor(
system_indices, device=state.device, dtype=torch.int64
)
if len(system_indices) == 0:
raise ValueError("system_indices cannot be empty")
# Create masks for the atoms and systems to include
system_range = torch.arange(state.n_systems, device=state.device)
system_mask = torch.isin(system_range, system_indices)
atom_mask = torch.isin(state.system_idx, system_indices)
# Filter attributes
filtered_attrs = _filter_attrs_by_mask(state, atom_mask, system_mask)
# Create the sliced state
return type(state)(**filtered_attrs)
def concatenate_states(
states: list[SimState], device: torch.device | None = None
) -> SimState:
"""Concatenate a list of SimStates into a single SimState.
Combines multiple states into a single state with multiple systems.
Global properties are taken from the first state, and per-atom and per-system
properties are concatenated.
Args:
states (list[SimState]): A list of SimState objects to concatenate
device (torch.device, optional): The device to place the concatenated state on.
Defaults to the device of the first state.
Returns:
SimState: A new SimState containing all input states as separate systems
Raises:
ValueError: If states is empty
TypeError: If not all states are of the same type
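Examples:
A sketch, assuming `state_a` and `state_b` are SimStates of the same type:
>>> combined = concatenate_states([state_a, state_b])
>>> combined.n_systems == state_a.n_systems + state_b.n_systems
True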
"""
if not states:
raise ValueError("Cannot concatenate an empty list of states")
# Get the first state to determine properties
first_state = states[0]
# Ensure all states are of the same class
state_class = type(first_state)
if not all(isinstance(state, state_class) for state in states):
raise TypeError("All states must be of the same type")
# Use the target device or default to the first state's device
target_device = device or first_state.device
# Initialize result with global properties from first state
concatenated = dict(get_attrs_for_scope(first_state, "global"))
# Pre-allocate lists for tensors to concatenate
per_atom_tensors = defaultdict(list)
per_system_tensors = defaultdict(list)
new_system_indices = []
system_offset = 0
# Process all states in a single pass
for state in states:
# Move state to target device if needed
if state.device != target_device:
state = state_to_device(state, target_device)
# Collect per-atom properties
for prop, val in get_attrs_for_scope(state, "per-atom"):
if prop == "system_idx":
# skip system_idx, it will be handled below
continue
per_atom_tensors[prop].append(val)
# Collect per-system properties
for prop, val in get_attrs_for_scope(state, "per-system"):
per_system_tensors[prop].append(val)
# Update system indices
num_systems = state.n_systems
new_indices = state.system_idx + system_offset
new_system_indices.append(new_indices)
system_offset += num_systems
# Concatenate collected tensors
for prop, tensors in per_atom_tensors.items():
concatenated[prop] = torch.cat(tensors, dim=0)
for prop, tensors in per_system_tensors.items():
concatenated[prop] = torch.cat(tensors, dim=0)
# Concatenate system indices
concatenated["system_idx"] = torch.cat(new_system_indices)
# Create a new instance of the same class
return state_class(**concatenated)
def initialize_state(
system: StateLike,
device: torch.device,
dtype: torch.dtype,
) -> SimState:
"""Initialize state tensors from a atomistic system representation.
Converts various atomistic system representations (ASE Atoms, pymatgen Structure,
PhonopyAtoms, or existing SimState) to a SimState object.
Args:
system (StateLike): Input system to convert to state tensors
device (torch.device): Device to create tensors on
dtype (torch.dtype): Data type for tensor values
Returns:
SimState: State representation initialized from input system
Raises:
ValueError: If system type is not supported or if list items have inconsistent
types
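Examples:
A sketch, assuming `ase_atoms_1` and `ase_atoms_2` are ASE Atoms objects:
>>> state = initialize_state([ase_atoms_1, ase_atoms_2], device, dtype)
>>> state.n_systems
2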
"""
# TODO: create a way to pass velocities from pmg and ase
if isinstance(system, SimState):
return state_to_device(system, device, dtype)
if isinstance(system, list) and all(isinstance(s, SimState) for s in system):
if not all(cast("SimState", state).n_systems == 1 for state in system):
raise ValueError(
"When providing a list of states to the initialize_state function, "
"all states must have n_systems == 1. To fix this, you can split "
"multi-system states into individual states with their split method."
)
return concatenate_states(system)
converters = [
("pymatgen.core", "Structure", ts.io.structures_to_state),
("ase", "Atoms", ts.io.atoms_to_state),
("phonopy.structure.atoms", "PhonopyAtoms", ts.io.phonopy_to_state),
]
# Try each converter
for module_path, class_name, converter_func in converters:
try:
module = importlib.import_module(module_path)
cls = getattr(module, class_name)
if isinstance(system, cls) or (
isinstance(system, list) and all(isinstance(s, cls) for s in system)
):
return converter_func(system, device, dtype)
except ImportError:
continue
# remaining code just for informative error
is_list = isinstance(system, list)
all_same_type = (
is_list and bool(system) and all(isinstance(s, type(system[0])) for s in system)
)
if is_list and not all_same_type:
found_types = ", ".join(sorted({type(s).__name__ for s in system}))
raise ValueError(
f"All items in list must be of the same type, found {found_types}"
)
system_type = f"list[{type(system[0])}]" if is_list else type(system)
raise ValueError(f"Unsupported system type, {system_type}")