Source code for pisces.models.core.base

"""Base model abstraction for Pisces HDF5-backed physical models.

This module defines the :class:`BaseModel`, a foundational abstraction for all
Pisces-compatible models that are stored and accessed via HDF5 files. It provides
a unified interface for loading, saving, introspecting, and interacting with model
components. For more details on the Pisces model format and conventions, see :ref:`models_overview`.
"""

import datetime
from abc import ABC
from pathlib import Path
from typing import TYPE_CHECKING, Any, Union

import h5py
import numpy as np
from unyt import Unit, unyt_array

from pisces._generic import RegistryMeta
from pisces._registries import __default_model_registry__
from pisces.geometry.grids.utils import load_grid_from_hdf5_group
from pisces.profiles.base import BaseProfile
from pisces.utilities.io_tools import HDF5Serializer
from pisces.utilities.log import LogDescriptor

from .hooks import _HookTools
from .utils import ModelConfig

if TYPE_CHECKING:
    from logging import Logger

    from pisces._generic import Registry
    from pisces.geometry.coordinates.base import CoordinateSystem
    from pisces.geometry.grids.base import Grid



[docs]
class BaseModel(_HookTools, ABC, metaclass=RegistryMeta):
    """Abstract base class for Pisces-compatible physical models.

    The :class:`BaseModel` defines the foundational logic and storage conventions for
    HDF5-backed physical models used throughout the Pisces framework. It provides
    a consistent interface for:

    - Loading and validating model files
    - Accessing physical fields, analytic profiles, and metadata
    - Saving models from in-memory components
    - Subclass extension via hooks and typed configuration

    Model Structure
    ---------------
    Pisces models are stored as structured HDF5 files with the following layout:

    .. code-block:: text

        /
        ├── FIELDS/        # Physical field arrays (e.g., density, temperature)
        ├── PROFILES/      # Serialized analytic profile definitions
        ├── GRID/          # The spatial grid for the model.
        └── attrs/         # Model metadata and identity tags

    Each subclass is expected to match this layout and may define additional groups
    or attributes as needed. At minimum, each model must store its `__model_class__`
    identifier at the root to verify identity during loading.

    Access Patterns
    ---------------
    This class supports dictionary-like access and assignment:

    .. code-block:: python

        model["density"]  # returns field array
        model["temperature"]  # returns profile object
        model["description"]  # returns metadata string

        "pressure" in model  # checks all three namespaces
        model["mass"] = new_arr  # updates field

    Subclassing Guidelines
    ----------------------
    To implement a new model type:

    1. Subclass `BaseModel` and define the appropriate sampling or analysis methods.
    2. Optionally override `__post_init__()` to customize setup after loading.
    3. Optionally override `_construct_model_file_skeleton()` to define a custom layout.
    4. Register the model in your configuration under `[models.MyModelClass]`.
    """

    # ----------------------- #
    # Class Flags             #
    # ----------------------- #
    __IS_ABSTRACT__: bool = True
    __DEFAULT_REGISTRY__: "Registry" = __default_model_registry__

    # ------------------------ #
    # Class Variables          #
    # ------------------------ #
    logger: "Logger" = LogDescriptor(mode="models")
    """
    Logger interface for this model.

    This logger provides structured logging functionality specific to the model's
    operation within the Pisces framework. It captures status updates, warnings,
    debug information, and other messages emitted during model construction,
    file I/O, sampling, or analysis.

    Use this logger for:

    - Reporting progress or diagnostics in custom model methods
    - Emitting debug messages during development or profile tuning
    - Logging warnings for missing data, invalid configuration, etc.

    Access the logger via:

    .. code-block:: python

        self.logger.info("Loaded profile '%s'", name)
        self.logger.warning("Missing metadata for '%s'", key)

    The logger is registered under the ``models`` subsystem. You can configure
    its behavior (e.g., log level or format) by editing the ``[logging.models]``
    section in your Pisces configuration file.
    """
    config: dict = ModelConfig()
    """
    Model-specific configuration settings.

    This dictionary provides access to optional, model-scoped settings defined
    in the Pisces configuration system. Each model class can retrieve its default
    parameters from the global config file under the section:

    .. code-block:: yaml

        models:
          MyGalaxyClusterModel:
            sampling_resolution: 1000
            enable_logging: true

    Access the config like a normal dictionary:

    .. code-block:: python

        resolution = self.config.get("sampling_resolution", 1000)
        enable_logging = self.config.get("log_fields", True)

    This allows you to customize model behavior without hardcoding values into
    your Python code. If the model class is not registered in the config file,
    accessing `self.config` will raise an error with guidance.
    """
    metadata_serializer: HDF5Serializer = HDF5Serializer
    """~pisces.utilities.io.HDF5Serializer: Serializer for model metadata.

    This serializer is used to convert complex Python objects (like `unyt` arrays,
    quantities, and custom types) into JSON-compatible formats that can be stored
    as attributes in HDF5 files. It provides methods for serializing and deserializing
    model metadata, ensuring that all necessary information can be preserved and
    reconstructed when loading models.

    The serializer for a particular model can be customized by subclassing
    `HDF5Serializer` and overriding the `metadata_serializer` property in your model
    class. This allows you to define custom serialization logic for any additional
    types or structures you need to store in the model's metadata.
    """

    # ========================================= #
    # Initialization and Configuration          #
    # ========================================= #
    def __read_fields__(self) -> dict[str, unyt_array | np.ndarray]:
        """Load the physical fields from the Pisces model file.

        This method reads all physical fields stored in the model file and returns
        them as a dictionary mapping field names to arrays (with or without units).
        It is intended for internal use during model loading and assumes compliance
        with Pisces model HDF5 layout conventions.

        Pisces Format Standard
        ----------------------
        Pisces models store all field data under the `/FIELDS` group of the HDF5 file.
        Each field is saved as an individual HDF5 dataset with the following conventions:

        - **Dataset Name**: The name of the dataset should match the field name (e.g., "density").
        - **Units Attribute** (optional): If present, the dataset must define a `UNITS` attribute
          as a string parsable by `unyt.Unit`. If no units are found, the field is treated
          as unitless.

        Field arrays **must** have a shape exactly matching the model's spatial grid shape,
        unless explicitly documented as a scalar field or a reduced representation.

        Developer Guidance
        ------------------
        When implementing or modifying this method for a custom subclass:

        - Validate that `/FIELDS` exists before attempting to access datasets.
        - For each dataset:
            * Extract the raw data using slicing (`[...]`).
            * Check for a `units` attribute and apply it using `unyt_array(...)`.
            * Validate the array shape against `self.__grid__.shape`.
        - Store each field under its corresponding name in a `dict`.

        Shape Validation
        ----------------
        This method enforces that all field arrays have shapes matching the model grid.
        If a mismatch is detected, a `ValueError` is raised to prevent inconsistent data loads.

        Returns
        -------
        dict of str, unyt_array or ndarray
            A dictionary containing all loaded field arrays, indexed by field name.

        Raises
        ------
        ValueError
            If a field's shape does not match the grid shape.

        Examples
        --------
        .. code-block:: text

            /FIELDS
                ├── density       [shape: (128,), units: "Msun/kpc**3"]
                ├── temperature   [shape: (128,), units: "keV"]
                └── pressure      [shape: (128,), units: "dyne/cm**2"]

        .. code-block:: python

            {
                "density": unyt_array([...], "Msun/kpc**3"),
                "temperature": unyt_array([...], "keV"),
                "pressure": unyt_array([...], "dyne/cm**2"),
            }

        """
        # Generate a fields dictionary to hold the fields that we load. This
        # is what will be returned at the end of the method.
        fields = {}

        # Check that the FIELDS group exists. If it does not, we log a warning
        # and return an empty dictionary.
        if "FIELDS" not in self.__handle__:
            self.logger.warning("No `FIELDS` group found in model file '%s'.", self.__path__)
            return fields

        # Require that the grid is already loaded for shape checking. This is
        # somewhat redundant, but subclasses might screw up the ordering.
        if not hasattr(self, "__grid__"):
            raise RuntimeError(
                "Grid must be loaded before reading fields to perform shape validation.\n"
                "This error likely indicates that this subclass is loading the fields before the grid..."
            )
        expected_shape = self.__grid__.shape

        for field_name, field_data in self.__handle__["FIELDS"].items():
            # Perform the check on the shape. We require that the
            # leading shape of the dataset matches the grid shape, but
            # the trailing shape can be anything (e.g., for vector fields).
            field_shape = field_data.shape
            field_ndim = field_data.ndim

            if len(field_shape) < len(expected_shape):
                raise ValueError(f"Field `{field_name}` has dimension {field_ndim}, but grid has larger dimension.")
            if field_shape[: len(expected_shape)] != expected_shape:
                raise ValueError(
                    f"Field '{field_name}' has leading shape {field_shape[: len(expected_shape)]}, "
                    f"expected {expected_shape} to match grid."
                )

            # The shape check has passed. Now we can just load the data.
            units = field_data.attrs.get("units", None)

            # Convert to unyt_array if units are present
            if units is None:
                arr = np.array(field_data[...])
            else:
                arr = unyt_array(field_data[...], units)

            # Validate shape
            if arr.shape != expected_shape:
                self.logger.error(
                    "Field '%s' has shape %s but expected grid shape %s.",
                    field_name,
                    arr.shape,
                    expected_shape,
                )
                raise ValueError(
                    f"Field '{field_name}' has shape {arr.shape}, expected {expected_shape} to match grid."
                )

            fields[field_name] = arr
            self.logger.debug("Loaded field: '%s'. Units=%s", field_name, str(units))

        return fields

    def __read_metadata__(self) -> dict[str, Any]:
        """Load model metadata from the root-level attributes of the Pisces HDF5 model file.

        This method extracts metadata stored in the root-level attributes (`attrs`) of
        the HDF5 file and returns it as a dictionary. These metadata values serve as
        persistent identifiers, descriptive tags, or build-time diagnostics that are
        relevant to the model as a whole.

        Pisces Format Standard
        ----------------------
        Metadata in Pisces models is stored at the **file root level** as plain attributes.
        Each entry should be a simple key-value pair compatible with HDF5 attribute types,
        such as:

        - Strings (e.g., `"description"`, `"author"`)
        - Numbers (int, float)
        - Dates or timestamps (typically stored as ISO strings)
        - Small arrays (e.g., version tags or configuration flags)

        Required Keys (by Convention)
        -----------------------------
        While not strictly enforced, Pisces models generally include:

        - `"__model_class__"` : Name of the class that generated the model.
        - `"date_created"` : ISO timestamp of model file creation.
        - `"source"` : Optional tag indicating model origin or provenance.
        - `"description"` : Optional summary of the model contents.

        These values are typically injected at model export time (e.g., via `from_components()`).

        Developer Guidance
        ------------------
        When extending this method or modifying metadata formats:

        - Avoid parsing or interpreting values at load time—just read and return raw values.
        - Do not hardcode expected keys unless your subclass guarantees them.
        - If the file lacks metadata entirely, this method should return an empty dictionary.

        Logging
        -------
        This method is intentionally silent (no logging), since absence of metadata
        may be normal in some intermediate outputs or synthetic models.

        Returns
        -------
        A dictionary of all root-level metadata attributes stored in the model file.

        Example Layout
        --------------
        .. code-block:: text

            /
            ├── FIELDS/
            ├── PROFILES/
            └── attrs:
                ├── "__model_class__" = "SphericalGalaxyClusterModel"
                ├── "date_created"    = "2025-07-24T15:31:10.103Z"
                ├── "description"     = "Hydrostatic mass test model."
                └── "source"          = "test_suite"

        This results in:

        .. code-block:: python

            {
                "__model_class__": "SphericalGalaxyClusterModel",
                "date_created": "2025-07-24T15:31:10.103Z",
                "description": "Hydrostatic mass test model.",
                "source": "test_suite",
            }

        """
        return self.__class__.metadata_serializer.deserialize_dict(dict(self.__handle__.attrs))

    def __read_profiles__(self) -> dict[str, "BaseProfile"]:
        """Load all analytic profiles from the `/PROFILES` group of the model file.

        This method reads all stored analytic profiles in the Pisces model file
        and reconstructs them using the standardized class method
        :meth:`BaseProfile.from_hdf5`. Each profile is loaded into memory and
        returned as part of a dictionary keyed by its group name.

        Pisces Format Standard
        ----------------------
        Analytic profiles are stored in a dedicated group at `/PROFILES` in the HDF5 model.
        Each profile is represented as a subgroup under `/PROFILES`, where:

        - The **key** is the profile name (e.g., `"density"`, `"temperature"`).
        - The **value** is an HDF5 group containing serialized data and metadata
          as required by the corresponding `BaseProfile` subclass.

        The structure and interpretation of each profile group is delegated to the
        :meth:`BaseProfile.from_hdf5` loader, which must be implemented for all
        profile subclasses.

        Example Structure
        -----------------
        .. code-block:: text

            /
            ├── FIELDS/
            ├── PROFILES/
            │   ├── density/
            │   │   ├── parameters
            │   │   ├── metadata
            │   ├── temperature/
            │   │   ├── parameters
            │   │   ├── metadata
            └── attrs/

        The resulting dictionary will contain:

        .. code-block:: python

            {
                "density": <SphericalNFWProfile(...)>,
                "temperature": <VikhlininProfile(...)>,
            }

        Developer Notes
        ---------------
        - This method is silent if the `/PROFILES` group is missing, but logs a warning.
        - If subclassed, developers may override this method to implement custom
          logic for filtering or categorizing profiles.
        - If profiles are optional for a given model class, ensure your code gracefully
          handles an empty return.

        Logging
        -------
        - Each loaded profile logs a DEBUG-level message with its name.
        - Missing `/PROFILES` group triggers a WARNING message.

        Returns
        -------
        dict of str -> BaseProfile
            Dictionary of profile names to fully instantiated profile objects.

        """
        profiles = {}
        if "PROFILES" in self.__handle__:
            for profile_name, profile_data in self.__handle__["PROFILES"].items():
                profiles[profile_name] = BaseProfile.from_hdf5(profile_data, profile_name)
                self.logger.debug("Loaded profile: '%s'.", profile_name)
        else:
            self.logger.warning("No `PROFILES` group found in model file '%s'.", self.__path__)

        return profiles

    def __read_grid__(self, registry: "Registry" = None) -> "Grid":
        """Load the spatial grid from the `/GRID` group of the Pisces model file.

        This method reads the spatial grid stored in the model's HDF5 file and
        reconstructs it using :func:`pisces.geometry.grids.utils.load_grid_from_hdf5_group`.

        Pisces Format Standard
        ----------------------
        The model's spatial grid is stored under the `/GRID` group in the HDF5 file.
        This group contains the serialized representation of a :class:`~pisces.geometry.grids.base.Grid`
        object.

        The :func:`~pisces.geometry.grids.utils.load_grid_from_hdf5_group` function
        handles the deserialization and instantiation of the appropriate grid subclass.

        Parameters
        ----------
        registry : Registry, optional
            Optional class registry used to look up the correct grid subclass when
            deserializing. If ``None``, the default Pisces registry will be used.

        Returns
        -------
        Grid
            A fully instantiated :class:`~pisces.geometry.grids.base.Grid` object.

        Raises
        ------
        ValueError
            If the `/GRID` group is missing from the model file.
        RuntimeError
            If an error occurs during grid deserialization.
        """
        # Ensure that the grid is present in the HDF5 file. If it
        # is not, then we cannot proceed.
        if "GRID" not in self.__handle__:
            raise ValueError(f"No `GRID` group found in model file '{self.__path__}'.")

        # Attempt to load the grid and raise an error if we fail.
        try:
            grid = load_grid_from_hdf5_group(self.__handle__["GRID"], registry=registry)
            self.logger.debug("Loaded grid from model file '%s'.", self.__path__)
        except Exception as exp:
            raise RuntimeError(f"Failed to load model grid due to an error: {exp}") from exp

        # Pass it back to become an attribute.
        return grid


[docs]
    def __init__(self, filepath: str | Path, *args, **kwargs):
        """Load a Pisces model from an existing HDF5 file.

        This loads the model from disk, verifies that the file matches the expected
        model class, and reads its core components:

        - Metadata (from root attributes)
        - Analytical profiles (from ``/PROFILES``)
        - The spatial grid (from ``/GRID``)
        - Physical field data (from ``/FIELDS``)

        Subclasses may extend loading behavior by overriding :meth:`__post_init__` or
        modifying the ``__init__`` method directly.

        Parameters
        ----------
        filepath : str or Path
            Path to the existing HDF5 model file.
        *args, **kwargs :
            Optional arguments forwarded to :meth:`__post_init__`.

        Raises
        ------
        FileNotFoundError
            If the specified file does not exist.
        TypeError
            If the file does not belong to this model class.

        """
        # Configure the path, ensure it is a Path object,
        # and then check that it exists before opening it.
        self.__path__ = Path(filepath)

        if not self.__path__.exists():
            raise FileNotFoundError(f"File {self.__path__} does not exist.")

        self.__handle__ = h5py.File(self.__path__, mode="r+")

        # Verify that the file was generated by this model class. This
        # ensures that we cannot open a model with the wrong model class.
        model_tag = self.metadata_serializer.deserialize_data(self.__handle__.attrs.get("__model_class__", None))
        if model_tag != self.__class__.__name__:
            raise TypeError(
                f"File {self.__path__} is not a valid model of type {self.__class__.__name__} (found tag: {model_tag})."
            )

        # --- Data Loading --- #
        # This is the meaty bit of the loading process. We read
        # the metadata, profiles, and fields before passing off to
        # the post init hook. Subclasses may override any or all of
        # these methods to customize the loading process.
        self.__metadata__: dict[str, Any] = self.__read_metadata__()
        self.__profiles__: dict[str, BaseProfile] = self.__read_profiles__()
        self.__grid__: Grid = self.__read_grid__(registry=kwargs.pop("registry", None))
        self.__fields__: dict[str, unyt_array] = self.__read_fields__()

        # Allow subclass extensions
        self.__post_init__(*args, **kwargs)

        # Log model load
        self.logger.info(
            "Loaded model from '%s' [%s]: %d fields, %d profiles, %d metadata entries, grid shape=%s.",
            str(self.__path__),
            self.__class__.__name__,
            len(self.__fields__),
            len(self.__profiles__),
            len(self.__metadata__),
            self.__grid__.shape,
        )


    def __post_init__(self, *args, **kwargs):
        """Add additional structure to subclass initialization.

        This method is automatically called at the end of `__init__()`.
        Subclasses may override it to perform additional setup or data processing
        without rewriting the entire constructor.

        Parameters
        ----------
        *args, **kwargs :
            Arbitrary arguments forwarded from the constructor.

        Examples
        --------
        .. code-block:: python

            class MyModel(BaseModel):
                def __post_init__(self):
                    self.mass_field = self.__fields__["mass"]
                    self.density_profile = self.__profiles__[
                        "density"
                    ]

        """
        pass

    # ========================================= #
    # Model Generator Methods                   #
    # ========================================= #
    # These methods are the generator methods for the model. They
    # should take some set of inputs (whatever is needed for the model)
    # and yield a resulting model.
    @classmethod
    def _construct_model_file_skeleton(cls, filepath: str | Path, overwrite: bool = False) -> Path:
        """Create an empty HDF5 file with the necessary structure for a model.

        This method should be called before any data is written to the file.
        It sets up the basic structure of the HDF5 file, including groups for
        fields and profiles.

        Parameters
        ----------
        filepath : str or Path
            The path to the HDF5 file to create.
        overwrite : bool, optional
            Whether to overwrite the file if it already exists (default: False).

        """
        # Ensure that the filepath is a valid path object and
        # then handle issues with overwriting existing files.
        filepath = Path(filepath)
        if filepath.exists() and not overwrite:
            raise FileExistsError(f"File {filepath} already exists. Use 'overwrite=True' to overwrite it.")

        # Open the HDF5 file in write mode and start managing the
        # relevant structure. This can be overwritten in subclasses as
        # needed to add additional structure. By default, we simply
        # create the FIELDS and PROFILES groups, which are the
        # two main components of the model. We then add the class
        # name as an attribute on the file to ensure that we can
        # identify the model type later on.
        with h5py.File(filepath, mode="w") as handle:
            handle.create_group("FIELDS")
            handle.create_group("PROFILES")
            handle.create_group("GRID")

            # Add the class name as an attribute on the file.
            handle.attrs["__model_class__"] = cls.__name__

            # Add any other necessary groups or attributes here.

        return filepath


[docs]
    @classmethod
    def from_components(
        cls,
        filepath: str | Path,
        grid: "Grid",
        fields: dict[str, unyt_array | np.ndarray],
        profiles: dict[str, "BaseProfile"],
        metadata: dict[str, Any],
        overwrite: bool = False,
    ) -> "BaseModel":
        """Create and save a Pisces model from in-memory components.

        This method assembles a fully specified model from its constituent parts—
        spatial grid, physical fields, analytic profiles, and metadata—and writes
        it to disk in Pisces HDF5 format. The resulting file can be loaded
        directly using the class constructor.

        The output file will follow the standard Pisces model layout:

        .. code-block:: text

            /
            ├── FIELDS/        # Physical field arrays (e.g., density, temperature)
            ├── PROFILES/      # Serialized analytic profile definitions
            ├── GRID/          # Serialized spatial grid object
            └── attrs/         # Model metadata and identity tags

        Parameters
        ----------
        filepath : str or Path
            Path to the output HDF5 model file. If the file already exists and
            ``overwrite`` is False, a :class:`FileExistsError` will be raised.

        grid : ~pisces.geometry.grids.base.Grid
            The spatial grid defining the model's geometry. This object must be a
            subclass of :class:`~pisces.geometry.grids.base.Grid` and will be
            serialized to the ``/GRID`` group via its
            :meth:`~pisces.geometry.grids.base.Grid._save_grid_to_hdf5_group` method.

        fields : dict of str, (unyt_array or numpy.ndarray)
            Dictionary mapping field names to their corresponding arrays.

            - **Keys**: Field names (e.g., ``"density"`` or ``"temperature"``)
            - **Values**: Either a :class:`unyt.array.unyt_array` with units or a plain
              :class:`numpy.ndarray` for unitless data.

            Each array's leading shape must exactly match ``grid.shape``; additional
            trailing dimensions (e.g., for vector/tensor components) are allowed.

        profiles : dict of str -> BaseProfile
            Dictionary mapping profile names to fully instantiated analytic profile
            objects. Each profile must implement
            :meth:`~pisces.profiles.base.BaseProfile.to_hdf5` for serialization.

        metadata : dict
            Dictionary of model metadata to store as root-level attributes in the
            HDF5 file. This can include descriptive information, provenance tags,
            and other auxiliary data. The following keys are generally recommended:

            - ``"description"``: Short summary of the model
            - ``"source"``: Origin or generating process
            - ``"date_created"``: Will be set automatically if not provided
            - ``"__model_class__"``: Will be set automatically to match ``cls.__name__``

        overwrite : bool, optional
            Whether to overwrite an existing file at ``filepath``. Defaults to
            ``False``. If set to ``True``, any existing file will be replaced.

        Returns
        -------
        BaseModel
            An instance of the model loaded from the saved file.

        """
        # Construct a model skeleton at the required filepath so
        # that the file exists and has the right structure.
        filepath = cls._construct_model_file_skeleton(filepath, overwrite=overwrite)

        # Insert the relevant required metadata into the metadata dictionary.
        # From there, we just serialize the metadata dictionary and write it to
        # disk.
        metadata["date_created"] = datetime.datetime.now().isoformat()
        metadata["__model_class__"] = cls.__name__
        metadata = cls.metadata_serializer.serialize_dict(metadata)

        # Save the grid to disk using the .to_hdf5 method. This is
        # abstracted down to the grid to allow saving consistently.
        try:
            grid.to_hdf5(filepath, group="GRID", overwrite=True)
        except Exception as exp:
            raise RuntimeError(f"Failed to save grid to model file due to an error: {exp}") from exp

        # Now write all of the relevant data to disk vis-a-vis the HDF5 file.
        with h5py.File(filepath, "r+") as f:
            # Store metadata in root attributes
            for key, val in metadata.items():
                f.attrs[key] = val

            # Write fields and verify shapes.
            field_group = f["FIELDS"]
            for name, arr in fields.items():
                # Start by verifying that the array shape matches the grid shape.
                expected_shape = grid.shape
                expected_ndim = len(expected_shape)
                arr_shape = arr.shape
                arr_ndim = arr.ndim

                if arr_ndim < expected_ndim:
                    raise ValueError(
                        f"Field '{name}' has dimension {arr_ndim}, but grid has larger dimension {expected_ndim}."
                    )
                if arr_shape[:expected_ndim] != expected_shape:
                    raise ValueError(
                        f"Field '{name}' has leading shape {arr_shape[:expected_ndim]}, "
                        f"expected {expected_shape} to match grid."
                    )

                # The consistency checks have passed. Now we can write the data.
                data = arr.to_base().value if hasattr(arr, "to_base") else np.asarray(arr)
                dset = field_group.create_dataset(name, data=data)
                if hasattr(arr, "units"):
                    dset.attrs["units"] = str(arr.units)

            # Write profiles
            profile_group = f["PROFILES"]
            for name, profile in profiles.items():
                subgrp = profile_group.create_group(name)
                profile.to_hdf5(subgrp, name)

        return cls(filepath)


    # ========================================= #
    # Dunder Methods                            #
    # ========================================= #
    def __str__(self):
        """Return a readable string representation of the model."""
        return f"<{self.__class__.__name__} @ {self.__path__}>"

    def __repr__(self):
        """Return the default representation of the model."""
        return super().__repr__()

    def __del__(self):
        """Ensure that the HDF5 file handle is closed when the model is deleted."""
        handle = getattr(self, "__handle__", None)
        if handle is not None and handle.id.valid:
            handle.close()

    def __getitem__(self, item):
        """Allow for dictionary-like access to the model's fields."""
        if item in self.__fields__:
            return self.__fields__[item]
        if item in self.__grid__.active_axes:
            return self.__grid__.get_axis_array(axis=item)
        else:
            raise KeyError(f"Item '{item}' not found in model.")

    def __setitem__(self, key: str, value: Any):
        """Allow for dictionary-like setting of the model's fields."""
        if key in self.__fields__:
            self.__fields__[key] = value
        if key in self.__grid__.active_axes:
            raise KeyError(f"Cannot set grid axis '{key}' directly. Modify the grid object instead.")
        else:
            raise KeyError(f"Item '{key}' not found in model.")

    def __contains__(self, key):
        """Check if a key exists in the fields, profiles, or metadata."""
        return key in self.__fields__

    def __len__(self):
        """Return the number of physical fields in the model."""
        return len(self.__fields__)

    def __iter__(self):
        """Iterate over the field names in the model."""
        return iter(self.__fields__)

    # ========================================= #
    # Properties                                #
    # ========================================= #
    @property
    def path(self) -> Path:
        """The path to the model's HDF5 file."""
        return self.__path__

    @property
    def handle(self) -> h5py.File:
        """The open HDF5 file handle."""
        return self.__handle__

    @property
    def metadata(self) -> dict[str, Any]:
        """Model metadata dictionary."""
        return self.__metadata__

    @property
    def profiles(self) -> dict[str, "BaseProfile"]:
        """Model profile objects."""
        return self.__profiles__

    @property
    def fields(self) -> dict[str, unyt_array | np.ndarray]:
        """Model field buffers."""
        return self.__fields__

    @property
    def grid(self) -> "Grid":
        """The spatial grid of the model."""
        return self.__grid__

    @property
    def coordinate_system(self) -> "CoordinateSystem":
        """The coordinate system of the model's grid."""
        return self.__grid__.coordinate_system

    @property
    def active_grid_axes(self) -> list[str]:
        """List of active axes in the model's grid."""
        return self.__grid__.active_axes

    # ========================================= #
    # Modification Methods: Fields              #
    # ========================================= #
    # These methods provide a safe and consistent interface for
    # retrieving, adding, modifying, copying, and removing fields.


[docs]
    def get_field(self, name: str) -> unyt_array | np.ndarray:
        """Retrieve a physical field by name.

        Parameters
        ----------
        name : str
            The name of the field to retrieve.

        Returns
        -------
        unyt_array or numpy.ndarray
            The requested field as a :class:`unyt_array` with units,
            or a plain :class:`numpy.ndarray` if unitless.

        Raises
        ------
        KeyError
            If the field does not exist in the model.
        """
        if name not in self.__fields__:
            raise KeyError(f"Field '{name}' not found in model.")
        return self.__fields__[name]



[docs]
    def add_field(
        self,
        name: str,
        element_shape: tuple[int, ...] = (),
        units: Union[str, Unit] = None,
        data: unyt_array | np.ndarray = None,
        overwrite: bool = False,
        **kwargs,
    ):
        """Add a new physical field to the model.

        Fields represent physical quantities (e.g., density, temperature, velocity)
        defined on the model’s spatial grid. This method creates a new field with
        optional initialization from user-provided data.

        Parameters
        ----------
        name : str
            Name of the field (e.g., ``"density"``).
        element_shape : tuple of int, optional
            Extra trailing dimensions for vector/tensor fields (e.g., ``(3,)``).
            Defaults to ``()``.
        units : str or unyt.Unit, optional
            Units for the field. If ``None``, the field is unitless.
        data : unyt_array or numpy.ndarray, optional
            Values to initialize the field. If ``None``, initialized to zeros.
            Must have shape ``grid.shape + element_shape``.
        overwrite : bool, optional
            If ``True``, replaces an existing field with the same name. If ``False``,
            raises :class:`KeyError` if the field already exists.

        Raises
        ------
        ValueError
            If provided data does not match the expected shape.
        KeyError
            If the field already exists and ``overwrite=False``.

        Notes
        -----
        - The field is written to both memory and the on-disk HDF5 file under
          ``/FIELDS/{name}``.
        - Unit handling is powered by :mod:`unyt`.

        """
        expected_shape = self.__grid__.shape + element_shape

        # Initialize array
        if data is None:
            arr = np.zeros(expected_shape, dtype=kwargs.get("dtype", "f8"))
            arr = unyt_array(arr, units) if units is not None else arr
        else:
            if data.shape != expected_shape:
                raise ValueError(f"Field '{name}' has shape {data.shape}, expected {expected_shape}.")
            arr = unyt_array(data, units) if units is not None else unyt_array(data)

        # Handle overwrite logic
        if name in self.__fields__ and not overwrite:
            raise KeyError(f"Field '{name}' already exists. Use overwrite=True to replace it.")

        fields_group = self.__handle__["FIELDS"]
        if name in fields_group:
            if overwrite:
                del fields_group[name]
            else:
                raise KeyError(f"Field '{name}' already exists in file.")

        # Write dataset
        dset = fields_group.create_dataset(name, data=arr.d if hasattr(arr, "d") else np.asarray(arr))
        if hasattr(arr, "units"):
            dset.attrs["units"] = str(arr.units)

        # Reload cache
        self.__fields__ = self.__read_fields__()
        self.logger.info("Added field '%s' (shape=%s, units=%s).", name, expected_shape, units)



[docs]
    def remove_field(self, name: str):
        """Remove a physical field from the model.

        Deletes the field from both memory and the HDF5 file.

        Parameters
        ----------
        name : str
            Name of the field to remove.

        Raises
        ------
        KeyError
            If the field does not exist.
        """
        if name not in self.__fields__:
            raise KeyError(f"Field '{name}' not found in model.")

        del self.__handle__["FIELDS"][name]
        del self.__fields__[name]

        self.logger.info("Removed field '%s'.", name)



[docs]
    def list_fields(self) -> list[str]:
        """List all physical fields currently stored in the model.

        Returns
        -------
        list of str
            Field names available in the model.
        """
        return list(self.__fields__.keys())



[docs]
    def rename_field(self, old_name: str, new_name: str):
        """Rename an existing field in the model.

        Changes the field name in both memory and the HDF5 file.

        Parameters
        ----------
        old_name : str
            Current name of the field.
        new_name : str
            New name for the field.

        Raises
        ------
        KeyError
            If ``old_name`` does not exist or ``new_name`` already exists.
        """
        if old_name not in self.__fields__:
            raise KeyError(f"Field '{old_name}' not found in model.")
        if new_name in self.__fields__:
            raise KeyError(f"Field '{new_name}' already exists.")

        self.__handle__["FIELDS"].move(old_name, new_name)
        self.__fields__ = self.__read_fields__()

        self.logger.info("Renamed field '%s' → '%s'.", old_name, new_name)



[docs]
    def copy_field(self, old_name: str, new_name: str):
        """Create a duplicate of an existing field under a new name.

        Parameters
        ----------
        old_name : str
            Name of the existing field.
        new_name : str
            Name for the copied field.

        Raises
        ------
        KeyError
            If ``old_name`` does not exist or ``new_name`` already exists.
        """
        if old_name not in self.__fields__:
            raise KeyError(f"Field '{old_name}' not found in model.")
        if new_name in self.__fields__:
            raise KeyError(f"Field '{new_name}' already exists in model.")

        self.__handle__["FIELDS"].copy(old_name, new_name)
        self.__fields__ = self.__read_fields__()

        self.logger.info("Copied field '%s' → '%s'.", old_name, new_name)


    # ========================================= #
    # Modification Methods: Profiles            #
    # ========================================= #
    # These methods provide a safe and consistent interface for
    # retrieving, adding, modifying, copying, and removing profiles.


[docs]
    def get_profile(self, name: str) -> "BaseProfile":
        """Retrieve an analytic profile by name.

        Parameters
        ----------
        name : str
            The name of the profile to retrieve.

        Returns
        -------
        BaseProfile
            The requested profile object.

        Raises
        ------
        KeyError
            If the profile does not exist in the model.
        """
        if name not in self.__profiles__:
            raise KeyError(f"Profile '{name}' not found in model.")
        return self.__profiles__[name]



[docs]
    def add_profile(
        self,
        name: str,
        profile: "BaseProfile",
        overwrite: bool = False,
    ):
        """Add a new analytic profile to the model.

        Profiles represent analytic functions (e.g., NFW, Vikhlinin) that can
        generate fields or describe physical quantities. This method saves the
        profile in both memory and the on-disk HDF5 file.

        Parameters
        ----------
        name : str
            Name of the profile (e.g., ``"density"``).
        profile : BaseProfile
            An instance of a subclass of :class:`BaseProfile`.
        overwrite : bool, optional
            If ``True``, replaces an existing profile with the same name.
            Defaults to ``False``.

        Raises
        ------
        KeyError
            If the profile already exists and ``overwrite=False``.
        """
        if name in self.__profiles__ and not overwrite:
            raise KeyError(f"Profile '{name}' already exists. Use overwrite=True to replace it.")

        profiles_group = self.__handle__["PROFILES"]
        if name in profiles_group:
            if overwrite:
                del profiles_group[name]
            else:
                raise KeyError(f"Profile '{name}' already exists in file.")

        subgrp = profiles_group.create_group(name)
        profile.to_hdf5(subgrp, name)

        self.__profiles__ = self.__read_profiles__()
        self.logger.info("Added profile '%s'.", name)



[docs]
    def remove_profile(self, name: str):
        """Remove an analytic profile from the model.

        Deletes the profile from both memory and the HDF5 file.

        Parameters
        ----------
        name : str
            Name of the profile to remove.

        Raises
        ------
        KeyError
            If the profile does not exist.
        """
        if name not in self.__profiles__:
            raise KeyError(f"Profile '{name}' not found in model.")

        del self.__handle__["PROFILES"][name]
        del self.__profiles__[name]

        self.logger.info("Removed profile '%s'.", name)



[docs]
    def rename_profile(self, old_name: str, new_name: str):
        """Rename an existing profile in the model.

        Changes the profile name in both memory and the HDF5 file.

        Parameters
        ----------
        old_name : str
            Current name of the profile.
        new_name : str
            New name for the profile.

        Raises
        ------
        KeyError
            If ``old_name`` does not exist or ``new_name`` already exists.
        """
        if old_name not in self.__profiles__:
            raise KeyError(f"Profile '{old_name}' not found in model.")
        if new_name in self.__profiles__:
            raise KeyError(f"Profile '{new_name}' already exists.")

        self.__handle__["PROFILES"].move(old_name, new_name)
        self.__profiles__ = self.__read_profiles__()

        self.logger.info("Renamed profile '%s' → '%s'.", old_name, new_name)



[docs]
    def copy_profile(self, old_name: str, new_name: str):
        """Create a duplicate of an existing profile under a new name.

        Parameters
        ----------
        old_name : str
            Name of the existing profile.
        new_name : str
            Name for the copied profile.

        Raises
        ------
        KeyError
            If ``old_name`` does not exist or ``new_name`` already exists.
        """
        if old_name not in self.__profiles__:
            raise KeyError(f"Profile '{old_name}' not found in model.")
        if new_name in self.__profiles__:
            raise KeyError(f"Profile '{new_name}' already exists in model.")

        self.__handle__["PROFILES"].copy(old_name, new_name)
        self.__profiles__ = self.__read_profiles__()

        self.logger.info("Copied profile '%s' → '%s'.", old_name, new_name)



[docs]
    def list_profiles(self) -> list[str]:
        """List all analytic profiles currently stored in the model.

        Returns
        -------
        list of str
            Profile names available in the model.
        """
        return list(self.__profiles__.keys())