Source code for metatrain.utils.omegaconf

from typing import Any, Union

import torch
from omegaconf import DictConfig, ListConfig, OmegaConf
from omegaconf.basecontainer import BaseContainer

from metatrain.utils.hypers import init_with_defaults
from metatrain.utils.loss import LossParams, LossSpecification

from .. import RANDOM_SEED
from .architectures import import_architecture
from .devices import pick_devices


def _get_architecture_model(conf: BaseContainer) -> Any:
    architecture = import_architecture(conf["architecture"]["name"])
    return architecture.__model__



[docs]
def default_device(_root_: BaseContainer) -> str:
    """
    Custom OmegaConf resolver to find the default device of an architecture.

    Device is found using the :py:func:metatrain.utils.devices.pick_devices`
    function.

    :param _root_: The root configuration.
    :return: The default device as a string. If multiple devices are found, returns
        "multi-cuda".
    """

    Model = _get_architecture_model(_root_)
    desired_device = pick_devices(Model.__supported_devices__)

    if len(desired_device) > 1:
        return "multi-cuda"
    else:
        return desired_device[0].type




[docs]
def default_precision(_root_: BaseContainer) -> int:
    """
    Custom OmegaConf resolver to find the default precision of an architecture.

    File format is obtained based on the architecture name and its first entry in the
    ``supported_dtypes`` list.

    :param _root_: The root configuration.
    :return: The default precision in bits (16, 32, or 64).
    """

    Model = _get_architecture_model(_root_)

    # desired `dtype` is the first entry
    default_dtype = Model.__supported_dtypes__[0]

    # `base_precision` in options has to be a integer and not a torch.dtype
    if default_dtype in [torch.float64, torch.double]:
        return 64
    elif default_dtype == torch.float32:
        return 32
    elif default_dtype == torch.float16:
        return 16
    else:
        raise ValueError(
            f"architectures `default_dtype` ({default_dtype}) refers to an unknown "
            "torch dtype. This should not happen."
        )




[docs]
def default_huber_loss_delta() -> float:
    """
    Return the default delta for the huber loss.

    :return: The default delta for the huber loss.
    """
    return 1.0



# Register custom resolvers
OmegaConf.register_new_resolver("default_device", default_device)
OmegaConf.register_new_resolver("default_precision", default_precision)
OmegaConf.register_new_resolver("default_random_seed", lambda: RANDOM_SEED)


def _resolve_single_str(config: str) -> DictConfig:
    return OmegaConf.create({"read_from": config})


# Base options/configurations
BASE_OPTIONS = OmegaConf.create(
    {
        "device": "${default_device:}",
        "base_precision": "${default_precision:}",
        "seed": "${default_random_seed:}",
        "test_set": 0.0,
    }
)


CONF_SYSTEMS = OmegaConf.create(
    {
        "read_from": "${..read_from}",
        "reader": None,
        "length_unit": "",
    }
)

CONF_TARGET_FIELDS = OmegaConf.create(
    {
        "quantity": "energy",
        "read_from": "${...systems.read_from}",
        "reader": None,
        "key": None,
        "unit": "",
        "per_atom": False,
        "type": "scalar",
        "num_subtargets": 1,
        "description": "",
    }
)

CONF_EXTRA_FIELDS = OmegaConf.create(
    {
        "quantity": "",
        "read_from": "${...systems.read_from}",
        "reader": None,
        "key": None,
        "unit": "",
        "per_atom": False,
        "type": "scalar",
        "num_subtargets": 1,
        "description": "",
    }
)

CONF_GRADIENTS = OmegaConf.create({"forces": False, "stress": False, "virial": False})
CONF_GRADIENT = OmegaConf.create(
    {
        "read_from": "${..read_from}",
        "reader": None,
        "key": None,
    }
)

KNOWN_GRADIENTS = list(CONF_GRADIENTS.keys())

# Merge configs to get default configs for energies and other targets
CONF_TARGET = OmegaConf.merge(CONF_TARGET_FIELDS, CONF_GRADIENTS)
CONF_ENERGY = CONF_TARGET.copy()
CONF_ENERGY["forces"] = CONF_GRADIENT.copy()
CONF_ENERGY["stress"] = CONF_GRADIENT.copy()
CONF_EXTRA_DATA = CONF_EXTRA_FIELDS.copy()



[docs]
def check_dataset_options(dataset_config: ListConfig) -> None:
    """Perform consistency checks within one dataset config.

    This is useful if the dataset config is made of several datasets.

    - The function checks if ``length_units`` in each system section are known and the
       same.
    - For unknown quantities a warning is given.
    - If the names of the ``"targets"`` sections are the same between the elements of
       the list of datasets also the units must be the same.
    - Two targets with the names `{target}` and `mtt::{target}` are not allowed.

    :param dataset_config: A List of configuration to be checked. In the list contains
        only one element no checks are performed.
    :raises ValueError: If the units are not consistent between the dataset options or
        if two different targets have the `{target}` and `mtt::{target}` names.
    """
    desired_config = dataset_config[0]

    if hasattr(desired_config, "targets"):
        # save unit for each target seaction for later comparison
        unit_dict = {k: v["unit"] for k, v in desired_config["targets"].items()}
    else:
        unit_dict = {}

    if hasattr(desired_config, "systems"):
        desired_length_unit = desired_config["systems"]["length_unit"]
    else:
        desired_length_unit = None

    if hasattr(desired_config, "extra_data"):
        # save unit for each extra_data section for later comparison
        for extra_data_key, extra_data in desired_config["extra_data"].items():
            unit_dict[extra_data_key] = extra_data["unit"]

    # loop over ALL configs because we have check units for all elements in
    # `dataset_config`
    for actual_config in dataset_config:
        if desired_length_unit:
            # Perform consistency checks between config elements
            actual_length_unit = actual_config["systems"]["length_unit"]
            if actual_length_unit != desired_length_unit:
                raise ValueError(
                    "`length_unit`s are inconsistent between one of the dataset "
                    f"options. {actual_length_unit!r} != {desired_length_unit!r}."
                )

        if hasattr(actual_config, "targets"):
            for target_key, target in actual_config["targets"].items():
                unit = target["unit"]

                # If a target section name is not part of the saved units we add it for
                # later comparison. We do not have to start the loop again because this
                # target section name is not present in one of the datasets checked
                # before.
                if target_key not in unit_dict.keys():
                    unit_dict[target_key] = unit

                if unit_dict[target_key] != unit:
                    raise ValueError(
                        f"Units of target section {target_key!r} are inconsistent. "
                        f"Found {unit!r} and {unit_dict[target_key]!r}!"
                    )

        # `target` and `mtt::target` are not allowed to be present at the same time
        if hasattr(actual_config, "targets"):
            for target_key in actual_config["targets"].keys():
                if f"mtt::{target_key}" in actual_config["targets"].keys():
                    raise ValueError(
                        f"Two targets with the names `{target_key}` and "
                        f"`mtt::{target_key}` are not allowed to be present "
                        "at the same time."
                    )

        if hasattr(actual_config, "extra_data"):
            for extra_data_key, extra_data in actual_config["extra_data"].items():
                unit = extra_data["unit"]

                # If a extra_data section name is not part of the saved units we add it
                # for later comparison. We do not have to start the loop again because
                # this extra_data section name is not present in one of the datasets
                # checked before.
                if extra_data_key not in unit_dict.keys():
                    unit_dict[extra_data_key] = unit

                if unit_dict[extra_data_key] != unit:
                    raise ValueError(
                        f"Units of extra_data section {extra_data_key!r} are "
                        "inconsistent. "
                        f"Found {unit!r} and {unit_dict[extra_data_key]!r}!"
                    )




[docs]
def expand_dataset_config(conf: Union[str, DictConfig, ListConfig]) -> ListConfig:
    """Expands shorthand notations in a dataset configuration to its full format.

    This function takes a dataset configuration, either as a :py:class:str,
    :py:class:`omegaconf.DictConfig` or a :py:class:`omegaconf.ListConfig`, and expands
    it into a detailed configuration format. It processes systems, targets, and gradient
    sections, setting default values and inferring missing information. Unknown keys are
    ignored, allowing for flexibility.

    If the dataset configuration is either a :class:`str` or a
    :class:`omegaconf.DictConfig`

    The function performs the following steps for each config

    - Merges and interpolates the input configuration with the base configurations.
    - Expands shorthand notations like file paths or simple true/false settings to full
      dictionary systems. This includes setting the units to the base units of
      ``"angstrom"`` and ``"eV"``.
    - Handles special cases, such as the mandatory nature of the "energy" section for MD
      simulations and the mutual exclusivity of 'stress' and 'virial' sections.
      Additionally the gradient sections for "forces" are enables by default.

    :param conf: The dataset configuration, either as a file path string or a DictConfig
        object.
    :raises ValueError: If both ``virial`` and ``stress`` sections are enabled in the
        "energy" target, as this is not permissible for training.
    :return: List of datasets configurations. If ``conf`` was a :class:`str` or a
        :class:`omegaconf.DictConfig` the list contains only a single element.
    """
    # Expand str -> DictConfig
    if isinstance(conf, str):
        read_from = conf
        conf = OmegaConf.create(
            {"systems": read_from, "targets": {"energy": read_from}}
        )

    # Expand DictConfig -> ListConfig
    if isinstance(conf, DictConfig):
        conf = OmegaConf.create([conf])

    # Perform expansion per config inside the ListConfig
    for conf_element in conf:
        if hasattr(conf_element, "systems"):
            if type(conf_element["systems"]) is str:
                conf_element["systems"] = _resolve_single_str(conf_element["systems"])

            conf_element["systems"] = OmegaConf.merge(
                CONF_SYSTEMS, conf_element["systems"]
            )

        if hasattr(conf_element, "targets"):
            for target_key, target in conf_element["targets"].items():
                if type(target) is str:
                    target = _resolve_single_str(target)

                # for special case "energy" we enable sections for `forces` and `stress`
                # gradients by default
                if target_key == "energy" or target.get("quantity") == "energy":
                    target = OmegaConf.merge(CONF_ENERGY, target)
                else:
                    target = OmegaConf.merge(CONF_TARGET, target)

                if target["key"] is None:
                    target["key"] = target_key

                # update DictConfig to allow for config node interpolation
                conf_element["targets"][target_key] = target

                # merge and interpolate possibly present gradients with default gradient
                # config
                for gradient_key, gradient_conf in conf_element["targets"][
                    target_key
                ].items():
                    if gradient_key in KNOWN_GRADIENTS:
                        if gradient_conf is True:
                            gradient_conf = CONF_GRADIENT.copy()
                        elif type(gradient_conf) is str:
                            gradient_conf = _resolve_single_str(gradient_conf)

                        if isinstance(gradient_conf, DictConfig):
                            gradient_conf = OmegaConf.merge(
                                CONF_GRADIENT, gradient_conf
                            )

                            if gradient_conf["key"] is None:
                                gradient_conf["key"] = gradient_key

                            conf_element["targets"][target_key][gradient_key] = (
                                gradient_conf
                            )

                # If user sets the virial gradient and leaves the stress gradient
                # untouched, we disable the by default enabled stress gradient section.
                base_stress_gradient_conf = CONF_GRADIENT.copy()
                base_stress_gradient_conf["key"] = "stress"

                if (
                    (target_key == "energy" or target.get("quantity") == "energy")
                    and conf_element["targets"][target_key]["virial"]
                    and conf_element["targets"][target_key]["stress"]
                    == base_stress_gradient_conf
                ):
                    conf_element["targets"][target_key]["stress"] = False

                if (
                    conf_element["targets"][target_key]["stress"]
                    and conf_element["targets"][target_key]["virial"]
                ):
                    raise ValueError(
                        f"Cannot perform training with respect to virial and stress "
                        f"as in section {target_key}. Set either `virial: off` or "
                        "`stress: off`."
                    )

        if hasattr(conf_element, "extra_data"):
            for extra_data_key, extra_data in conf_element["extra_data"].items():
                if type(extra_data) is str:
                    extra_data = _resolve_single_str(extra_data)

                extra_data = OmegaConf.merge(CONF_EXTRA_DATA, extra_data)

                if extra_data["key"] is None:
                    extra_data["key"] = extra_data_key

                # update DictConfig to allow for config node interpolation
                conf_element["extra_data"][extra_data_key] = extra_data

    check_dataset_options(conf)
    return conf




[docs]
def expand_loss_config(conf: DictConfig) -> DictConfig:
    """
    Expand the loss configuration to fully specify loss terms for different targets and
    their gradients.

    Supported user forms
    --------------------

    1. Global type

       .. code-block:: yaml

          loss: <loss_type>

       Sets the default loss ``type`` for all targets **and** their gradients.

    2. Per-target types

       .. code-block:: yaml

          loss:
            <target_1>: <loss_type_1>
            <target_2>: <loss_type_2>

       Sets the loss type for the listed targets.
       Gradients for these targets keep their default configuration.

    3. Energy shorthands (forces / stress / virial)

       .. code-block:: yaml

          loss:
            <energy_target>:
              type: <loss_type>
              forces: <loss_type_for_forces>      # or mapping with loss fields
              stress: <loss_type_for_stress>      # or mapping

       or

       .. code-block:: yaml

          loss:
            <energy_target>:
              type: <loss_type>
              virial: <loss_type_for_virial>      # or mapping

       These are only allowed for energy-like targets (``quantity: energy`` or
       target name ``"energy"``):

       * ``forces`` expands to ``gradients.positions``
       * ``stress`` and ``virial`` expand to ``gradients.strain``

    4. Explicit gradient configuration

       .. code-block:: yaml

          loss:
            <target>:
              type: <loss_type>
              gradients:
                positions: <loss_type_for_grad>   # or mapping with loss fields
                strain:
                  type: ...
                  weight: ...
                  reduction: ...
                  ...

       This gives a fully explicit gradient specification for any target.

    :param conf: The (possibly shorthand) loss configuration to expand.
    :return: The expanded loss configuration with fully specified targets
             and gradients.
    """

    # Helpers
    def _new_defaults_spec() -> DictConfig:
        """
        Create a new loss config with default values.

        :return: A new loss config with default values.
        """
        return OmegaConf.create(init_with_defaults(LossSpecification))

    def _new_defaults_params() -> DictConfig:
        """
        Create a new loss config with default values.

        :return: A new loss config with default values.
        """
        return OmegaConf.create(init_with_defaults(LossParams))

    def _add_defaults_in_place(node: DictConfig) -> None:
        """
        Fill missing fields {type, weight, reduction, delta(if huber)}.

        :param node: The loss config node to fill in place.
        """
        d = _new_defaults_params()
        if "type" not in node:
            node["type"] = d["type"]
        if "weight" not in node:
            node["weight"] = d["weight"]
        if "reduction" not in node:
            node["reduction"] = d["reduction"]
        if node.get("type") == "huber" and "delta" not in node:
            node["delta"] = default_huber_loss_delta()

    # 1) Collect target / gradient info from training_set
    training_confs = conf["training_set"]
    if not isinstance(training_confs, ListConfig):
        training_confs = OmegaConf.create([training_confs])

    per_target_flags: dict[str, dict[str, bool]] = {}
    for ds in training_confs:
        targets = ds.get("targets") or {}
        for tname, tinfo in targets.items():
            is_energy = (tname == "energy") or (tinfo.get("quantity") == "energy")
            forces_flag = isinstance(tinfo.get("forces"), (dict, DictConfig))
            stress_flag = any(
                isinstance(tinfo.get(k), (dict, DictConfig))
                for k in ("stress", "virial")
            )

            entry = per_target_flags.setdefault(
                tname, {"is_energy": False, "forces": False, "stress": False}
            )
            entry["is_energy"] |= is_energy
            entry["forces"] |= forces_flag
            entry["stress"] |= stress_flag

    # 2) Create default loss entries per target
    defaults_map: dict[str, DictConfig] = {}
    for tname, flags in per_target_flags.items():
        base = _new_defaults_spec()
        g = base["gradients"]
        if flags["is_energy"]:
            if flags["forces"]:
                g["positions"] = _new_defaults_params()
            if flags["stress"]:
                g["strain"] = _new_defaults_params()
        defaults_map[tname] = base

    # 3) Parse user-provided loss configuration
    train_loss = conf["architecture"]["training"].get("loss", None)

    # Reject top-level entries that are not target names
    if isinstance(train_loss, (dict, DictConfig)):
        # Allowed top-level entries: only target names present in the dataset.
        allowed_targets = set(per_target_flags.keys())

        for key in train_loss.keys():
            val = train_loss[key]

            if key not in allowed_targets:
                raise ValueError(
                    f"Invalid top-level loss entry '{key}'. "
                    f"Allowed keys are: {sorted(allowed_targets)} or a single string."
                )

    global_loss_type: str | None = None
    per_target_raw: dict[str, DictConfig] = {}

    # Global string
    if isinstance(train_loss, str):
        global_loss_type = train_loss

    # Per-target dict
    elif isinstance(train_loss, (dict, DictConfig)):
        for tname, val in train_loss.items():
            if isinstance(val, str):
                # type-only shorthand on target
                node = OmegaConf.create({"type": val})
            else:
                node = OmegaConf.create(val)

            per_target_raw[tname] = node

    # 4) Assemble final loss per target
    final_loss = OmegaConf.create({})
    all_targets = set(per_target_flags.keys()) | set(per_target_raw.keys())

    for tname in all_targets:
        flags = per_target_flags.get(
            tname, {"is_energy": False, "forces": False, "stress": False}
        )
        is_energy = flags["is_energy"]

        # Start from defaults for known targets, otherwise from bare defaults
        if tname in defaults_map:
            base = OmegaConf.create(
                OmegaConf.to_container(defaults_map[tname], resolve=False)
            )
        else:
            base = _new_defaults_spec()

        gradients = base["gradients"]

        raw = per_target_raw.get(tname)

        # Override target fields from per-target config
        if raw is not None:
            target_overrides = {
                k: v
                for k, v in raw.items()
                if k not in ("forces", "stress", "virial", "gradients")
            }
            if target_overrides:
                base.merge_with(target_overrides)

        # Apply global loss type to targets and any existing default gradients
        if global_loss_type is not None:
            base["type"] = global_loss_type
            for g_cfg in gradients.values():
                g_cfg["type"] = global_loss_type

        # Gradient overrides from per-target config
        gradient_overrides: dict[str, dict] = {}

        if raw is not None:
            # Energy shorthands: forces, stress or virial
            has_forces_key = "forces" in raw
            has_stress_key = "stress" in raw
            has_virial_key = "virial" in raw

            if (has_forces_key or has_stress_key or has_virial_key) and not is_energy:
                raise ValueError(
                    f"'forces', 'stress', 'virial' loss entries are only allowed "
                    f"for energy-like targets, but target '{tname}' is not energy-like."
                )

            if has_stress_key and has_virial_key:
                raise ValueError(
                    f"Both 'stress' and 'virial' provided for target '{tname}'. "
                    "Use only one of them."
                )

            if is_energy:
                # forces -> positions
                if has_forces_key:
                    fval = raw["forces"]
                    cfg = (
                        {"type": fval}
                        if isinstance(fval, str)
                        else OmegaConf.to_container(fval, resolve=False)
                    )
                    gradient_overrides["positions"] = cfg

                # stress/virial -> strain
                if has_stress_key or has_virial_key:
                    sval = raw["stress"] if has_stress_key else raw["virial"]
                    cfg = (
                        {"type": sval}
                        if isinstance(sval, str)
                        else OmegaConf.to_container(sval, resolve=False)
                    )
                    gradient_overrides["strain"] = cfg

            # Explicit gradients section
            gnode = raw.get("gradients")
            if isinstance(gnode, (dict, DictConfig)):
                for gname, gval in gnode.items():
                    cfg = (
                        {"type": gval}
                        if isinstance(gval, str)
                        else OmegaConf.to_container(gval, resolve=False)
                    )
                    cur = gradient_overrides.get(gname, {})
                    cur_dc = OmegaConf.create(cur)
                    cfg_dc = OmegaConf.create(cfg)
                    merged = OmegaConf.merge(cur_dc, cfg_dc)
                    gradient_overrides[gname] = OmegaConf.to_container(
                        merged, resolve=False
                    )

        # Merge gradient overrides into base.gradients
        for gname, gcfg in gradient_overrides.items():
            if gname not in gradients:
                gradients[gname] = OmegaConf.create({})
            gradients[gname].merge_with(gcfg)

        # Fill in missing defaults for target
        _add_defaults_in_place(base)

        # Fill in missing defaults for each gradient
        for gcfg in gradients.values():
            _add_defaults_in_place(gcfg)

        final_loss[tname] = base

    conf["architecture"]["training"]["loss"] = final_loss
    return conf




[docs]
def check_units(
    actual_options: Union[DictConfig, ListConfig],
    desired_options: Union[DictConfig, ListConfig],
) -> None:
    """Perform consistency checks between two dataset configs.

    :param actual_options: The dataset options that you want to test.
    :param desired_options: The dataset options ``actual_options`` is tested against.

    :raises ValueError: If the length units are not consistent between
        the system in the dataset options.
    :raises ValueError: If a target is present only in desider_option and
        not in actual_option.
    :raises ValueError: If the unit of a target quantity is not consistent between
        the dataset option.
    """
    if type(actual_options) is DictConfig:
        actual_options = OmegaConf.create([actual_options])
    if type(desired_options) is DictConfig:
        desired_options = OmegaConf.create([desired_options])

    if len(actual_options) != len(desired_options):
        raise ValueError(
            f"Length of actual_options ({len(actual_options)}) and desired_options "
            f"({len(desired_options)}) is different!"
        )

    for actual_options_element, desired_options_element in zip(
        actual_options, desired_options, strict=True
    ):
        actual_length_unit = actual_options_element["systems"]["length_unit"]
        desired_length_unit = desired_options_element["systems"]["length_unit"]

        if actual_length_unit != desired_length_unit:
            raise ValueError(
                "`length_unit`s are inconsistent between one of the dataset options. "
                f"{actual_length_unit!r} != {desired_length_unit!r}."
            )

        for target in actual_options_element["targets"]:
            actual_unit = actual_options_element["targets"][target]["unit"]
            if target in desired_options_element["targets"]:
                desired_unit = desired_options_element["targets"][target]["unit"]
                if actual_unit != desired_unit:
                    raise ValueError(
                        f"Units of target {target!r} are inconsistent between one of "
                        f"the dataset options. {actual_unit!r} != {desired_unit!r}."
                    )
            else:
                raise ValueError(
                    f"Target {target!r} is not present in one of the given dataset "
                    "options."
                )