# Source code for imod.mf6.simulation

from __future__ import annotations

import collections
import pathlib
import subprocess
from copy import deepcopy
from datetime import datetime
from pathlib import Path
from typing import Any, Callable, DefaultDict, Iterable, Optional, Union, cast

import cftime
import dask
import jinja2
import numpy as np
import tomli
import tomli_w
import xarray as xr
import xugrid as xu

import imod
import imod.logging
import imod.mf6.exchangebase
from imod.common.interfaces.imodel import IModel
from imod.common.interfaces.isimulation import ISimulation
from imod.common.statusinfo import NestedStatusInfo
from imod.common.utilities.dataclass_type import DataclassType
from imod.common.utilities.mask import _mask_all_models
from imod.common.utilities.regrid import _regrid_like
from imod.common.utilities.version import (
    get_version,
    log_versions,
    prepend_content_with_version_info,
)
from imod.logging import standard_log_decorator
from imod.mf6.gwfgwf import GWFGWF
from imod.mf6.gwfgwt import GWFGWT
from imod.mf6.gwtgwt import GWTGWT
from imod.mf6.ims import Solution, SolutionPresetModerate
from imod.mf6.model import Modflow6Model
from imod.mf6.model_gwf import GroundwaterFlowModel
from imod.mf6.model_gwt import GroundwaterTransportModel
from imod.mf6.multimodel.exchange_creator_structured import ExchangeCreator_Structured
from imod.mf6.multimodel.exchange_creator_unstructured import (
    ExchangeCreator_Unstructured,
)
from imod.mf6.multimodel.modelsplitter import create_partition_info, slice_model
from imod.mf6.out import open_cbc, open_conc, open_hds
from imod.mf6.package import Package
from imod.mf6.ssm import SourceSinkMixing
from imod.mf6.validation_settings import ValidationSettings
from imod.mf6.write_context import WriteContext
from imod.prepare.partition import create_partition_labels
from imod.prepare.topsystem.default_allocation_methods import (
    SimulationAllocationOptions,
    SimulationDistributingOptions,
)
from imod.schemata import ValidationError
from imod.typing import GridDataArray, GridDataset
from imod.typing.grid import (
    concat,
    is_equal,
    is_unstructured,
    merge_partitions,
)

# Maps every output kind accepted by ``Modflow6Simulation._open_output`` to the
# reader function that is called to open the corresponding output file.
OUTPUT_FUNC_MAPPING: dict[str, Callable] = {
    "head": open_hds,
    "concentration": open_conc,
    "budget-flow": open_cbc,
    "budget-transport": open_cbc,
}

# Maps every output kind to the model class expected to produce it. Used to
# select the models of the right type in the simulation and to type-check a
# model before its output is opened.
OUTPUT_MODEL_MAPPING: dict[
    str, type[GroundwaterFlowModel] | type[GroundwaterTransportModel]
] = {
    "head": GroundwaterFlowModel,
    "concentration": GroundwaterTransportModel,
    "budget-flow": GroundwaterFlowModel,
    "budget-transport": GroundwaterTransportModel,
}


def get_models(simulation: Modflow6Simulation) -> dict[str, Modflow6Model]:
    """Return the entries of ``simulation`` that are Modflow 6 models, keyed by name."""
    models: dict[str, Modflow6Model] = {}
    for name, entry in simulation.items():
        if isinstance(entry, Modflow6Model):
            models[name] = entry
    return models


def get_packages(simulation: Modflow6Simulation) -> dict[str, Package]:
    """Return the entries of ``simulation`` that are packages, keyed by name."""
    packages: dict[str, Package] = {}
    for name, entry in simulation.items():
        if isinstance(entry, Package):
            packages[name] = entry
    return packages



[docs]
class Modflow6Simulation(collections.UserDict, ISimulation):
    """
    Modflow6Simulation is a class that represents a Modflow 6 simulation. It
    contains data on simulation timing, models that are present in the
    simulation, how models exchange information, and how models are solved.
    More information can be found here:
    https://water.usgs.gov/water-resources/software/MODFLOW-6/mf6io_6.4.2.pdf#page=20

    The simulation is dictionary-like (it derives from
    ``collections.UserDict``): models and simulation-level packages are
    assigned to it under user-chosen keys, as shown in the examples below.

    Parameters
    ----------
    name: str
        Name of the simulation. This is used to create the simulation name file
        and the directory in which the simulation is written.
    validation_settings: ValidationSettings, optional
        Settings for validation of the simulation. If not provided, default
        settings are used. These settings can be used to control whether the
        simulation is validated at write time, and whether strict validation
        rules are applied.

    Examples
    --------
    Create a Modflow 6 simulation and add a groundwater flow model to it:

    >>> import imod
    >>> simulation = imod.mf6.Modflow6Simulation("example_simulation")
    >>> simulation["GWF"] = imod.mf6.GroundwaterFlowModel()

    You can configure the validation settings for the simulation as follows:

    >>> validation_settings = imod.mf6.ValidationSettings(ignore_time=True)
    >>> simulation = imod.mf6.Modflow6Simulation("example_simulation", validation_settings)

    See :class:`imod.mf6.ValidationSettings` for information on how to configure
    validation settings. Configuring :class:`imod.mf6.ValidationSettings` can
    help performance or reduce the strictness of validation for some packages,
    namely the Well and HFB packages.
    """

    def _initialize_template(self):
        """Load the ``sim-nam.j2`` Jinja2 template and store it on ``self._template``."""
        environment = jinja2.Environment(
            loader=jinja2.PackageLoader("imod", "templates/mf6"),
            keep_trailing_newline=True,
        )
        self._template = environment.get_template("sim-nam.j2")


[docs]
    def __init__(
        self, name: str, validation_settings: Optional[ValidationSettings] = None
    ):
        """
        Create an empty simulation.

        Parameters
        ----------
        name: str
            Name of the simulation.
        validation_settings: ValidationSettings, optional
            Validation settings to use; a default ``ValidationSettings()`` is
            created when omitted.
        """
        super().__init__()
        self.name = name
        # Stays None until ``write`` has stored the output directory.
        self.directory = None
        self._initialize_template()
        self._validation_context = (
            ValidationSettings() if validation_settings is None else validation_settings
        )


    def __setitem__(self, key, value):
        """Store ``value`` under ``key``; delegates unchanged to the base class."""
        super().__setitem__(key, value)

    def update(self, *args, **kwargs):
        for k, v in dict(*args, **kwargs).items():
            self[k] = v

    def _get_pkgkey(self, pkg_id):
        """
        Get package key that belongs to a certain pkg_id, since the keys are
        user specified.
        """
        key = [
            pkgname
            for pkgname, pkg in self.items()
            if isinstance(pkg, Package) and (pkg._pkg_id == pkg_id)
        ]
        nkey = len(key)
        if nkey > 1:
            raise ValueError(f"Multiple instances of {key} detected")
        elif nkey == 1:
            return key[0]
        else:
            return None


[docs]
    @standard_log_decorator()
    def create_time_discretization(self, additional_times, validate: bool = True):
        """
        Collect all unique times from model packages and additional given
        `times`. These unique times are used as stress periods in the model. All
        stress packages must have the same starting time. Function creates
        TimeDiscretization object which is set to self["time_discretization"]

        The time discretization in imod-python works as follows:

        - The datetimes of all packages you send in are always respected
        - Subsequently, the input data you use is always included fully as well
        - All times are treated as starting times for the stress: a stress is
          always applied until the next specified date
        - For this reason, a final time is required to determine the length of
          the last stress period
        - Additional times can be provided to force shorter stress periods &
          more detailed output
        - Every stress has to be defined on the first stress period (this is a
          modflow requirement)

        Or visually (every letter a date in the time axes):

        >>> recharge a - b - c - d - e - f
        >>> river    g - - - - h - - - - j
        >>> times    - - - - - - - - - - - i
        >>> model    a - b - c h d - e - f i

        with the stress periods defined between these dates. I.e. the model
        times are the set of all times you include in the model.

        Parameters
        ----------
        additional_times : str, datetime; or iterable of str, datetimes.
            Times to add to the time discretization. At least one single time
            should be given, which will be used as the ending time of the
            simulation. A single time may be passed without wrapping it in a
            list.
        validate : bool, default True
            Forwarded as ``validate`` to ``imod.mf6.TimeDiscretization``.

        Note
        ----
        To set the other parameters of the TimeDiscretization object, you have
        to set these to the object after calling this function. This method
        also sets ``self.use_cftime``.

        Example
        -------
        >>> simulation = imod.mf6.Modflow6Simulation("example")
        >>> simulation.create_time_discretization(
        ...     additional_times=["2000-01-01", "2000-01-02"]
        ... )
        >>> # Set number of timesteps
        >>> simulation["time_discretization"]["n_timesteps"] = 5
        """
        self.use_cftime = any(
            model._use_cftime()
            for model in self.values()
            if isinstance(model, Modflow6Model)
        )

        # A single time is documented as valid input. Wrap it, otherwise a
        # string would be iterated character by character and a datetime
        # would not be iterable at all.
        if isinstance(
            additional_times, (str, datetime, np.datetime64, cftime.datetime)
        ):
            additional_times = [additional_times]

        times = [
            imod.util.time.to_datetime_internal(time, self.use_cftime)
            for time in additional_times
        ]
        for model in self.values():
            if isinstance(model, Modflow6Model):
                times.extend(model._yield_times())

        # np.unique also sorts
        times = np.unique(np.hstack(times))

        duration = imod.util.time.timestep_duration(times, self.use_cftime)
        # Generate time discretization, just rely on default arguments
        # Probably won't be used that much anyway?
        # The last time only marks the end of the final stress period, so it
        # is not a period start and is left out of the coordinate.
        timestep_duration = xr.DataArray(
            duration, coords={"time": np.array(times)[:-1]}, dims=("time",)
        )
        self["time_discretization"] = imod.mf6.TimeDiscretization(
            timestep_duration=timestep_duration, validate=validate
        )


    def _render(self, write_context: WriteContext):
        """Renders simulation namefile"""
        d: dict[str, Any] = {}
        models = []
        solutiongroups = []
        for key, value in self.items():
            if isinstance(value, Modflow6Model):
                model_name_file = pathlib.Path(
                    write_context.root_directory / pathlib.Path(f"{key}", f"{key}.nam")
                ).as_posix()
                models.append((value.model_id, model_name_file, key))
            elif isinstance(value, Package):
                if value._pkg_id == "tdis":
                    d["tdis6"] = f"{key}.tdis"
                elif value._pkg_id == "ims":
                    slnnames = value["modelnames"].values
                    modeltypes = set()
                    for name in slnnames:
                        try:
                            modeltypes.add(type(self[name]))
                        except KeyError:
                            raise KeyError(f"model {name} of {key} not found")

                    if len(modeltypes) > 1:
                        raise ValueError(
                            "Only a single type of model allowed in a solution"
                        )
                    solutiongroups.append(("ims6", f"{key}.ims", slnnames))

        d["models"] = models
        if len(models) > 1:
            d["exchanges"] = self.get_exchange_relationships()

        d["solutiongroups"] = [solutiongroups]
        return self._template.render(d)

    def _write_tdis_package(self, globaltimes, write_context):
        """Write time discretization package, and set/clear ats filename if needed"""
        ats_pkgname = self._get_pkgkey("ats")
        if ats_pkgname:
            self["time_discretization"]._set_ats_filename(ats_pkgname, write_context)
        else:
            # Make sure no ats_filename is set (in case it was set before)
            self["time_discretization"]._clear_ats_filename()
        self["time_discretization"]._write(
            pkgname="time_discretization",
            globaltimes=globaltimes,
            write_context=write_context,
        )


[docs]
    @standard_log_decorator()
    def write(
        self,
        directory=".",
        binary=True,
        validate: bool = True,
        use_absolute_paths=False,
    ):
        """
        Write Modflow6 simulation, including assigned groundwater flow and
        transport models.

        Besides writing files, this method stores ``validate`` on the
        simulation's validation settings, disables strict well validation when
        the simulation is split, stores generated GWF-GWT exchanges under the
        ``"gwtgwf_exchanges"`` key, and sets ``self.directory`` on success.

        Parameters
        ----------
        directory: str, pathlib.Path
            Directory to write Modflow 6 simulation to.
        binary: ({True, False}, optional)
            Whether to write time-dependent input for stress packages as binary
            files, which are smaller in size, or more human-readable text files.
        validate: ({True, False}, optional)
            Whether to validate the Modflow6 simulation, including models, at
            write. If True, erroneous model input will throw a
            ``ValidationError``.
        use_absolute_paths: ({True, False}, optional)
            True if all paths written to the mf6 inputfiles should be absolute.

        Raises
        ------
        ValidationError
            If any model reported errors while being written. The error is
            raised after all models have been processed.

        Examples
        --------
        Write the simulation to a directory:

        >>> simulation.write("path/to/simulation")

        If you continue to run into ValidationErrors, you can disable the validation
        by setting the ``validate`` argument to ``False``. This is not recommended:

        >>> simulation.write("path/to/simulation", validate=False)
        """
        # create write context
        write_context = WriteContext(directory, binary, use_absolute_paths)
        self._validation_context.validate = validate
        if self.is_split():
            self._validation_context.strict_well_validation = False

        # Check models for required content
        for key, model in self.items():
            # skip timedis, exchanges
            if isinstance(model, Modflow6Model):
                model._model_checks(key)

        # Generate GWF-GWT exchanges
        if gwfgwt_exchanges := self._generate_gwfgwt_exchanges():
            self["gwtgwf_exchanges"] = gwfgwt_exchanges

        directory = pathlib.Path(directory)
        directory.mkdir(exist_ok=True, parents=True)

        # Write simulation namefile
        mfsim_content = self._render(write_context)
        mfsim_content = prepend_content_with_version_info(mfsim_content)
        mfsim_path = directory / "mfsim.nam"
        with open(mfsim_path, "w") as f:
            f.write(mfsim_content)

        # Write time discretization file
        globaltimes = self["time_discretization"]["time"].values
        self._write_tdis_package(globaltimes, write_context)

        # Write individual models
        # Validation results of all models are collected here and only raised
        # after the loop below has finished.
        status_info = NestedStatusInfo("Simulation validation status")

        for key, value in self.items():
            model_write_context = write_context.copy_with_new_write_directory(
                write_context.simulation_directory
            )
            # skip timedis, exchanges
            if isinstance(value, Modflow6Model):
                status_info.add(
                    value._write(
                        modelname=key,
                        globaltimes=globaltimes,
                        write_context=model_write_context,
                        validate_context=self._validation_context,
                    )
                )
            elif isinstance(value, Package):
                if value._pkg_id in ["ims", "ats"]:
                    # Copy write_context again for packages to avoid changing it
                    # down the line and risk clashing with the model write
                    # context.
                    pkg_write_context = write_context.copy_with_new_write_directory(
                        write_context.simulation_directory
                    )
                    value._write(key, globaltimes, pkg_write_context)
            elif isinstance(value, list):
                # Lists hold exchanges; entries of any other type are skipped.
                for exchange in value:
                    if isinstance(exchange, imod.mf6.exchangebase.ExchangeBase):
                        exchange._write(
                            exchange.package_name(), globaltimes, write_context
                        )

        if status_info.has_errors():
            raise ValidationError("\n" + status_info.to_string())

        # Remember where the simulation was written; ``run`` and the output
        # readers require this to be set.
        self.directory = directory



[docs]
    @standard_log_decorator()
    def run(self, mf6path: Union[str, Path] = "mf6") -> None:
        """
        Run Modflow 6 simulation. This method runs a subprocess calling
        ``mf6path`` from within the directory the simulation was written to.
        The argument defaults to ``mf6``, which means the Modflow 6 executable
        is expected to be added to your PATH environment variable.
        :doc:`See this writeup how to add Modflow 6 to your PATH on Windows </examples/mf6/index>`

        Note that the ``write`` method needs to be called before this method is
        called.

        Parameters
        ----------
        mf6path: Union[str, Path]
            Path to the Modflow 6 executable. Defaults to calling ``mf6``.

        Raises
        ------
        RuntimeError
            If the simulation has not been written yet, or if the executable
            exits with a non-zero return code.

        Examples
        --------
        Make sure you write your model first

        >>> simulation.write("path/to/model")
        >>> simulation.run()
        """
        if self.directory is None:
            raise RuntimeError(f"Simulation {self.name} has not been written yet.")
        with imod.util.cd(self.directory):
            completed = subprocess.run(mf6path, capture_output=True)
            exit_code = completed.returncode
            if exit_code == 0:
                return
            # The captured standard output is included in the error message.
            captured = completed.stdout.decode()
            raise RuntimeError(
                f"Simulation {self.name}: {mf6path} failed to run with returncode "
                f"{exit_code}, and error message:\n\n{captured} "
            )



[docs]
    @standard_log_decorator()
    def open_head(
        self,
        dry_nan: bool = False,
        simulation_start_time: Optional[np.datetime64] = None,
        time_unit: Optional[str] = "d",
    ) -> GridDataArray:
        """
        Open heads of finished simulation, requires that the ``run`` method has
        been called.

        The data is lazily read per timestep and automatically converted into
        (dense) xr.DataArrays or xu.UgridDataArrays, for DIS and DISV
        respectively. The conversion is done via the information stored in the
        Binary Grid file (GRB).

        Parameters
        ----------
        dry_nan: bool, default value: False.
            Whether to convert dry values to NaN.
        simulation_start_time : Optional datetime
            The time and date corresponding to the beginning of the simulation.
            Use this to convert the time coordinates of the output array to
            calendar time/dates. time_unit must also be present if this
            argument is present.
        time_unit: Optional str
            The time unit MF6 is working in, in string representation.
            Only used if simulation_start_time was provided.
            Admissible values are:
            ns -> nanosecond
            ms -> millisecond
            s -> second
            m -> minute
            h -> hour
            d -> day
            w -> week
            Units "month" or "year" are not supported, as they do not
            represent unambiguous timedelta durations.

        Returns
        -------
        head: Union[xr.DataArray, xu.UgridDataArray]

        Examples
        --------
        Make sure you write and run your model first

        >>> simulation.write("path/to/model")
        >>> simulation.run()

        Then open heads:

        >>> head = simulation.open_head()
        """
        return self._open_output(
            "head",
            dry_nan=dry_nan,
            simulation_start_time=simulation_start_time,
            time_unit=time_unit,
        )



[docs]
    @standard_log_decorator()
    def open_transport_budget(
        self,
        species_ls: Optional[list[str]] = None,
        simulation_start_time: Optional[np.datetime64] = None,
        time_unit: Optional[str] = "d",
    ) -> GridDataArray | GridDataset:
        """
        Open transport budgets of finished simulation, requires that the ``run``
        method has been called.

        The data is lazily read per timestep and automatically converted into
        (dense) xr.DataArrays or xu.UgridDataArrays, for DIS and DISV
        respectively. The conversion is done via the information stored in the
        Binary Grid file (GRB).

        Parameters
        ----------
        species_ls: list of strings, default value: None.
            List of species names, which will be used to concatenate the
            budgets along the ``"species"`` dimension, in case the
            simulation has multiple species and thus multiple transport models.
            If None, transport model names will be used as species names.
        simulation_start_time : Optional datetime
            Forwarded to the budget reader; see :meth:`open_head` for a
            description.
        time_unit: Optional str
            Forwarded to the budget reader; see :meth:`open_head` for the
            admissible values.

        Returns
        -------
        budget: Dict[str, xr.DataArray|xu.UgridDataArray]
            DataArray contains float64 data of the budgets, with dimensions ("time",
            "layer", "y", "x").

        """
        # The budget reader is always called with ``merge_to_dataset=True``
        # and ``flowja=False`` for transport budgets.
        return self._open_output(
            "budget-transport",
            species_ls=species_ls,
            simulation_start_time=simulation_start_time,
            time_unit=time_unit,
            merge_to_dataset=True,
            flowja=False,
        )



[docs]
    @standard_log_decorator()
    def open_flow_budget(
        self,
        flowja: bool = False,
        simulation_start_time: Optional[np.datetime64] = None,
        time_unit: Optional[str] = "d",
    ) -> GridDataArray | GridDataset:
        """
        Open flow budgets of finished simulation, requires that the ``run``
        method has been called.

        The data is lazily read per timestep and automatically converted into
        (dense) xr.DataArrays or xu.UgridDataArrays, for DIS and DISV
        respectively. The conversion is done via the information stored in the
        Binary Grid file (GRB).

        The ``flowja`` argument controls whether the flow-ja-face array (if
        present) is returned in grid form or "as is". By default
        ``flowja=False`` and the array is returned in "grid form", meaning:

            * DIS: in right, front, and lower face flow. All flows are placed in
              the cell.
            * DISV: in horizontal and lower face flow. The horizontal flows are
              placed on the edges and the lower face flow is placed on the faces.

        When ``flowja=True``, the flow-ja-face array is returned as it is found in
        the CBC file, with a flow for every cell to cell connection. Additionally,
        a ``connectivity`` DataArray is returned describing for every cell (n) its
        connected cells (m).

        Parameters
        ----------
        flowja: bool, default value: False
            Whether to return the flow-ja-face values "as is" (``True``) or in a
            grid form (``False``).
        simulation_start_time : Optional datetime
            Forwarded to the budget reader; see :meth:`open_head` for a
            description.
        time_unit: Optional str
            Forwarded to the budget reader; see :meth:`open_head` for the
            admissible values.

        Returns
        -------
        budget: Dict[str, xr.DataArray|xu.UgridDataArray]
            DataArray contains float64 data of the budgets, with dimensions ("time",
            "layer", "y", "x").

        Examples
        --------
        Make sure you write and run your model first

        >>> simulation.write("path/to/model")
        >>> simulation.run()

        Then open budgets:

        >>> budget = simulation.open_flow_budget()

        Check the contents:

        >>> print(budget.keys())

        Get the drainage budget, compute a time mean for the first layer:

        >>> drn_budget = budget["drn"]
        >>> mean = drn_budget.sel(layer=1).mean("time")
        """
        # The budget reader is always called with ``merge_to_dataset=True``.
        return self._open_output(
            "budget-flow",
            flowja=flowja,
            simulation_start_time=simulation_start_time,
            time_unit=time_unit,
            merge_to_dataset=True,
        )



[docs]
    @standard_log_decorator()
    def open_concentration(
        self,
        species_ls: Optional[list[str]] = None,
        dry_nan: bool = False,
        simulation_start_time: Optional[np.datetime64] = None,
        time_unit: Optional[str] = "d",
    ) -> GridDataArray:
        """
        Open concentration of finished simulation, requires that the ``run``
        method has been called.

        The data is lazily read per timestep and automatically converted into
        (dense) xr.DataArrays or xu.UgridDataArrays, for DIS and DISV
        respectively. The conversion is done via the information stored in the
        Binary Grid file (GRB).

        Parameters
        ----------
        species_ls: list of strings, default value: None.
            List of species names, which will be used to concatenate the
            concentrations along the ``"species"`` dimension, in case the
            simulation has multiple species and thus multiple transport models.
            If None, transport model names will be used as species names.
        dry_nan: bool, default value: False.
            Whether to convert dry values to NaN.
        simulation_start_time : Optional datetime
            Forwarded to the concentration reader; see :meth:`open_head` for a
            description.
        time_unit: Optional str
            Forwarded to the concentration reader; see :meth:`open_head` for
            the admissible values.

        Returns
        -------
        concentration: Union[xr.DataArray, xu.UgridDataArray]

        Examples
        --------
        Make sure you write and run your model first

        >>> simulation.write("path/to/model")
        >>> simulation.run()

        Then open concentrations:

        >>> concentration = simulation.open_concentration()
        """
        return self._open_output(
            "concentration",
            species_ls=species_ls,
            dry_nan=dry_nan,
            simulation_start_time=simulation_start_time,
            time_unit=time_unit,
        )


    def _open_output(self, output: str, **settings) -> GridDataArray | GridDataset:
        """
        Open an output variable for one or several models.

        Flow outputs ("head", "budget-flow") are opened for all flow models at
        once; transport outputs ("concentration", "budget-transport") are
        opened per species and concatenated.

        Parameters
        ----------
        output: str
            Output variable name to open
        **settings:
            Extra settings that need to be passed through to the respective
            output function.

        Raises
        ------
        ValueError
            If the simulation contains no model of the type that produces
            ``output``.
        """
        model_cls = OUTPUT_MODEL_MAPPING[output]
        modelnames = self.get_models_of_type(model_cls._model_id).keys()
        if len(modelnames) == 0:
            raise ValueError(
                f"Could not find any models of appropriate type for {output}, "
                f"make sure a model of type {model_cls} is assigned to simulation."
            )

        if output in ("head", "budget-flow"):
            return self._open_single_output(list(modelnames), output, **settings)
        if output in ("concentration", "budget-transport"):
            return self._concat_species(output, **settings)
        raise RuntimeError(f"Unexpected error when opening {output} for {modelnames}")

    def _open_single_output(
        self, modelnames: list[str], output: str, **settings
    ) -> GridDataArray | GridDataset:
        """
        Open single output, e.g. concentration of single species, or heads. This
        can be output of partitioned models that need to be merged.
        """
        if len(modelnames) == 0:
            modeltype = OUTPUT_MODEL_MAPPING[output]
            raise ValueError(
                f"Could not find any models of appropriate type for {output}, "
                f"make sure a model of type {modeltype} is assigned to simulation."
            )
        elif len(modelnames) == 1:
            modelname = next(iter(modelnames))
            return self._open_single_output_single_model(modelname, output, **settings)
        elif self.is_split():
            if "budget" in output:
                return self._merge_budgets(modelnames, output, **settings)
            else:
                return self._merge_states(modelnames, output, **settings)
        raise ValueError("error in _open_single_output")

    def _merge_states(
        self, modelnames: list[str], output: str, **settings
    ) -> GridDataArray:
        """Open ``output`` for every given model and merge the partitions."""
        partitions = [
            self._open_single_output_single_model(name, output, **settings)
            for name in modelnames
        ]
        return merge_partitions(partitions)

    def _merge_and_assign_exchange_budgets(self, cbc: GridDataset) -> GridDataset:
        """
        Merge and assign exchange budgets to cell by cell budgets:
        cbc[[gwf-gwf_1, gwf-gwf_3]] to cbc[gwf-gwf]
        """
        exchange_names = [
            key
            for key in cast(Iterable[str], cbc.keys())
            if (("gwf-gwf" in key) or ("gwt-gwt" in key))
        ]
        exchange_budgets = cbc[exchange_names].to_array().sum(dim="variable")
        cbc = cbc.drop_vars(exchange_names)
        # "gwf-gwf" or "gwt-gwt"
        exchange_key = exchange_names[0].split("_")[1]
        cbc[exchange_key] = exchange_budgets
        return cbc

    def _pad_missing_variables(self, cbc_per_partition: list[GridDataset]) -> None:
        """
        Boundary conditions can be missing in certain partitions, as do their
        budgets, in which case we manually assign an empty grid of nans.
        """
        dims_per_unique_key = {
            key: cbc[key].dims for cbc in cbc_per_partition for key in cbc.keys()
        }
        for cbc in cbc_per_partition:
            missing_keys = set(dims_per_unique_key.keys()) - set(cbc.keys())

            for missing in missing_keys:
                missing_dims = dims_per_unique_key[missing]
                missing_coords = {dim: cbc.coords[dim] for dim in missing_dims}

                shape = tuple([len(missing_coords[dim]) for dim in missing_dims])
                chunks = (1,) + shape[1:]
                missing_data = dask.array.full(shape, np.nan, chunks=chunks)

                missing_grid = xr.DataArray(
                    missing_data, dims=missing_dims, coords=missing_coords
                )
                if isinstance(cbc, xu.UgridDataset):
                    missing_grid = xu.UgridDataArray(
                        missing_grid,
                        grid=cbc.ugrid.grid,
                    )
                cbc[missing] = missing_grid

    def _merge_budgets(
        self, modelnames: list[str], output: str, **settings
    ) -> GridDataset:
        if settings["flowja"] is True:
            raise ValueError("``flowja`` cannot be set to True when merging budgets.")

        cbc_per_partition = []
        for modelname in modelnames:
            cbc = self._open_single_output_single_model(modelname, output, **settings)
            # Merge and assign exchange budgets to dataset
            # FUTURE: Refactor to insert these exchange budgets in horizontal
            # flows.
            cbc = self._merge_and_assign_exchange_budgets(cbc)
            if not is_unstructured(cbc):
                cbc = cbc.where(self[modelname].domain, other=np.nan)
            cbc_per_partition.append(cbc)

        self._pad_missing_variables(cbc_per_partition)

        return merge_partitions(cbc_per_partition)

    def _concat_species(
        self, output: str, species_ls: Optional[list[str]] = None, **settings
    ) -> GridDataArray | GridDataset:
        # groupby flow model, to somewhat enforce consistent transport model
        # ordening. Say:
        # F = Flow model, T = Transport model
        # a = species "a", b = species "b"
        # 1 = partition 1, 2 = partition 2
        # then this:
        # F1Ta1 F1Tb1 F2Ta2 F2Tb2 -> F1: [Ta1, Tb1], F2: [Ta2, Tb2]
        # F1Ta1 F2Tb1 F1Ta1 F2Tb2 -> F1: [Ta1, Tb1], F2: [Ta2, Tb2]
        tpt_models_per_flow_model = self._get_transport_models_per_flow_model()
        all_tpt_names = list(tpt_models_per_flow_model.values())

        # [[Ta_1, Tb_1], [Ta_2, Tb_2]] -> [[Ta_1, Ta_2], [Tb_1, Tb_2]]
        # [[Ta, Tb]] -> [[Ta], [Tb]]
        tpt_names_per_species = list(zip(*all_tpt_names))

        if self.is_split():
            # [[Ta_1, Tb_1], [Ta_2, Tb_2]] -> [Ta, Tb]
            unpartitioned_modelnames = [
                tpt_name.rpartition("_")[0] for tpt_name in all_tpt_names[0]
            ]
        else:
            # [[Ta, Tb]] -> [Ta, Tb]
            unpartitioned_modelnames = all_tpt_names[0]

        if not species_ls:
            species_ls = unpartitioned_modelnames

        if len(species_ls) != len(tpt_names_per_species):
            raise ValueError(
                "species_ls does not equal the number of transport models, "
                f"expected length {len(tpt_names_per_species)}, received {species_ls}"
            )

        if len(species_ls) == 1:
            return self._open_single_output(
                list(tpt_names_per_species[0]), output, **settings
            )

        # Concatenate species
        outputs = []
        for species, tpt_names in zip(species_ls, tpt_names_per_species):
            output_data = self._open_single_output(list(tpt_names), output, **settings)
            output_data = output_data.assign_coords(species=species)
            outputs.append(output_data)
        return concat(outputs, dim="species")

    def _open_single_output_single_model(
        self, modelname: str, output: str, **settings
    ) -> GridDataArray | GridDataset:
        """
        Read one output variable of one model from disk.

        Parameters
        ----------
        modelname: str
            Name of the model in this simulation whose output is read.
        output: str
            Output variable name to open. It selects both the function used
            to open the file and the model type expected to produce it.
        **settings:
            Extra settings that are passed through unchanged to the
            respective output function.

        Raises
        ------
        RuntimeError
            If the simulation has no directory yet, or if the output file
            does not exist.
        TypeError
            If the model is not of the type expected for ``output``.
        """
        reader = OUTPUT_FUNC_MAPPING[output]
        required_modeltype = OUTPUT_MODEL_MAPPING[output]

        simulation_dir = self.directory
        if simulation_dir is None:
            raise RuntimeError(f"Simulation {self.name} has not been written yet.")
        model_dir = simulation_dir / modelname

        model = self[modelname]
        if not isinstance(model, required_modeltype):
            raise TypeError(
                f"{modelname} not a {required_modeltype}, instead got {type(model)}"
            )

        # The output control package knows where the model writes its output.
        oc_package = model[model._get_pkgkey("oc")]
        # "budget-flow" and "budget-transport" both refer to "budget".
        oc_variable = output.split("-")[0]
        # Joining with the simulation directory forces the path to always
        # include it.
        output_file = simulation_dir / oc_package._get_output_filepath(
            model_dir, oc_variable
        )

        grb_file = self._get_grb_path(modelname)

        if output_file.exists():
            return reader(output_file, grb_file, **settings)
        raise RuntimeError(
            f"Could not find output in {output_file}, check if you already ran simulation {self.name}"
        )

    def _get_flow_modelname_coupled_to_transport_model(
        self, transport_modelname: str
    ) -> str:
        """
        Get name of flow model coupled to transport model, throws error if
        multiple flow models are couple to 1 transport model.
        """
        exchanges = self.get_exchange_relationships()
        coupled_flow_models = [
            i[2]
            for i in exchanges
            if (i[3] == transport_modelname) & (i[0] == "GWF6-GWT6")
        ]
        if len(coupled_flow_models) != 1:
            raise ValueError(
                f"Exactly one flow model must be coupled to transport model {transport_modelname}, got: {coupled_flow_models}"
            )
        return coupled_flow_models[0]

    def _get_grb_path(self, modelname: str) -> Path:
        """
        Finds appropriate grb path belonging to modelname. Grb files are not
        written for transport models, so this method always returns a path to a
        flowmodel. In case of a transport model, it returns the path to the grb
        file its coupled flow model.
        """
        if self.directory is None:
            raise ValueError("Directory not set")

        model = self[modelname]
        # Get grb path
        if isinstance(model, GroundwaterTransportModel):
            flow_model_name = self._get_flow_modelname_coupled_to_transport_model(
                modelname
            )
            flow_model_path = self.directory / flow_model_name
        else:
            flow_model_path = self.directory / modelname

        diskey = model.get_diskey()
        dis_id = model[diskey]._pkg_id
        return flow_model_path / f"{diskey}.{dis_id}.grb"


[docs]
    @standard_log_decorator()
    def dump(
        self,
        directory=".",
        validate: bool = True,
        mdal_compliant: bool = False,
        crs=None,
    ) -> None:
        """
        Dump simulation to files.

        A TOML file named after the simulation is written, which points to
        the data of each item in the simulation. Models dump themselves and
        are listed with the path of their own TOML file, relative to
        ``directory``; exchanges and the remaining packages are each stored as
        a separate NetCDF. Structured grids are saved as regular NetCDFs,
        unstructured grids are saved as UGRID NetCDF. Structured grids are
        always made GDAL compliant, unstructured grids can be made MDAL
        compliant optionally.

        Parameters
        ----------
        directory: str or Path, optional
            Directory to dump simulation into; it is created if it does not
            exist. Defaults to current working directory.
        validate: bool, optional
            Whether to validate simulation data. Defaults to True.
        mdal_compliant: bool, optional
            Convert data with
            :func:`imod.prepare.spatial.mdal_compliant_ugrid2d` to MDAL
            compliant unstructured grids. Defaults to False.
        crs: Any, optional
            Anything accepted by rasterio.crs.CRS.from_user_input
            Requires ``rioxarray`` installed.

        Examples
        --------
        Dump simulation to directory:

        >>> mf6_sim.dump("path/to/directory")

        You can load the dumped simulation back with:

        >>> loaded_sim = Modflow6Simulation.from_file("path/to/directory/simulation_name.toml")

        If you keep on getting ValidationErrors, you can set
        ``validate=False`` to skip validation, but this is not recommended.

        >>> mf6_sim.dump("path/to/directory", validate=False)

        You can then fix the issues after loading the simulation in a later
        stage. If you want to dump the simulation in a form that is nicely
        loaded into QGIS, you can set ``mdal_compliant=True``:

        >>> mf6_sim.dump("path/to/directory", mdal_compliant=True, crs="EPSG:4326")
        """
        out_dir = pathlib.Path(directory)
        out_dir.mkdir(parents=True, exist_ok=True)

        toml_content: DefaultDict[str, dict] = collections.defaultdict(dict)
        # Record the version that wrote the dump.
        toml_content["version"] = {"imod-python": get_version()}

        exchange_keys = ("gwtgwf_exchanges", "split_exchanges")
        for key, value in self.items():
            cls_name = type(value).__name__

            if isinstance(value, Modflow6Model):
                # Models write their own files; only reference their TOML.
                model_toml_path = value.dump(
                    out_dir, key, validate, mdal_compliant, crs
                )
                toml_content[cls_name][key] = model_toml_path.relative_to(
                    out_dir
                ).as_posix()
                continue

            if key in exchange_keys:
                # Exchanges are grouped per exchange class name.
                paths_per_class = collections.defaultdict(list)
                toml_content[key] = paths_per_class
                for exchange_package in self[key]:
                    _, filename, _, _ = exchange_package.get_specification()
                    exchange_cls_name = type(exchange_package).__name__
                    nc_name = f"{filename}.nc"
                    exchange_package.dataset.to_netcdf(out_dir / nc_name)
                    paths_per_class[exchange_cls_name].append(nc_name)
                continue

            # Remaining items are stored as a single NetCDF named after
            # their key.
            nc_name = f"{key}.nc"
            value.dataset.to_netcdf(out_dir / nc_name)
            toml_content[cls_name][key] = nc_name

        with open(out_dir / f"{self.name}.toml", "wb") as f:
            tomli_w.dump(toml_content, f)



[docs]
    @staticmethod
    @standard_log_decorator()
    def from_file(toml_path):
        """
        Load a Modflow6Simulation from a TOML file that was previously
        written with :meth:`imod.mf6.Modflow6Simulation.dump`.

        The simulation is named after the stem of the TOML file name, and all
        paths listed in the TOML file are resolved relative to the directory
        that contains it.

        Parameters
        ----------
        toml_path: str or Path
            Path to TOML file containing Modflow6Simulation data.

        Returns
        -------
        Modflow6Simulation
            Modflow6Simulation object with models and packages loaded from
            the files listed in the TOML file.

        Examples
        --------
        Dump simulation to directory:

        >>> mf6_sim.dump("path/to/directory")

        You can load the dumped simulation back with:

        >>> loaded_sim = Modflow6Simulation.from_file("path/to/directory/simulation_name.toml")
        """
        loadable_classes = (
            GroundwaterFlowModel,
            GroundwaterTransportModel,
            imod.mf6.TimeDiscretization,
            imod.mf6.Solution,
            imod.mf6.GWFGWF,
            imod.mf6.GWFGWT,
            imod.mf6.GWTGWT,
        )
        # The TOML file refers to classes by name.
        classes = {item_cls.__name__: item_cls for item_cls in loadable_classes}

        toml_path = pathlib.Path(toml_path)
        with open(toml_path, "rb") as f:
            toml_content = tomli.load(f)

        # The version entry is not a simulation item: take it out and log it.
        log_versions(toml_content.pop("version", None))

        data_dir = toml_path.parent
        exchange_keys = ("gwtgwf_exchanges", "split_exchanges")
        simulation = Modflow6Simulation(name=toml_path.stem)
        for key, entry in toml_content.items():
            if key in exchange_keys:
                # entry maps exchange class name -> list of file names
                simulation[key] = []
                for exchange_class, exchange_list in entry.items():
                    item_cls = classes[exchange_class]
                    for filename in exchange_list:
                        simulation[key].append(item_cls.from_file(data_dir / filename))
            else:
                # key is a class name, entry maps item name -> file name
                item_cls = classes[key]
                for name, filename in entry.items():
                    simulation[name] = item_cls.from_file(data_dir / filename)

        return simulation



[docs]
    def get_exchange_relationships(self) -> list:
        """
        Get exchange relationships in the simulation.

        Returns
        -------
        list
            List with exchange relationships in the simulation.
        """
        result = []

        if "gwtgwf_exchanges" in self:
            for exchange in self["gwtgwf_exchanges"]:
                result.append(exchange.get_specification())

        # exchange for splitting models
        if self.is_split():
            for exchange in self["split_exchanges"]:
                result.append(exchange.get_specification())
        return result



[docs]
    def get_models_of_type(self, model_id) -> dict[str, IModel]:
        """
        Get all models in the simulation of a specific type.

        Parameters
        ----------
        model_id: str
            Model type identifier, e.g. "gwf6" for groundwater flow models,
            "gwt6" for groundwater transport models.

        Returns
        -------
        dict[str, Modflow6Model]
            Dictionary with model names as keys and Modflow6Model objects as values.
        """
        return {
            k: v
            for k, v in self.items()
            if isinstance(v, Modflow6Model) and (v.model_id == model_id)
        }



[docs]
    def get_models(self) -> dict[str, IModel]:
        """
        Get all models in the simulation.

        Returns
        -------
        dict[str, Modflow6Model]
            Dictionary with model names as keys and Modflow6Model objects as values.
        """
        return {k: v for k, v in self.items() if isinstance(v, Modflow6Model)}



[docs]
    @standard_log_decorator()
    def clip_box(
        self,
        time_min: Optional[cftime.datetime | np.datetime64 | str] = None,
        time_max: Optional[cftime.datetime | np.datetime64 | str] = None,
        layer_min: Optional[int] = None,
        layer_max: Optional[int] = None,
        x_min: Optional[float] = None,
        x_max: Optional[float] = None,
        y_min: Optional[float] = None,
        y_max: Optional[float] = None,
        states_for_boundary: Optional[dict[str, GridDataArray]] = None,
    ) -> Modflow6Simulation:
        """
        Clip a simulation by a bounding box (time, layer, y, x).

        Parameters
        ----------
        time_min: optional, np.datetime64
            Start time to select. Data will be forward filled to this date. If
            time_min is before the start time of the dataset, data is
            backfilled.
        time_max: optional
            End time to select.
        layer_min: optional, int
            Minimum layer to select.
        layer_max: optional, int
            Maximum layer to select.
        x_min: optional, float
            Minimum x-coordinate to select.
        x_max: optional, float
            Maximum x-coordinate to select.
        y_min: optional, float
            Minimum y-coordinate to select.
        y_max: optional, float
            Maximum y-coordinate to select.
        states_for_boundary : optional, Dict[str, Union[xr.DataArray, xu.UgridDataArray]]
            A dictionary with model names as keys and grids with states that are
            used to put as boundary values.
            :class:`imod.mf6.GroundwaterFlowModel` will get a
            :class:`imod.mf6.ConstantHead`,
            :class:`imod.mf6.GroundwaterTransportModel` will get a
            :class:`imod.mf6.ConstantConcentration` package.

        Returns
        -------
        clipped : Simulation

        Examples
        --------
        Slicing intervals may be half-bounded, by providing None:

        To select 500.0 <= x <= 1000.0:

        >>> mf6_sim.clip_box(x_min=500.0, x_max=1000.0)

        To select x <= 1000.0:

        >>> mf6_sim.clip_box(x_max=1000.0)``

        To select x >= 500.0:

        >>> mf6_sim.clip_box(x_min=500.0)

        To select a time interval, you can use datetime64:

        >>> mf6_sim.clip_box(time_min=np.datetime64("2020-01-01"), time_max=np.datetime64("2020-12-31"))

        To clip an area and set a boundary condition at the clipped boundary:

        >>> states_for_boundary = {"GWF6_model_name": heads}
        >>> clipped_sim = mf6_sim.clip_box(
        ...     x_min=500.0, x_max=1000.0, y_min=500.0, y_max=1000.0,
        ...     states_for_boundary=states_for_boundary
        ... )
        """

        if self.is_split():
            raise RuntimeError(
                "Unable to clip simulation. Clipping can only be done on simulations that haven't been split."
                + "Therefore clipping should be done before splitting the simulation."
            )
        if not self._has_one_flow_model():
            raise ValueError(
                "Unable to clip simulation. Clipping can only be done on simulations that have a single flow model ."
            )
        for model_name, model in self.get_models().items():
            supported, error_with_object = model._is_clipping_supported()
            if not supported:
                raise ValueError(
                    f"simulation cannot be clipped due to presence of package '{error_with_object}' in model '{model_name}'"
                )

        clipped = type(self)(name=self.name)
        for key, value in self.items():
            state_for_boundary = (
                None if states_for_boundary is None else states_for_boundary.get(key)
            )
            if isinstance(value, Modflow6Model):
                clipped[key] = value.clip_box(
                    time_min=time_min,
                    time_max=time_max,
                    layer_min=layer_min,
                    layer_max=layer_max,
                    x_min=x_min,
                    x_max=x_max,
                    y_min=y_min,
                    y_max=y_max,
                    state_for_boundary=state_for_boundary,
                )
            elif isinstance(value, Package):
                clipped[key] = value.clip_box(
                    time_min=time_min,
                    time_max=time_max,
                    layer_min=layer_min,
                    layer_max=layer_max,
                    x_min=x_min,
                    x_max=x_max,
                    y_min=y_min,
                    y_max=y_max,
                )
            elif isinstance(value, list) and all(
                isinstance(item, GWFGWT) for item in value
            ):
                continue
            else:
                raise ValueError(
                    f"object {key} of type {type(value)} cannot be clipped."
                )
        return clipped



[docs]
    def create_partition_labels(
        self,
        npartitions: int,
        weights: Optional[GridDataArray] = None,
    ) -> GridDataArray:
        """
        Returns a label array: a 2d array with a similar size to the top layer of
        idomain. Every array element is the partition number to which the column of
        gridblocks of idomain at that location belong. This is provided to
        :meth:`imod.mf6.Modflow6Simulation.split` to partition the model.

        Parameters
        ----------
        npartitions : int
            The number of partitions to create.
        weights : xarray.DataArray, xugrid.UgridDataArray, optional
            The weights to use for partitioning. The weights should be a 2d
            array with the same size as the top layer of idomain. The weights
            are used to determine the size of each partition. The weights should
            be positive integers. If not provided, active cells (idomain > 0)
            are summed across layers and passed on as weights. If None, the
            idomain is used to compute weights.

        Returns
        -------
        xarray.DataArray or xu.UgridDataArray
            An array with partition labels, with the same shape as the top layer
            of the idomain.

        Examples
        --------
        Create a partition label array with 4 partitions.

        >>> label_array = mf6_sim.create_partition_labels(n_partitions=4)

        You can then use this label array to split the simulation:

        >>> mf6_splitted = mf6_sim.split(label_array)

        You can also provide weights to the partitioning, which will influence
        the size of each partition. For example, if you want to create a uniform
        partitioning, you can use:

        >>> weights = xr.ones_like(idomain)
        >>> label_array = mf6_sim.create_partition_labels(n_partitions=4, weights=weights)

        """
        gwf_models = self.get_models_of_type("gwf6")
        if len(gwf_models) != 1:
            raise ValueError(
                "for partitioning a simulation to work, it must have exactly 1 flow model"
            )

        flowmodel = list(gwf_models.values())[0]
        idomain = flowmodel.domain
        return create_partition_labels(idomain, npartitions, weights=weights)



[docs]
    @standard_log_decorator()
    def split(
        self,
        submodel_labels: GridDataArray,
        ignore_time_purge_empty: Optional[bool] = None,
    ) -> Modflow6Simulation:
        """
        Split a simulation in different partitions using a submodel_labels
        array.

        Parameters
        ----------
        submodel_labels: xr.DataArray or xu.UgridDataArray
            A grid that defines how the simulation will be split. The array
            should have the same topology as the domain being split, i.e.
            similar shape as a layer in the domain. The values in the array
            indicate to which partition a cell belongs. The values should be
            zero or greater.
        ignore_time_purge_empty: bool, default None
            If True, only the first timestep is validated. This increases
            performance for packages with a time dimensions over which changes
            of cell activity are not expected. If None, the value of the
            validation context is of the simulation is used.

        Returns
        -------
        Modflow6Simulation
            A new simulation containing all the split models and packages

        Examples
        --------
        >>> submodel_labels = mf6_sim.create_partition_labels(n_partitions=4)
        >>> m6_splitted = mf6_sim.split(submodel_labels)
        """
        if self.is_split():
            raise RuntimeError(
                "Unable to split simulation. Splitting can only be done on simulations that haven't been split."
            )

        if not self._has_one_flow_model():
            raise ValueError(
                "splitting of simulations with more (or less) than 1 flow model currently not supported."
            )
        if ignore_time_purge_empty is None:
            ignore_time_purge_empty = self._validation_context.ignore_time

        transport_models = self.get_models_of_type("gwt6")
        flow_models = self.get_models_of_type("gwf6")
        if not any(flow_models) and not any(transport_models):
            raise ValueError("a simulation without any models cannot be split.")

        original_models = {**flow_models, **transport_models}
        for model_name, model in original_models.items():
            supported, error_with_object = model._is_splitting_supported()
            if not supported:
                raise ValueError(
                    f"simulation cannot be split due to presence of package '{error_with_object}' in model '{model_name}'"
                )

        original_packages = get_packages(self)

        partition_info = create_partition_info(submodel_labels)

        exchange_creator: ExchangeCreator_Unstructured | ExchangeCreator_Structured
        if is_unstructured(submodel_labels):
            exchange_creator = ExchangeCreator_Unstructured(
                submodel_labels, partition_info
            )
        else:
            exchange_creator = ExchangeCreator_Structured(
                submodel_labels, partition_info
            )

        new_simulation = imod.mf6.Modflow6Simulation(f"{self.name}_partioned")
        for package_name, package in {**original_packages}.items():
            new_simulation[package_name] = deepcopy(package)

        for model_name, model in original_models.items():
            solution_name = self.get_solution_name(model_name)
            solution = cast(Solution, new_simulation[solution_name])
            solution._remove_model_from_solution(model_name)
            for submodel_partition_info in partition_info:
                new_model_name = f"{model_name}_{submodel_partition_info.id}"
                new_simulation[new_model_name] = slice_model(
                    submodel_partition_info, model
                )
                new_simulation[new_model_name].purge_empty_packages(
                    ignore_time=ignore_time_purge_empty
                )
                solution._add_model_to_solution(new_model_name)

        exchanges: list[Any] = []

        for flow_model_name, flow_model in flow_models.items():
            exchanges += exchange_creator.create_gwfgwf_exchanges(
                flow_model_name, flow_model.domain.layer
            )

        if any(transport_models):
            for tpt_model_name in transport_models:
                exchanges += exchange_creator.create_gwtgwt_exchanges(
                    tpt_model_name, flow_model_name, model.domain.layer
                )
        new_simulation._add_modelsplit_exchanges(exchanges)
        new_simulation._update_buoyancy_packages()
        new_simulation._set_flow_exchange_options()
        new_simulation._set_transport_exchange_options()
        new_simulation._update_ssm_packages()

        new_simulation._filter_inactive_cells_from_exchanges()
        return new_simulation



[docs]
    @standard_log_decorator()
    def regrid_like(
        self,
        regridded_simulation_name: str,
        target_grid: GridDataArray,
        validate: bool = True,
    ) -> "Modflow6Simulation":
        """
        Create a new simulation with the models of this simulation regridded
        to a target grid.

        The models contained in the new simulation are regridded versions of
        the models in this simulation (``self``). Time discretization and
        solver settings are copied. All work is delegated to
        ``imod.common.utilities.regrid._regrid_like``.

        Parameters
        ----------
        regridded_simulation_name: str
            name given to the output simulation
        target_grid: xr.DataArray or xu.UgridDataArray
            discretization onto which the models in this simulation will be
            regridded
        validate: bool
            set to True to validate the regridded packages

        Returns
        -------
        a new simulation object with regridded models

        Examples
        --------
        >>> target_grid = imod.util.empty_2d(
        ...     dx=5.0, xmin=500.0, xmax=1000.0, dy=5.0, ymin=500.0, ymax=1000.0
        ... )
        >>> regridded_sim = simulation.regrid_like(
        ...     regridded_simulation_name="regridded_sim",
        ...     target_grid=target_grid,
        ... )
        """

        return _regrid_like(self, regridded_simulation_name, target_grid, validate)


    def _add_modelsplit_exchanges(self, exchanges_list: list[GWFGWF]) -> None:
        if not self.is_split():
            self["split_exchanges"] = []
        self["split_exchanges"].extend(exchanges_list)

    def _set_flow_exchange_options(self) -> None:
        """
        Set the options of every GWFGWF split exchange.

        The options are taken from the first model of each exchange: budget
        output from its output control package, the dewatered, variable
        vertical conductance and xt3d settings from its node property flow
        package, and the newton setting from the model itself. Exchanges of
        other types are left untouched.
        """
        for exchange in self["split_exchanges"]:
            if not isinstance(exchange, GWFGWF):
                continue
            model_name_1 = exchange.dataset["model_name_1"].values[()]
            model_1 = self[model_name_1]
            # Package keys are chosen by the user, so look the packages up by
            # package id. Falling back to the conventional key keeps the
            # original KeyError when a package is missing.
            oc_package = model_1[model_1._get_pkgkey("oc") or "oc"]
            npf_package = model_1[model_1._get_pkgkey("npf") or "npf"]
            exchange.set_options(
                save_flows=oc_package.is_budget_output,
                dewatered=npf_package.is_dewatered,
                variablecv=npf_package.is_variable_vertical_conductance,
                xt3d=npf_package.get_xt3d_option(),
                newton=model_1.is_use_newton(),
            )

    def _set_transport_exchange_options(self) -> None:
        """
        Set the options of every GWTGWT split exchange.

        The options are taken from the first model of each exchange: budget
        output from its output control package, the scheme from its advection
        package and the xt3d settings from its dispersion package. Options of
        an absent advection or dispersion package are passed as None.
        Exchanges of other types are left untouched.
        """
        for exchange in self["split_exchanges"]:
            if not isinstance(exchange, GWTGWT):
                continue
            model_name_1 = exchange.dataset["model_name_1"].values[()]
            model_1 = self[model_name_1]
            advection_key = model_1._get_pkgkey("adv")
            dispersion_key = model_1._get_pkgkey("dsp")
            # Package keys are chosen by the user, so look up output control
            # by package id as well. Falling back to the conventional key
            # keeps the original KeyError when the package is missing.
            oc_key = model_1._get_pkgkey("oc") or "oc"

            scheme = None
            xt3d_off = None
            xt3d_rhs = None
            if advection_key is not None:
                scheme = model_1[advection_key].dataset["scheme"].values[()]
            if dispersion_key is not None:
                dispersion_dataset = model_1[dispersion_key].dataset
                xt3d_off = dispersion_dataset["xt3d_off"].values[()]
                xt3d_rhs = dispersion_dataset["xt3d_rhs"].values[()]
            exchange.set_options(
                save_flows=model_1[oc_key].is_budget_output,
                adv_scheme=scheme,
                dsp_xt3d_off=xt3d_off,
                dsp_xt3d_rhs=xt3d_rhs,
            )

    def _filter_inactive_cells_from_exchanges(self) -> None:
        for ex in self["split_exchanges"]:
            for i in [1, 2]:
                self._filter_inactive_cells_exchange_domain(ex, i)

    def _filter_inactive_cells_exchange_domain(self, ex: GWFGWF, i: int) -> None:
        """
        Filters inactive cells from one exchange domain inplace.

        Parameters
        ----------
        ex:
            Exchange of which the dataset is filtered.
        i: int
            Number of the model in the exchange (1 or 2) whose domain is
            used to decide which exchange cells are kept.
        """
        modelname = ex[f"model_name_{i}"].values[()]
        domain = self[modelname].domain

        # The exchange indices are shifted by one before they are used for
        # positional selection -- presumably they are stored one-based.
        layer_index = ex.dataset["layer"] - 1
        cell_index = ex.dataset[f"cell_id{i}"] - 1
        if is_unstructured(domain):
            exchange_cells = {"layer": layer_index, "mesh2d_nFaces": cell_index}
        else:
            cell_dim = f"cell_dims{i}"
            exchange_cells = {
                "layer": layer_index,
                "y": cell_index.sel({cell_dim: f"row_{i}"}),
                "x": cell_index.sel({cell_dim: f"column_{i}"}),
            }

        # Domain values at the exchange cells; only entries with a value
        # greater than zero are kept in the exchange dataset.
        domain_at_exchange = domain.isel(exchange_cells)
        active_at_exchange = domain_at_exchange.where(domain_at_exchange > 0).dropna(
            "index"
        )
        ex.dataset = ex.dataset.sel(index=active_at_exchange["index"])

    def get_solution_name(self, model_name: str) -> Optional[str]:
        for k, v in self.items():
            if isinstance(v, Solution):
                if model_name in v.dataset["modelnames"]:
                    return k
        return None

    def __repr__(self) -> str:
        typename = type(self).__name__
        INDENT = "    "
        attrs = [
            f"{typename}(",
            f"{INDENT}name={repr(self.name)},",
            f"{INDENT}directory={repr(self.directory)}",
        ]
        items = [
            f"{INDENT}{repr(key)}: {type(value).__name__},"
            for key, value in self.items()
        ]
        # Place the emtpy dict on the same line. Looks silly otherwise.
        if items:
            content = attrs + ["){"] + items + ["}"]
        else:
            content = attrs + ["){}"]
        return "\n".join(content)

    def _get_transport_models_per_flow_model(self) -> dict[str, list[str]]:
        flow_models = self.get_models_of_type("gwf6")
        transport_models = self.get_models_of_type("gwt6")
        # exchange for flow and transport
        result = collections.defaultdict(list)

        for flow_model_name in flow_models:
            flow_model = self[flow_model_name]
            for tpt_model_name in transport_models:
                tpt_model = self[tpt_model_name]
                if is_equal(tpt_model.domain, flow_model.domain):
                    result[flow_model_name].append(tpt_model_name)
        return result

    def _generate_gwfgwt_exchanges(self) -> list[GWFGWT]:
        exchanges = []
        flow_transport_mapping = self._get_transport_models_per_flow_model()
        for flow_name, tpt_models_of_flow_model in flow_transport_mapping.items():
            if len(tpt_models_of_flow_model) > 0:
                for transport_model_name in tpt_models_of_flow_model:
                    exchanges.append(GWFGWT(flow_name, transport_model_name))

        return exchanges

    def _update_ssm_packages(self) -> None:
        flow_transport_mapping = self._get_transport_models_per_flow_model()
        for flow_name, tpt_models_of_flow_model in flow_transport_mapping.items():
            flow_model = self[flow_name]
            for tpt_model_name in tpt_models_of_flow_model:
                tpt_model = self[tpt_model_name]
                ssm_key = tpt_model._get_pkgkey("ssm")
                if ssm_key is not None:
                    old_ssm_package = tpt_model.pop(ssm_key)
                    state_variable_name = old_ssm_package.dataset[
                        "auxiliary_variable_name"
                    ].values[0]
                    ssm_package = SourceSinkMixing.from_flow_model(
                        flow_model, state_variable_name, is_split=self.is_split()
                    )
                    if ssm_package is not None:
                        tpt_model[ssm_key] = ssm_package

    def _update_buoyancy_packages(self) -> None:
        flow_transport_mapping = self._get_transport_models_per_flow_model()
        for flow_name, tpt_models_of_flow_model in flow_transport_mapping.items():
            flow_model = cast(GroundwaterFlowModel, self[flow_name])
            flow_model._update_buoyancy_package(tpt_models_of_flow_model)


[docs]
    def is_split(self) -> bool:
        """
        Check if the simulation is split into multiple partitions.

        Returns
        -------
        bool
            True if the simulation is split, False otherwise.
        """
        return "split_exchanges" in self.keys()


    def _has_one_flow_model(self) -> bool:
        flow_models = self.get_models_of_type("gwf6")
        return len(flow_models) == 1


[docs]
    @standard_log_decorator()
    def mask_all_models(
        self,
        mask: GridDataArray,
    ) -> None:
        """
        Apply a mask to all models in the simulation, inplace.

        This function applies a mask to all models in a simulation, provided
        they use the same discretization. The method parameter "mask" is an
        idomain-like array. As described under Parameters, cells where the
        mask is 0 become inactive and cells where the mask is <0 become
        vertical passthrough. Where the mask is >0, the original value of
        idomain will be kept. Masking will update the packages accordingly,
        blanking their input where needed, and is therefore not a reversible
        operation. All work is delegated to
        ``imod.common.utilities.mask._mask_all_models``.

        Parameters
        ----------
        mask: xr.DataArray, xu.UgridDataArray of ints
            idomain-like integer array. >0 sets cells to active, 0 sets cells to inactive,
            <0 sets cells to vertical passthrough

        Examples
        --------
        To mask all models in a simulation, you can use the following code:

        >>> mf6_sim.mask_all_models(new_idomain)

        This masks the model inplace and updates the packages accordingly. The
        mask should be an idomain-like array, i.e. it should have the same shape
        as the model and contain integer values.
        """
        _mask_all_models(self, mask)



[docs]
    @classmethod
    @standard_log_decorator()
    def from_imod5_data(
        cls,
        imod5_data: dict[str, dict[str, GridDataArray]],
        period_data: dict[str, list[datetime]],
        times: list[datetime],
        allocation_options: Optional[SimulationAllocationOptions] = None,
        distributing_options: Optional[SimulationDistributingOptions] = None,
        regridder_types: Optional[dict[str, DataclassType]] = None,
    ) -> "Modflow6Simulation":
        """
        Imports a GroundwaterFlowModel (GWF) from the data in an iMOD5 project
        file and puts it in a simulation. Quasi-3D iMOD5 models, i.e. models
        where there is only horizontal flow in aquifers and vertical flow in
        aquitards, are not supported.

        This method adds all static and boundary condition packages from the
        projectfile to the simulation. Output Control (OC) must be added
        manually after importing. The
        :func:`imod.mf6.ims.SolutionPresetModerate` solver settings are added
        automatically to the simulation under the "ims" key, but these can be
        overridden by the user after importing. The imported model is stored
        under the "imported_model" key.

        Strict well validation and strict HFB validation are switched off on
        the returned simulation.

        The simulation is created through ``cls``, so calling this method on a
        subclass returns an instance of that subclass.

        Parameters
        ----------
        imod5_data: dict[str, dict[str, GridDataArray]]
            dictionary containing the arrays mentioned in the project file as xarray datasets,
            under the key of the package type to which it belongs.
        period_data: dict[str, list[datetime]]
            dictionary containing the package names mapped to a list of repeated
            stress periods. These are set as ``repeat_stress``.
        times:  list[datetime]
            time discretization of the model to be imported. This is used for
            the following:

                * Times of wells with associated timeseries are resampled to these times
                * Start and end times in the list are used to repeat the stresses
                  of periodic data (e.g. river stages in iMOD5 for "summer", "winter")
                * The simulation is discretized to these times, using
                  :meth:`imod.mf6.Modflow6Simulation.create_time_discretization`

        allocation_options: SimulationAllocationOptions, optional
            object containing the allocation options per package type. If you
            want a specific package to have a different allocation option, then
            it should be imported separately. Defaults to
            ``SimulationAllocationOptions()``.
        distributing_options: SimulationDistributingOptions, optional
            object containing the conductivity distribution options per package
            type. If you want a package to have a different distribution
            option, then it should be imported separately. Defaults to
            ``SimulationDistributingOptions()``.
        regridder_types: dict[str, DataclassType], optional
            the key is the package name. The value is the dataclass object
            containing the settings for regridding the package with the
            specified key. Defaults to an empty dictionary.

        Returns
        -------
        Modflow6Simulation
            Simulation prepared for MODFLOW6

        Examples
        --------
        Open projectfile data first:

        >>> from imod.formats.prj import open_projectfile_data
        >>> imod5_data, period_data = open_projectfile_data("path/to/projectfile")

        You can then import the simulation as follows:

        >>> from datetime import datetime
        >>> times = [datetime(2001, 1, 1), datetime(2002, 1, 1), datetime(2003, 1, 1)]
        >>> mf6_sim = imod.mf6.Modflow6Simulation.from_imod5_data(imod5_data, period_data, times)

        Allocate rivers differently:

        >>> from imod.prepare.topsystem import SimulationAllocationOptions, ALLOCATION_OPTION
        >>> allocation_options = SimulationAllocationOptions()
        >>> allocation_options.riv = ALLOCATION_OPTION.at_elevation
        >>> mf6_sim = imod.mf6.Modflow6Simulation.from_imod5_data(imod5_data, period_data, times, allocation_options)

        You can override solver settings if needed after importing. The
        solution is stored on the simulation, not on the model:

        >>> from imod.mf6.ims import SolutionPresetComplex
        >>> mf6_sim["ims"] = SolutionPresetComplex(["imported_model"])

        """
        if allocation_options is None:
            allocation_options = SimulationAllocationOptions()
        if distributing_options is None:
            distributing_options = SimulationDistributingOptions()
        if regridder_types is None:
            regridder_types = {}

        # Build through cls rather than a hard-coded class name, so subclasses
        # calling this alternate constructor get an instance of their own type.
        simulation = cls("imported_simulation")
        # Strict well and HFB validation are disabled for imported simulations.
        simulation._validation_context.strict_well_validation = False
        simulation._validation_context.strict_hfb_validation = False

        # import GWF model,
        gwf_model = GroundwaterFlowModel.from_imod5_data(
            imod5_data,
            period_data,
            times,
            allocation_options,
            distributing_options,
            regridder_types,
        )
        simulation["imported_model"] = gwf_model

        # generate ims package
        solution = SolutionPresetModerate(
            ["imported_model"],
            print_option="all",
        )
        simulation["ims"] = solution

        simulation.create_time_discretization(additional_times=times)
        return simulation