Source code for PyOCN.ocn

import warnings
import ctypes
from typing import Any, Callable, TYPE_CHECKING
from os import PathLike
from numbers import Number
from pathlib import Path

import networkx as nx 
import numpy as np
from tqdm import tqdm

from ._statushandler import check_status
from .utils import simulated_annealing_schedule, net_type_to_dag, unwrap_digraph
from . import _libocn_bindings as _bindings
from . import _flowgrid_convert as fgconv

if TYPE_CHECKING:
    import xarray as xr
    import rasterio

"""
High-level Optimized Channel Network (OCN) interface.

This module provides a high-level interface to the underlying
``libocn`` C library. The :class:`OCN` class can be used for 
constructing and optimizing river network models using 
simulated annealing.

Note
----
- The underlying data structure managed by :class:`OCN` is a FlowGrid owned by
    ``libocn``. Pointer lifetime and destruction are handled safely within this
    class.
- Many operations convert to a NetworkX ``DiGraph`` for convenience. These
    conversions are slow, and are intended for inspection, analysis, 
    and visualization rather than tight inner loops.

See Also
--------
PyOCN.utils
        Helper functions for OCN fitting and construction
PyOCN.plotting
        Helper functions for visualization and plotting
"""

# TODO: have to_rasterio use the option to set the root node to 0,0 by using to_xarray as the backend instead of numpy?





[docs]
class OCN:
    """
    The main class for interacting with Optimized Channel Networks. 

    Use :meth:`OCN.from_net_type` or :meth:`OCN.from_digraph` to construct an
    instance. 
    
    Methods
    -------------------
    from_net_type
        Create an OCN from a predefined network type and dimensions.
    from_digraph
        Create an OCN from an existing NetworkX DiGraph.
    to_digraph
        Export the current grid to a NetworkX DiGraph.
    to_numpy
        Export raster arrays (energy, drained area, elevation) as numpy arrays.
    to_xarray
        Export raster arrays as an xarray Dataset (requires xarray).
    to_gtiff
        Export raster arrays to a GeoTIFF file (requires rasterio).
    copy
        Create a deep copy of the OCN.
    single_erosion_event
        Perform a single erosion event at a given temperature.
    fit
        Optimize the network using the simulated annealing method from Carraro et al (2020).
    fit_custom_cooling
        Optimize the network using a custom cooling function.
    compute_energy
        Compute the current energy of the network.
    copy
        Create a deep copy of the OCN.

    Attributes
    ----------
    energy : float
        Current energy of the network (read-only property).
    dims : tuple[int, int]
        Grid dimensions (rows, cols) of the FlowGrid (read-only property).
    resolution: float
        The side length of each grid cell (read-only property).
    nroots : int
        Number of root nodes in the current OCN grid (read-only property).
    gamma : float
        Exponent in the energy model.
    verbosity : int
            Verbosity level (0-2). 0 is silent, 1 prints high-level progress messages, 2 prints detailed logging messages. Can be overridden in methods that support it.
    wrap : bool
        If true, enables periodic boundary conditions on the FlowGrid (read-only property).
    history : np.ndarray
        numpy array of shape (n_iterations, 3) recording the iteration index, energy, and temperature at each iteration during optimization.
        Updated each time an optimization method is called.
    rng : int
        the current random state of the internal RNG
    vertical_exaggeration : float
        Vertical exaggeration factor for the network. Used when computing elevation.
    

    Examples
    --------
    The following is a simple example of creating, optimizing, and plotting
    an OCN using PyOCN and Matplotlib. More examples are available in the
    `demo.ipynb` notebook in the repository (https://github.com/alextsfox/PyOCN).

    >>> # Fit an OCN from a "Hip-roof" initial network shape and periodic boundary conditions
    >>> import matplotlib.pyplot as plt
    >>> import matplotlib as mpl
    >>> import PyOCN as po
    >>> ocn = po.OCN.from_net_type("H", dims=(64, 64), wrap=True, random_state=8472, verbosity=0)
    >>> ocn.fit()
    >>> po.plot_ocn_raster(ocn, norm=mpl.colors.PowerNorm(gamma=0.5), attribute='drained_area')
    >>> plt.show()
    """

    ###########################
    #    CONSTRUCTORS         #
    ###########################

[docs]
    def __init__(self, dag: nx.DiGraph, resolution: float=1.0, gamma: float = 0.5, random_state=None, verbosity: int = 0, validate:bool=True, wrap : bool = False, vertical_exaggeration: float = 1.0):
        """
        Construct an :class:`OCN` from a valid NetworkX ``DiGraph``.

        Attention
        ---------
        Please use the classmethods :meth:`OCN.from_net_type` or
        :meth:`OCN.from_digraph` to instantiate an OCN.
        """
        
        # validate gamma, annealing schedule, and random_state
        if not isinstance(gamma, Number):
            raise TypeError(f"gamma must be a scalar. Got {type(gamma)}.")
        if not (0 <= gamma <= 1):
            warnings.warn(f"gamma values outside of [0, 1] may not be physically meaningful. Got {gamma}.")
        if not isinstance(resolution, Number):
            raise TypeError(f"resolution must be numeric. Got {type(resolution)}")
        
        self.verbosity = verbosity
        self.gamma = gamma
        self.__p_c_graph = fgconv.from_digraph(  # does most of the work 
            dag, 
            resolution, 
            verbose=(verbosity == 2), 
            validate=validate, 
            wrap=wrap
        )
        self.rng = random_state
        self.__p_c_graph.contents.energy = self.compute_energy()

        self.__history = np.empty((0, 3), dtype=np.float64)

        if not (isinstance(vertical_exaggeration, Number) and vertical_exaggeration >= 0):
            raise TypeError(f"vertical_exaggeration must be a number >= 0. Got {type(vertical_exaggeration)}")
        self.vertical_exaggeration = vertical_exaggeration




[docs]
    @classmethod
    def from_net_type(cls, net_type:str, dims:tuple[int, int], resolution:float=1, gamma : float = 0.5, random_state=None, verbosity:int=0, wrap : bool = False, vertical_exaggeration: float = 1.0):
        """
        Create an :class:`OCN` from a predefined network type and dimensions.

        Parameters
        ----------
        net_type : str
            Predefined network type to instantiate from. Valid types are "H", "I", "E", and "V". See
            :func:`~PyOCN.utils.net_type_to_dag` for more information.
        dims : tuple[int, int]
            Grid dimensions (rows, cols). Both must be positive even integers.
        resolution : int, optional
            The side length of each grid cell.
        gamma : float, default 0.5
            Exponent in the energy model.
        random_state : int | numpy.random.Generator | None, optional
            Seed or generator for RNG seeding.
        verbosity : int
            Verbosity level (0-2). 0 is silent, 1 prints high-level progress messages, 2 prints detailed logging messages. Can be overridden in methods that support it.
        wrap : bool, default False
            If true, allows wrapping around the edges of the grid (toroidal). If false, no wrapping is applied.
        vertical_exaggeration : float, default 1.0
            Vertical exaggeration factor for the network. Used when computing elevation.

        Returns
        -------
        OCN
            A newly constructed instance initialized from the specified
            network type and dimensions.
        """
        if not isinstance(dims, tuple):
            raise TypeError(f"dims must be a tuple of two positive integers, got {type(dims)}")
        if not (
            len(dims) == 2 
            and all(isinstance(d, int) and d > 0 for d in dims)
        ):
            raise ValueError(f"dims must be a tuple of two positive integers, got {dims}")
        
        if verbosity == 2:
            print(f"Creating {net_type} network DiGraph with dimensions {dims}...", end="")
        dag = net_type_to_dag(net_type, dims)
        if verbosity == 2:
            print(" Done.")
        
        # no need to validate inputs when using a predefined net_type. Saves time.
        return cls(dag, resolution, gamma, random_state, verbosity=verbosity, validate=False, wrap=wrap, vertical_exaggeration=vertical_exaggeration)



[docs]
    @classmethod
    def from_digraph(cls, dag: nx.DiGraph, resolution:float=1, gamma=0.5, random_state=None, verbosity: int = 0, wrap: bool = False, vertical_exaggeration: float = 1.0):
        """
        Create an :class:`OCN` from an existing NetworkX ``DiGraph``.

        Parameters
        ----------
        dag : nx.DiGraph
            Directed acyclic graph (DAG) representing the stream network.
        resolution : int, optional
            The side length of each grid cell.
        gamma : float, default 0.5
            Exponent in the energy model.
        random_state : int | numpy.random.Generator | None, optional
            Seed or generator for RNG seeding.
        verbosity : int
            Verbosity level (0-2). 0 is silent, 1 prints high-level progress messages, 2 prints detailed logging messages. Can be overridden in methods that support it.
        wrap : bool, default False
            If true, allows wrapping around the edges of the grid (toroidal). If false, no wrapping is applied.
        vertical_exaggeration : float, default 1.0
            Vertical exaggeration factor for the network. Used when computing elevation.

        Returns
        -------
        OCN
            A newly constructed instance encapsulating the provided graph.

        Important
        ---------
        The input graph must satisfy all of the following:

        - It is a directed acyclic graph (DAG).
        - Each node has attribute ``pos=(row:int, col:int)`` specifying its
          grid position with non-negative coordinates. Any other attributes
          are ignored.
        - The graph can be partitioned into one or more spanning trees over 
          a dense grid of shape ``(m, n)``: each grid cell corresponds to 
          exactly one node; each non-root node has ``out_degree == 1``; 
          the roots have ``out_degree == 0``.
        - Edges connect only to one of the 8 neighbors (cardinal or diagonal),
          i.e., no jumps over rows or columns. If ``wrap=True``, edges may
          connect across the grid boundaries (i.e. row 0 can connect to row m-1 and col 0 can connect to col n-1).
        - Edges do not cross in the row-column plane.
        - Both ``m`` and ``n`` are positive integers, and there are at least four
          vertices.

        Examples
        --------
        >>> # creating a "zig-zag" network
        >>> # O O O O
        >>> # |/|/|/|
        >>> # O O O X
        >>> import networkx as nx
        >>> import PyOCN as po
        >>> import matplotlib as mpl
        >>> dag = nx.DiGraph()
        >>> for i in range(8):
        ...     dag.add_node(i, pos=(i % 4, i // 4))
        ...     if i < 7: dag.add_edge(i, i + 1)
        >>> ocn = OCN.from_digraph(dag, random_state=8472)
        >>> ocn.fit()
        >>> po.plot_ocn_raster(ocn, norm=mpl.colors.PowerNorm(gamma=0.5), attribute='drained_area')
        >>> plt.show()
        """

        return cls(dag, resolution, gamma, random_state, verbosity=verbosity, validate=True, wrap=wrap, vertical_exaggeration=vertical_exaggeration)


    ###########################
    #    DUNDER METHODS       #
    ###########################
    def __repr__(self):
        return f"<PyOCN.OCN object at 0x{id(self):x}>\n<FlowGrid_C struct at 0x{ctypes.addressof(self.__p_c_graph.contents):x}>\n<Vertex_C array at 0x{ctypes.addressof(self.__p_c_graph.contents.vertices):x}>"
    def __str__(self):
        return f"OCN(gamma={self.gamma}, energy={self.energy}, dims={self.dims}, resolution={self.resolution}m, verbosity={self.verbosity})"
    def __del__(self):
        try:
            _bindings.libocn.fg_destroy(self.__p_c_graph)
            self.__p_c_graph = None
        except AttributeError:
            pass
    def __sizeof__(self) ->int:
        return (
            object.__sizeof__(self) +
            self.gamma.__sizeof__() +
            self.__history.nbytes +
            ctypes.sizeof(_bindings.FlowGrid_C) + 
            ctypes.sizeof(_bindings.Vertex_C)*(self.dims[0]*self.dims[1])
        )
    def __copy__(self) -> "OCN":
        """
        Create a deep copy of the OCN, including the underlying FlowGrid_C.
        Also copies the current RNG state. The new copy and the original
        will be independent from each other and behave identically statistically.

        If you want the copy to have a different random state, call :meth:`reseed`
        after copying.
        """
        cpy = object.__new__(type(self))
        cpy.gamma = self.gamma
        cpy.verbosity = self.verbosity
        
        cpy.__history = self.history.copy()

        cpy_p_c_graph = _bindings.libocn.fg_copy(self.__p_c_graph)
        if not cpy_p_c_graph:
            raise MemoryError("Failed to copy FlowGrid_C in OCN.__copy__")
        cpy.__p_c_graph = cpy_p_c_graph
        cpy.vertical_exaggeration = self.vertical_exaggeration
        return cpy

    def __deepcopy__(self, memo) -> "OCN":
        """
        Create a deep copy of the OCN, including the underlying FlowGrid_C.
        Also copies the current RNG state. The new copy and the original
        will be independent from each other and behave identically statistically.
        """
        return self.__copy__()
    

[docs]
    def copy(self) -> "OCN":
        """
        Create a deep copy of the OCN, including the underlying FlowGrid_C.
        Also copies the current RNG state. The new copy and the original
        will be independent from each other and behave identically statistically.
        """
        return self.__copy__()


    ###########################
    #    PROPERTIES           #
    ###########################

[docs]
    def compute_energy(self) -> float:
        """
        Compute the current energy of the network.

        Returns
        -------
        float
            The computed energy value.
        """
        return _bindings.libocn.ocn_compute_energy(self.__p_c_graph, self.gamma)

    
    @property
    def energy(self) -> float:
        return self.__p_c_graph.contents.energy
    @property
    def resolution(self) -> float:
        return self.__p_c_graph.contents.resolution
    @property
    def nroots(self) -> int:
        return int(self.__p_c_graph.contents.nroots)
    @property
    def dims(self) -> tuple[int, int]:
        return (
            int(self.__p_c_graph.contents.dims.row),
            int(self.__p_c_graph.contents.dims.col)
        )
    @property
    def wrap(self) -> bool:
        return self.__p_c_graph.contents.wrap
    @property
    def rng(self) -> int:
        s0, s1, s2, s3 = self.__p_c_graph.contents.rng.s
        s = (s0 << 96) | (s1 << 64) | (s2 << 32) | s3
        return s
    
    @rng.setter
    def rng(self, random_state:int|None|np.random.Generator=None):
        if not isinstance(random_state, (int, np.integer, type(None), np.random.Generator)):
            raise ValueError("RNG must be initialized with an integer/Generator/None.")
        seed = np.random.default_rng(random_state).integers(0, int(2**32 - 1))
        rng = _bindings.rng_state_t()
        _bindings.libocn.rng_seed(ctypes.byref(rng), seed)
        self.__p_c_graph.contents.rng = rng

    @property
    def history(self) -> np.ndarray:
        """The optimization history as a numpy array of shape (n_iterations, 3).
        Each row corresponds to an iteration. The columns are iteration index, energy, and temperature."""
        return self.__history

    ###########################
    #    GRAPH TRAVERSAL      #
    ###########################
    # # Commenting out for now. May decide to re-introduce later
    # def predecessors(self, pos:tuple[int, int]) -> Generator[tuple[int, int], None, None]:
    #     """Returns an iterator over predecessor nodes of the node at position `pos` in the OCN.
    #     A predecessor is defined as an immediate upstream neighbor.

    #     A predecessor of a node n is a node m such that there exists a directed edge from m to n.

    #     Mirrors the behavior of `networkx.DiGraph.predecessors`, but works directly on the OCN C graph structure.

    #     Yields (row, col) of successors.

    #     Parameters
    #     ----------
    #     ocn : OCN
    #         The OCN instance.
    #     pos : tuple[int, int]
    #         The (row, col) position of the node whose predecessors are to be found.
        
    #     Raises
    #     -------
    #     TypeError
    #         If `pos` is not a tuple of two integers.
    #     IndexError
    #         If `pos` is out of bounds for the current OCN grid.

    #     See Also
    #     --------
    #     :meth:`OCN.successors`
    #     """

    #     pos = tuple(pos)
    #     if len(pos) != 2 or not all(isinstance(p, int) for p in pos):
    #         raise TypeError(f"Position must be a tuple of two integers. Got {pos}.")
    #     if (pos[0] < 0 or pos[0] >= self.dims[0]) or (pos[1] < 0 or pos[1] >= self.dims[1]):
    #         raise IndexError(f"Position {pos} is out of bounds for OCN with dimensions {self.dims}.")

    #     # convert (row, col) to linear index
    #     a = _bindings.libocn.fg_cart_to_lin(
    #         _bindings.CartPair_C(row=pos[0], col=pos[1]),
    #         _bindings.CartPair_C(row=self.dims[0], col=self.dims[1]),
    #     )

    #     upstream_indices = (_bindings.linidx_t * 8)()
    #     nupstream = _bindings.linidx_t()
    #     check_status(_bindings.libocn.fg_find_upstream_neighbors(
    #         upstream_indices, 
    #         ctypes.byref(nupstream),
    #         self.__p_c_graph, 
    #         _bindings.linidx_t(a)
    #     ))
    #     count = int(nupstream.value)

    #     # convert back to cartesian (row, col)
    #     for idx in upstream_indices[:count]:
    #         cart = _bindings.libocn.fg_lin_to_cart(
    #             idx, 
    #             _bindings.CartPair_C(row=self.dims[0], col=self.dims[1])
    #         )
    #         yield (int(cart.row), int(cart.col))


    # def successors(self, pos: tuple[int, int]) -> Generator[tuple[int, int], None, None]:
    #     """Returns an iterator over successor nodes of the node at position `pos` in the OCN.
    #     A successor is the immediate downstream neighbor (at most one; none if root).

    #     Mirrors the behavior of `networkx.DiGraph.successors`, but works directly on the OCN C graph structure.
    #     Yields (row, col) of successors.

    #     Parameters
    #     ----------
    #     pos : tuple[int, int]
    #         The (row, col) position of the node whose successors are to be found.
        
    #     Raises
    #     -------
    #     TypeError
    #         If `pos` is not a tuple of two integers.
    #     IndexError
    #         If `pos` is out of bounds for the current OCN grid.
    #     """
    #     pos = tuple(pos)
    #     if len(pos) != 2 or not all(isinstance(p, int) for p in pos):
    #         raise TypeError(f"Position must be a tuple of two integers. Got {pos}.")
    #     if (pos[0] < 0 or pos[0] >= self.dims[0]) or (pos[1] < 0 or pos[1] >= self.dims[1]):
    #         raise IndexError(f"Position {pos} is out of bounds for OCN with dimensions {self.dims}.")

    #     # (row, col) -> linear index
    #     a = _bindings.libocn.fg_cart_to_lin(
    #         _bindings.CartPair_C(row=pos[0], col=pos[1]),
    #         _bindings.CartPair_C(row=self.dims[0], col=self.dims[1]),
    #     )

    #     # Read vertex to get downstream direction
    #     vert = _bindings.Vertex_C()
    #     check_status(_bindings.libocn.fg_get_lin(
    #         ctypes.byref(vert),
    #         self.__p_c_graph,
    #         _bindings.linidx_t(a),
    #     ))

    #     # If root, no successors
    #     if int(vert.downstream) == _bindings.IS_ROOT:
    #         return
        
    #     cart = _bindings.libocn.fg_lin_to_cart(
    #         vert.adown, 
    #         _bindings.CartPair_C(row=self.dims[0], col=self.dims[1])
    #     )
    #     yield (int(cart.row), int(cart.col))        

    ###########################
    #    EXPORT               #
    ###########################

[docs]
    def to_digraph(self) -> nx.DiGraph:
        """
        Create a NetworkX ``DiGraph`` view of the current grid.

        Returns
        -------
        nx.DiGraph
        # TODO: implement elevation, length, slope, q
            A DAG with the following node attributes per node:

            - ``pos``: ``(row, col)`` grid position
            - ``drained_area``: drained area value
            - ``energy``: cumulative energy at the node
            - ``elevation``: elevation at the node

            and the following edge attributes per edge:
            - ``length``: length of the edge/link
            - ``slope``: slope of the edge/link
            - ``q``: the landscape-forming discharge through the edge/link

        """
        dag = fgconv.to_digraph(self.__p_c_graph.contents, self.gamma, self.vertical_exaggeration)

        node_energies = dict()

        for node in nx.topological_sort(dag):
            node_energies[node] = (
                dag.nodes[node]['drained_area']**self.gamma 
                + sum(node_energies[p] for p in dag.predecessors(node))
            )
        nx.set_node_attributes(dag, node_energies, 'energy')

        return dag

    

[docs]
    def to_gtiff(self, west:float, north:float, crs: Any, path:"str|PathLike|rasterio.io.MemoryFile", unwrap:bool=True):
        """
        Export a raster of the current FlowGrid to a GeoTIFF file
        using rasterio. The resulting raster has 3 bands: `energy`, `drained_area`, and `elevation`.

        Caution
        -------
        This uses the :attr:`resolution` attribute to set pixel size in the raster and for computing elevation.
        This function does not check for unit compatibility, so it is up to the user
        to ensure the resolution and CRS units match. By default,
        the resolution is set to 1.0 units. Using a lat-long (geographic) CRS may give undesireable results.
        It is recommended to use a linear (projected) CRS with units of length (e.g., meters) for best results.

        Parameters
        ----------
        west : float
            The western border of the raster in crs units, corresponding
            to column 0.
        north : float
            The northern border of the raster in crs units, corresponding
            to row 0.
        crs : Any
            The crs for the resulting gtiff, passed to `rasterio.open`
        path : str or Pathlike or rasterio.io.MemoryFile
            The output path for the resulting gtiff file. Can also be rasterio.io.MemoryFile. 
        unwrap : bool, default True
            If True and the current OCN has periodic boundaries, the
            resulting raster will be transformed so connected grid cells 
            are adjacent in the raster. This will result in a larger raster
            with some nan values. If False or the current OCN does not have
            periodic boundaries, then no transformation is applied and the
            raster will have the same dimensions as the current OCN grid.
        """
        try:
            import rasterio
            from rasterio.transform import from_origin
        except ImportError as e:
            raise ImportError(
                "PyOCN.OCN.to_gtiff() requires rasterio to be installed. Install with `pip install rasterio`."
            ) from e

        array = self.to_numpy(unwrap=unwrap)
        dims = array.shape[1:]
        energy = array[0]
        drained_area = array[1]
        elevation = array[2]

        transform = from_origin(west, north, self.resolution, self.resolution)

        # Write three bands: 1=energy, 2=drained_area, 3=elevation
        with rasterio.open(
            path,
            "w",
            driver="GTiff",
            height=dims[0],
            width=dims[1],
            count=3,
            dtype=np.float64,
            crs=crs,
            transform=transform,
            compress="deflate",
        ) as dst:
            dst.write(energy, 1)
            dst.write(drained_area, 2)
            dst.write(elevation, 3)
            # Band descriptions (nice to have)
            try:
                dst.set_band_description(1, "energy")
                dst.set_band_description(2, "drained_area")
                dst.set_band_description(3, "elevation")
            except Exception:
                pass

    

[docs]
    def to_numpy(self, unwrap:bool=True) -> np.ndarray:
        """
        Export the current FlowGrid to a numpy array with shape (3, rows, cols).
        Has three channels: 0=energy, 1=drained_area, 2=elevation.

        Parameters
        ----------
        unwrap : bool, default True
            If True and the current OCN has periodic boundaries, the
            resulting array will be transformed so connected grid cells 
            are adjacent in the array. This will result in a larger array
            with some nan values. If False or the current OCN does not have
            periodic boundaries, then no transformation is applied and the
            resulting array will have the same dimensions as the current OCN grid.
        """
        dag = self.to_digraph()
        dims = self.dims
        if self.wrap and unwrap:
            dag = unwrap_digraph(dag, dims)
            positions = np.array(list(nx.get_node_attributes(dag, 'pos').values()))
            max_r, max_c = positions.max(axis=0)
            dims = (max_r + 1, max_c + 1)

        energy = np.full(dims, np.nan)
        drained_area = np.full(dims, np.nan)
        elevation = np.full(dims, np.nan)
        for node in dag.nodes:
            r, c = dag.nodes[node]['pos']
            energy[r, c] = dag.nodes[node]['energy']
            drained_area[r, c] = dag.nodes[node]['drained_area']
            elevation[r, c] = dag.nodes[node]['elevation']
        return np.stack([energy, drained_area, elevation], axis=0)



[docs]
    def to_xarray(self, unwrap:bool=True) -> "xr.Dataset":
        """
        Export the current FlowGrid to an xarray Dataset
        
        Parameters
        ----------
        unwrap : bool, default True
            If True and the current OCN has periodic boundaries, the
            resulting rasters will be transformed so connected grid cells
            are adjacent in the output. This will result in a larger raster
            with some nan values. If False or the current OCN does not have
            periodic boundaries, then no transformation is applied and the
            resulting raster will have the same dimensions as the current OCN grid.
            
            When unwrapping, the (0,0) coordinate
            will be set to the position of the "main" root node, defined as
            the root node with the smallest row*cols + col value. Otherwise,
            (0,0) will be the top-left corner of the grid.
        
        Returns
        -------
        xr.Dataset
         an xarray Dataset with data variables:
            - `energy` (np.float64) representing energy at each grid cell
            - `area` (np.float64) representing drained area at each grid cell
            - `elevation` (np.float64) representing elevation at each grid cell
        and coordinates:
            - `y` (float) representing the northing coordinate of each row.
            - `x` (float) representing the easting coordinate of each column.
        """

        try:
            import xarray as xr
        except ImportError as e:
            raise ImportError(
                "PyOCN.OCN.to_xarray() requires xarray to be installed. Install with `pip install xarray`."
            ) from e
        
        dims = self.dims

        dag = self.to_digraph()
        row_root, col_root = 0, 0
        if self.wrap and unwrap:
            roots = [n for n, d in dag.out_degree() if d==0]
            main_root = min(roots, key=lambda n: dag.nodes[n]['pos'][0]*dims[1] + dag.nodes[n]['pos'][1])
            
            dag = unwrap_digraph(dag, dims)
            positions = np.array(list(nx.get_node_attributes(dag, 'pos').values()))
            max_r, max_c = positions.max(axis=0)
            dims = (max_r + 1, max_c + 1)
            
            # compute the new position of the root node after unwrapping. This will be the new origin (0,0).
            row_root, col_root = dag.nodes[main_root]['pos']

        energy = np.full(dims, np.nan)
        drained_area = np.full(dims, np.nan)
        elevation = np.full(dims, np.nan)
        for node in dag.nodes:
            r, c = dag.nodes[node]['pos']
            energy[r, c] = dag.nodes[node]['energy']
            drained_area[r, c] = dag.nodes[node]['drained_area']
            elevation[r, c] = dag.nodes[node]['elevation']
        array_out = np.stack([energy, drained_area, elevation], axis=0)

        dims = array_out.shape[1:]

        return xr.Dataset(
            data_vars={
                "energy": (["y", "x"], array_out[0].astype(np.float64)),
                "area": (["y", "x"], array_out[1].astype(np.float64)),
                "elevation": (["y", "x"], array_out[2].astype(np.float64)),
            },
            coords={
                "y": ("y", np.linspace(-row_root, (-row_root + (dims[0]-1)), dims[0])*self.resolution),
                "x": ("x", np.linspace(-col_root, (-col_root + (dims[1]-1)), dims[1])*self.resolution),
            },
            attrs={
                "description": "OCN fit result arrays",
                "resolution": self.resolution,
                "gamma": self.gamma,
                "rng": self.rng,
                "wrap": self.wrap,
            }
        )


    ###########################
    #    OPTIMIZATION         #
    ###########################

[docs]
    def single_iteration(self, temperature:float, array_report:bool=False, unwrap:bool=True, calculate_full_energy:bool=False) -> "xr.Dataset | None":
        """ 
        Perform a single iteration of the optimization algorithm at a given temperature. Updates the internal history attribute.
        See :meth:`fit` for details on the algorithm.

        Parameters
        ----------
        temperature : float
            Temperature parameter governing acceptance probability. Typical
            range is a fraction of ocn.energy.
        array_report : bool, default False
            If True (default), the returned result will be an xarray.Dataset.
            See :meth:`fit` for details. The returned object will have an iteration dimension of size 1.
            Requires xarray to be installed.
        unwrap : bool, default True
            If True and the current OCN has periodic boundaries, the
            resulting rasters will be transformed so connected grid cells
            are adjacent in the output. This will result in a larger raster
            with some nan values. If False or the current OCN does not have
            periodic boundaries, then no transformation is applied and the
            resulting raster will have the same dimensions as the current OCN grid.
        calculate_full_energy : bool, default False
            If True, the full energy of the graph is recalculated when considering
            the proposed change. If False, a more efficient incremental update is used.
            Small numerical differences may arise between the two methods due to floating point
            precision. If precision is of the utmost importance, set this to True, but note that
            this comes with a significant performance penalty.

        Returns
        -------
        xr.Dataset | None
            If ``array_report == True``, an xarray.Dataset containing the state of the FlowGrid
            after the iteration. See :meth:`to_xarray` for details. If ``array_report == False``, returns None.

        Raises
        ------
        LibOCNError
            If the underlying C routine reports an error status.
        """
        # FlowGrid *G, uint32_t *total_tries, double gamma, double temperature
        check_status(_bindings.libocn.ocn_single_erosion_event(
            self.__p_c_graph,
            self.gamma, 
            temperature,
            calculate_full_energy
        ))

        # append to history
        last_iteration = self.__history[-1, 0] if self.__history.shape[0] else 0
        history = np.array([last_iteration + 1, self.energy, temperature]).reshape((1, 3))
        self.__history = np.concatenate((self.__history, history), axis=0)
        
        if not array_report:
            return None

        ds = self.to_xarray(unwrap=unwrap)
        ds = ds.expand_dims({"iteration": [0]})

        return ds

    

[docs]
    def fit(
        self,
        cooling_rate:float=1.0,
        constant_phase:float=0.0,
        n_iterations:int=None,
        pbar:bool=False,
        array_reports:int=0,
        tol:float | None=None,
        max_iterations_per_loop=10_000,
        unwrap:bool=True,
        calculate_full_energy:bool=False) -> "xr.Dataset | None":
        """
        Convenience function to optimize the OCN using the simulated annealing algorithm from Carraro et al (2020).
        For finer control over the optimization process, use :meth:`fit_custom_cooling` or use :meth:`single_erosion_event` in a loop.

        This performs ``n_iterations`` erosion events, accepting or rejecting
        proposals according to a temperature schedule defined by the annealing algorithm. 
        A proposal consists of changing the outflow direction of a randomly selected vertex. 
        The new outflow direction is chosen uniformly from the valid neighbors.
        A proposal is valid if it maintains a well-formed graph structure.

        The :attr:`history` attribute is updated in-place after optimization finishes.

        Parameters
        ----------
        cooling_rate : float, default 1.0
            Cooling rate parameter in the annealing algorithm. Typical range is 0.5-1.5.
            Higher values result in faster cooling and a greedier search.
            Lower values result in slower cooling and more thorough exploration of the solution space, but slower convergence and lower stability.
        constant_phase : float, default 0.0
            Amount of time to hold temeprature constant at the start of the optimization.
            This is a fraction of n_iterations, and must be in the range [0, 1].
            A value of 0.0 (default) means the temperature starts cooling immediately
            from the initial temperature. A value of 1.0 means the temperature is held
            constant for the entire optimization.
        n_iterations : int, optional
            defaults to ``int((63 * exp(-0.448 * cooling_rate)) * rows * cols * (1 + constant_phase))``, which was empirically found to work well across a range of cooling rates.
            When ``constant_phase = 1`` and ``constant_phase = 0``, this reduces to ``40 * rows * cols``.
            Clamped to at least ``energy_reports * 10`` (this should only matter for
            extremely small grids, where ``rows * cols < 256``).
        pbar : bool, default True
            Whether to display a progress bar.
        array_reports : int, default 0
            Number of timepoints (approximately) at which to save the state of the FlowGrid.
            If 0 (default), returns None. If >0, returns an xarray.Dataset
            containing the state of the FlowGrid at approximately evenly spaced intervals
            throughout the optimization, including the initial and final states. Requires xarray to be installed. See notes on xarray output for details.
        tol : float | None, optional
            If provided, optimization will stop early if the average relative energy reduction per iteration is less than `tol` for two consecutive checks. Must be positive.
            If None, no early stopping is performed.
            Recommended values are in the range 1e-9 to 1e-6 per iteration. A good default is 3.2e-8.
        max_iterations_per_loop: int, optional
            If provided, the number of iterations steps to perform in each "chunk"
            of optimization. Energy and output arrays can be reported no more often
            than this. Recommended values are 1_000-1_000_000. Default is 10_000.
        unwrap: bool, default True
            If True and the current OCN has periodic boundaries, the
            resulting rasters will be transformed so connected grid cells
            are adjacent in the output. This will result in a larger raster
            with some nan values. If False or the current OCN does not have
            periodic boundaries, then no transformation is applied and the
            resulting raster will have the same dimensions as the current OCN grid.
        calculate_full_energy : bool, default False
            If True, the full energy of the graph is recalculated when considering
            the proposed change. If False, a more efficient incremental update is used.
            Small numerical differences may arise between the two methods due to floating point
            precision. If precision is of the utmost importance, set this to True, but note that
            this comes with a significant performance penalty.

        Returns
        -------
        ds : xr.Dataset | None
            If ``array_reports > 0``, an xarray.Dataset containing the state of the FlowGrid
            at approximately evenly spaced intervals throughout the optimization, including
            the initial and final states. See notes on xarray output for details.
            If ``array_reports == 0``, returns None.

        

        Note
        ----
        The returned xarray.Dataset will have coordinates:

        - `y` (float) representing the northing coordinate of each row
        - `x` (float) representing the easting coordinate of each column
        - `iteration` (int) representing the iteration index at which the data was recorded

        and data variables:

        - `energy` (np.float64) representing energy at each grid cell
        - `area` (np.float64) representing drained area at each grid cell
        - `elevation` (np.float64) representing elevation at each grid cell

        If the OCN has a periodic boundary condition, the following changes apply: 

        - The (0,0) coordinate will be set to the position of the "main" root node, defined as the root node with the smallest row*cols + col value
        - The rasters will be unwrapped to a non-periodic representation, which may result in larger rasters.
        - The size of the final rasters are the maximum extent of the unwrapped grid, taken across all iterations.

        Generating reports requires additional memory and computation time.
        
        Note
        ----
        At iteration ``i``, the outflow of a random grid cell if proposed to be rerouted.
        The proposal is accepted with the probability
        
        .. math::
            P(\\text{accept}) = e^{-\\Delta E / T},

        where :math:`\\Delta E` is the change in energy the change would cause 
        and :math:`T` is the temperature of the network.

        The total energy of the system is computed from the drained areas of each grid cell :math:`k` as

        .. math::
            E = \\sum_k A_k^\\gamma

        The temperature of the network is governed by a cooling schedule, which is a function of iteration index.
        
        Note that when :math:`\\Delta E < 0`, the move is always accepted.

        The cooling schedule used by this method is a piecewise function of iteration index:
        
        .. math::
            T(i) = \\begin{cases}
                E_0 & i < C N \\\\
                E_0 \\cdot e^{i - C N} & i \\ge C N
            \\end{cases}

        where :math:`E_0` is the initial energy, :math:`N` is the total number
        of iterations, and :math:`C` is ``constant_phase``. Decreasing-energy
        moves (:math:`\\Delta E < 0`) are always accepted.

        Alternative cooling schedules can be implemented using :meth:`fit_custom_cooling`.
        """
        
        # make sure energy is up to date, useful if the user modified any parameters manually
        self.__p_c_graph.contents.energy = self.compute_energy()
        if constant_phase is None:
            constant_phase = 0.0
        if cooling_rate is None:
            cooling_rate = 1.0
        if n_iterations is None:
            n_iterations = int((63 * np.exp(-0.448 * cooling_rate)) * self.dims[0] * self.dims[1] * (1 + constant_phase))

        # create a cooling schedule from arguments
        cooling_func = simulated_annealing_schedule(
            dims=self.dims,
            E0=self.energy,
            constant_phase=constant_phase,
            n_iterations=n_iterations,
            cooling_rate=cooling_rate,
        )

        return self.fit_custom_cooling(
            cooling_func=cooling_func,
            n_iterations=n_iterations,
            pbar=pbar,
            array_reports=array_reports,
            tol=tol,
            max_iterations_per_loop=max_iterations_per_loop,
            unwrap=unwrap,
            calculate_full_energy=calculate_full_energy,
        )



[docs]
    def fit_custom_cooling(
        self,
        cooling_func:Callable[[np.ndarray], np.ndarray],
        n_iterations:int=None,
        iteration_start:int=0,
        pbar:bool=False,
        array_reports:int=0,
        tol:float | None=None,
        max_iterations_per_loop=10_000,
        unwrap:bool=True,
        calculate_full_energy:bool=False,
    ) -> "xr.Dataset | None":
        """
        Optimize the OCN using the a custom cooling schedule. This allows for
        multi-stage optimizations or other custom cooling schedules not covered by the default simulated annealing schedule
        from Carraro et al (2020).

        See :meth:`fit` for additional details on the optimization algorithm and parameters.

        Parameters
        ----------
        cooling_func : Callable[[np.ndarray], np.ndarray]
            A function that takes an array of iteration indices and returns an array of temperatures.
            This function defines the cooling schedule for the optimization. Note that the function
            should return temperatures that are appropriate for the current energy of the OCN.
        n_iterations : int, optional
        iteration_start : int, default 0
            The starting iteration index. This is useful for continuing an optimization
            from a previous run. Must be a non-negative integer. If provided, ``n_iterations``
            is the number of additional iterations to perform. The iteration number passed to
            ``cooling_func`` will be ``iteration_start + i`` where ``i`` is the current iteration index
            in the range ``[0, n_iterations-1]``.
        pbar : bool, default True
        array_reports : int, default 0
        tol : float, optional
        max_iterations_per_loop: int, optional
        unwrap: bool, default True
        calculate_full_energy: bool, default False

        Returns
        -------
        xr.Dataset | None
        """
        # validate inputs
        if n_iterations is None:
            n_iterations = int(40*self.dims[0]*self.dims[1])
        if not (isinstance(n_iterations, int) and n_iterations > 0):
            raise ValueError(f"n_iterations must be a positive integer, got {n_iterations}")
        if not (isinstance(array_reports, int) and array_reports >= 0):
            raise ValueError(f"array_reports must be a non-negative integer, got {array_reports}")
        if (not isinstance(iteration_start, (int, np.integer))) or iteration_start < 0:
            raise ValueError(f"iteration_start must be a non-negative integer, got {iteration_start}")
        if (not isinstance(tol, Number)) or tol < 0:
            if tol is not None:
                raise ValueError(f"tol must be a positive number or None, got {tol}")
        memory_est = array_reports*self.dims[0]*self.dims[1]*2*8 
        if memory_est > 20e6:
            warnings.warn(f"Requesting {array_reports} array is estimated to use {memory_est/1e6:.2f}MB of memory. Consider reducing array_reports or increasing max_iterations_per_loop if memory is a concern.")
        
        xarray_out = array_reports > 0
        if xarray_out:
            try:
                import xarray as xr
            except ImportError as e:
                raise ImportError(
                    "PyOCN.OCN.fit() with array_report>0 requires xarray to be installed. Install with `pip install xarray`."
                ) from e

        # preallocate output arrays
        max_iterations_per_loop = int(max_iterations_per_loop)
        max_iterations_per_loop = max(1, max_iterations_per_loop)
        n_iterations = int(n_iterations)
        n_iterations = max(1, n_iterations)
        max_iterations_per_loop = min(n_iterations, max_iterations_per_loop)

        # preallocate output arrays
        energy_out = np.empty(
            n_iterations//max_iterations_per_loop + 2, # always report energy when reporting arrays
            dtype=np.float64)
        
        if array_reports:
            array_report_interval = n_iterations // array_reports
            array_report_interval = max(array_report_interval, max_iterations_per_loop)
        else:
            array_report_interval = n_iterations*2  # never report arrays

        # temporary buffer to use for passing temperatures to libocn
        anneal_buf = np.empty(max_iterations_per_loop, dtype=np.float64)
        anneal_ptr = anneal_buf.ctypes.data_as(ctypes.POINTER(ctypes.c_double))

        completed_iterations = iteration_start
        n_iterations += iteration_start

        # set up reporting
        array_report_idx = []
        energy_report_idx = []
        ds_out_dict = dict()
        array_report_idx.append(completed_iterations)
        if xarray_out:
            ds_out_dict[completed_iterations] = self.to_xarray(unwrap=self.wrap)
        energy_out[0] = self.energy
        energy_report_idx.append(completed_iterations)

        pbar = tqdm(
            total=n_iterations - iteration_start, 
            desc="OCN Fit", 
            unit_scale=True, 
            dynamic_ncols=True, 
            disable=not (pbar or self.verbosity >= 1)
        )
        
        consecutive_convergence_required = 2
        consecutive_convergence_tests_passed = 0
        while completed_iterations < n_iterations:
            iterations_this_loop = min(max_iterations_per_loop, n_iterations - completed_iterations)
            anneal_buf[:iterations_this_loop] = cooling_func(
                np.arange(completed_iterations, completed_iterations + iterations_this_loop)
            )

            # main call to optimizer in libocn
            e_old = self.energy
            check_status(_bindings.libocn.ocn_outer_ocn_loop(
                self.__p_c_graph, 
                iterations_this_loop, 
                self.gamma, 
                anneal_ptr,
                calculate_full_energy,
            ))
            e_new = self.energy
            completed_iterations += iterations_this_loop
            
            # always report energy
            energy_out[len(energy_report_idx)] = e_new
            energy_report_idx.append(completed_iterations)
            # report arrays if requested
            if (
                xarray_out 
                and (
                    (completed_iterations % array_report_interval) < max_iterations_per_loop  # intermediate report
                    or completed_iterations >= n_iterations  # final report
                )
            ):
                array_report_idx.append(completed_iterations)
                ds_out_dict[completed_iterations] = self.to_xarray(unwrap=unwrap)  # TODO: pre-allocate this dict?


            # progress bar update
            # TODO: move this to a separate function
            if pbar or self.verbosity >= 1:
                RED = '\033[31m'
                YELLOW = '\033[33m'
                CYAN = '\033[36m'
                END = '\033[0m'
                T_over_E = anneal_buf[iterations_this_loop - 1]/e_old*100
                ToE_str = f"{int(np.floor(T_over_E)):02d}.{int((T_over_E - np.floor(T_over_E))*100):02d}%"
                de_over_E = (e_new - e_old)/e_old / iterations_this_loop
                dEoE_sign = '+' if de_over_E >= 0 else '-'
                dEoE_str = f"{dEoE_sign}{np.abs(de_over_E):.0e}"
                
                if T_over_E > 50: ToE_str = RED + ToE_str + END
                elif T_over_E > 5: ToE_str = YELLOW + ToE_str + END
                else: ToE_str = CYAN + ToE_str + END
                if de_over_E > 1e-7: dEoE_str = RED + dEoE_str + END
                elif de_over_E > -1e-7: dEoE_str = YELLOW + dEoE_str + END
                else: dEoE_str = CYAN + dEoE_str + END

                pbar.set_postfix({
                    "E": f"{self.energy:.1e}", 
                    "T/E": ToE_str,
                    # "ΔE/E/iter": dEoE_str,
                    "ΔE/E/iter": dEoE_str,
                })
                pbar.update(iterations_this_loop)

            # check for convergence if requested
            can_check_convergence = (tol is not None) and (completed_iterations >= 0.333 * n_iterations)
            improved_score = e_new <= e_old
            relative_improvement_per_iteration = abs((e_old - e_new) / e_old)/iterations_this_loop if e_old > 0 else np.inf
            if can_check_convergence and improved_score and (relative_improvement_per_iteration < tol):
                consecutive_convergence_tests_passed += 1
                if consecutive_convergence_tests_passed >= consecutive_convergence_required:
                    if self.verbosity >= 1:
                        print("Convergence reached, stopping optimization.")
                    break
            else:
                consecutive_convergence_tests_passed = 0
        
        pbar.close()
        
        # update energy and temperature history
        last_history_iteration = int(self.history[-1, 0]) if self.history.shape[0] else 0
        skip_first = 1 if self.history.shape[0] else 0
        history = np.stack([
            last_history_iteration + np.asarray(energy_report_idx)[skip_first:] - iteration_start,
            energy_out[skip_first:len(energy_report_idx)],
            cooling_func(np.asarray(energy_report_idx[skip_first:])),
        ], axis=1).reshape(-1, 3)
        self.__history = np.concatenate([self.__history, history], axis=0)
        
        if not xarray_out: 
            return None
    
        # convert the ds_out_dict to a single xarray.Dataset with an iteration dimension if requested
        # TODO: move this to a separate function???
        
        # if unwrapping is requested, the output rasters may have different shapes, so we need to find the max extent
        # across all reported arrays and create a new raster with that shape.
        
        # find the maximum extent of the unwrapped grid across all reported arrays
        coord_ranges = list((ds.x.data.min(), ds.x.data.max(), ds.y.data.min(), ds.y.data.max()) for ds in ds_out_dict.values())
        xmin, xmax, ymin, ymax = (
            min(coord_range[0] for coord_range in coord_ranges), 
            max(coord_range[1] for coord_range in coord_ranges), 
            min(coord_range[2] for coord_range in coord_ranges), 
            max(coord_range[3] for coord_range in coord_ranges),
        )
        new_xcoords = np.arange(xmin, xmax + self.resolution, self.resolution)
        new_ycoords = np.arange(ymin, ymax + self.resolution, self.resolution)

        data_shape = (len(ds_out_dict), len(new_ycoords), len(new_xcoords))

        # build an empty dataset
        ds = xr.Dataset(
            data_vars={
                "energy": (
                    ["iteration", "y", "x"], 
                    np.full(data_shape, np.nan, dtype=np.float64)
                ),
                "area": (
                    ["iteration", "y", "x"], 
                    np.full(data_shape, np.nan, dtype=np.float64)
                ),
                "elevation": (
                    ["iteration", "y", "x"], 
                    np.full(data_shape, np.nan, dtype=np.float64)
                ),
            },
            coords={
                "iteration": ("iteration", np.asarray(array_report_idx)),
                "y": ("y", new_ycoords),
                "x": ("x", new_xcoords),
            },
            attrs={
                "description": "OCN fit result arrays",
                "resolution": self.resolution,
                "gamma": self.gamma,
                "rng": self.rng,
                "wrap": self.wrap,
            }
        )

        # fill in the dataset with the unwrapped arrays, matching coordinates
        for i, ds_i in ds_out_dict.items():
            ds.energy.loc[dict(iteration=i, y=ds_i.y, x=ds_i.x)] = ds_i.energy
            ds.area.loc[dict(iteration=i, y=ds_i.y, x=ds_i.x)] = ds_i.area
            ds.elevation.loc[dict(iteration=i, y=ds_i.y, x=ds_i.x)] = ds_i.elevation

        return ds