Source code for PyOCN.utils

"""
Utility functions for working with OCNs.
"""

from __future__ import annotations
from collections.abc import Generator
from concurrent.futures import ThreadPoolExecutor
from ctypes import byref
from itertools import product
import os
from typing import Any, Literal, Callable, TYPE_CHECKING, Union
from numbers import Number
from functools import partial

import networkx as nx
import numpy as np
from tqdm import tqdm

import PyOCN._libocn_bindings as _bindings
from PyOCN._statushandler import check_status

if TYPE_CHECKING:
    from .ocn import OCN

_allowed_net_types = {"I", "H", "V", "E"}

#TODO: add ability to move root?

[docs]
def net_type_to_dag(net_type:Literal["I", "H", "V", "E"], dims:tuple, pbar: bool = False) -> nx.DiGraph:
    """Create a predefined OCN initialization network as a NetworkX DiGraph.

    Parameters
    ----------
    net_type : {"I", "H", "V", "E"}
        The type of network to create.
        Descriptions of allowed types:

        - "I":

          ::

              O--O--O--O--O
                    |
              O--O--O--O--O
                    |
              O--O--O--O--O
                    |
              O--O--X--O--O

        - "V":

          ::

              O  O  O  O  O
               \\  \\ | /  /
              O  O  O  O  O
               \\  \\ | /  /
              O  O  O  O  O
               \\  \\ | /  /
              O--O--X--O--O

        - "H":

          ::

              O  O  O  O
              |  |  | /
              O  O  O--O
              |  | /
              O  O--O--O
              | /
              X--O--O--O

        - "E": A network where every node on the edge of the grid is a root. Initial flow moves away from center towards edges.

    dims : tuple
        The network dimensions as ``(rows, cols)``. Both must be positive even integers.
    pbar : bool, default False
        If True, display a progress bar while constructing the graph.

    Returns
    -------
    networkx.DiGraph
        A directed acyclic graph representing a valid initial OCN configuration.

    Raises
    ------
    ValueError
        If ``net_type`` is invalid or ``dims`` are not two positive even integers.

    Note
    ----
    The returned graph assigns each grid cell exactly one node with a ``pos``
    attribute equal to ``(row, col)``.
    """
    rows, cols = dims
    G = nx.DiGraph()
    pbar = tqdm(product(range(rows), range(cols)), total=rows*cols, disable=not pbar, desc="Creating DAG")
    match net_type:
        case "I":
            jroot = cols // 2
            for i, j in pbar:
                n = i*cols + j
                G.add_node(n, pos=(i, j))
                if j < jroot:
                    G.add_edge(n, n+1)
                elif j > jroot:
                    G.add_edge(n, n-1)
                elif i > 0:
                    G.add_edge(n, n - cols)

        case "V":
            jroot = cols // 2
            for i, j in pbar:
                n = i*cols + j
                G.add_node(n, pos=(i, j))
                if i > 0:
                    if j < jroot:
                        G.add_edge(n, n - cols + 1)
                    elif j > jroot:
                        G.add_edge(n, n - cols - 1)
                    else:
                        G.add_edge(n, n - cols)
                else:
                    if j < jroot:
                        G.add_edge(n, n + 1)
                    elif j > jroot:
                        G.add_edge(n, n - 1)
        case "H": # hip roof is like V, but flowing towards a corner.
            for i, j in pbar:
                n = i*cols + j
                G.add_node(n, pos=(i, j))
                if i == j and i > 0:  # main diagonal
                    G.add_edge(n, n - cols - 1)
                elif i > j:
                    G.add_edge(n, n - cols)
                elif j > i:
                    G.add_edge(n, n - 1)
        case "E":  #TODO: implement a better radial pattern
            half_rows = rows / 2
            half_cols = cols / 2
            for i, j in pbar:
                n = i*cols + j
                G.add_node(n, pos=(i, j))
                # ul quadrant: flow up and left
                if i < half_rows and j < half_cols and i > 0 and j > 0:
                    G.add_edge(n, n - cols - 1)
                # ur quadrant: flow up and right
                elif i < half_rows and j >= half_cols and i > 0 and j < cols - 1:
                    G.add_edge(n, n - cols + 1)
                # ll quadrant: flow down and left
                elif i >= half_rows and j < half_cols and j > 0 and i < rows - 1:
                    G.add_edge(n, n + cols - 1)
                # lr quadrant: flow down and right
                elif i >= half_rows and j >= half_cols and i < rows - 1 and j < cols - 1:
                    G.add_edge(n, n + cols + 1)
        case _:
            raise ValueError(f"Invalid net_type {net_type}. Must be one of {_allowed_net_types}.")
        
    return G



[docs]
def simulated_annealing_schedule(dims: tuple[int, int],E0: float,constant_phase: float,n_iterations: int,cooling_rate: float,) -> Callable[[int], Union[float, np.ndarray]]:
    """
    Create a simulated-annealing cooling schedule for OCN optimization.

    This returns a callable ``schedule(i)`` that returns the temperature at
    iteration ``i``. The schedule consists of a constant-temperature phase
    followed by an exponentially decaying phase.

    Parameters
    ----------
    dims : tuple[int, int]
        The dimensions of the grid as (rows, cols).
    E0 : float
        Initial energy value.
    constant_phase : float
        Fraction of iterations (``0 <= fraction <= 1``) during which the
        temperature remains constant at ``Energy[0]``.
    n_iterations : int
        Total number of optimization iterations.
    cooling_rate : float
        Positive decay rate controlling the exponential temperature decrease
        after the constant phase.

    Returns
    -------
    Callable[[int], Union[float, np.ndarray]]
        A function mapping an iteration index ``i`` to a temperature value. If
        vectorized evaluation is used, may return a NumPy array of temperatures.

    Note
    ----
    The exponential phase follows the form

    .. math::

        T_i = E_0 \\exp\\left(-\\frac{r\\cdot(i - n_0)}{N}\\right),

    where ``E0`` is the initial energy, ``n0`` is the number of iterations in
    the constant phase, ``r`` is the cooling rate,and ``N = rows * cols``.
    """
    if (not isinstance(constant_phase, Number) or constant_phase < 0 or constant_phase > 1):
        raise ValueError(f"constant_phase must be a number between 0 and 1. Got {constant_phase}")
    if (not isinstance(n_iterations, int) or n_iterations <= 0):
        raise ValueError(f"n_iterations must be a positive integer. Got {n_iterations}")
    if not isinstance(cooling_rate, Number):
        raise ValueError(f"cooling_rate must be a number. Got {cooling_rate}")
    if not isinstance(E0, Number) or E0 <= 0:
        raise ValueError(f"E0 must be a positive number. Got {E0}")
    if not (isinstance(dims, tuple) and len(dims) == 2 and all(isinstance(d, int) and d > 0 for d in dims)):
        raise ValueError(f"dims must be a tuple of two positive integers. Got {dims}")
    
    n_constant = int(constant_phase * n_iterations)
    nnodes = dims[0] * dims[1]

    term1 = -cooling_rate / nnodes
    term2 = cooling_rate * n_constant / nnodes

    def schedule(i):
        i = np.asarray(i)
        return np.where(i < n_constant, E0, E0 * np.exp(term1*i + term2))

    return schedule



[docs]
def unwrap_digraph(dag: nx.DiGraph, dims: tuple[int, int]) -> nx.DiGraph:
    """"unwrap" gridcell coordinate attributes in a directed acyclic graph to place connected
    nodes adjacent to each other, removing periodic boundary conditions.

    Parameters
    ----------
    dag : nx.DiGraph
        The input directed acyclic graph with periodic boundary conditions.
        Each node must have a 'pos' attribute indicating its (row, col) position.
    dims : tuple[int, int]
        The dimensions of the grid as (rows, cols). Both must be positive integers.

    Returns
    -------
    nx.DiGraph
        A new directed acyclic graph with unwrapped grid coordinates. May not be
        consistent with a grid structure.

    Raises
    ------
    ValueError
        If any node in the input graph lacks a 'pos' attribute or if the
        dimensions are not positive integers.

    Important
    ---------
    The function assumes that the input graph is a valid DAG and that the
    'pos' attributes are correctly assigned. The output graph will no longer
    span a toroidal topology and will no longer cover a dense grid of nodes.
    """
    new_dag = dag.copy()
    
    for _ in range(2):
        for n in nx.topological_sort(new_dag):

            pos = new_dag.nodes[n]['pos']
            r, c = pos
            succs = list(new_dag.successors(n))
            
            # check for row wrapping
            for s in succs:
                sr, _ = new_dag.nodes[s]['pos']
                dr = sr - r
                # if we detect wrapping, move all ancestors and self
                if dr > 1:  # wrapped downward
                    for anc in nx.ancestors(new_dag, n):
                        anc_r, anc_c = new_dag.nodes[anc]['pos']
                        new_dag.nodes[anc]['pos'] = (anc_r + dims[0], anc_c)
                    new_dag.nodes[n]['pos'] = (r + dims[0], c)
                    break
                elif dr < -1:  # wrapped upward
                    for anc in nx.ancestors(new_dag, n):
                        anc_r, anc_c = new_dag.nodes[anc]['pos']
                        new_dag.nodes[anc]['pos'] = (anc_r - dims[0], anc_c)
                    new_dag.nodes[n]['pos'] = (r - dims[0], c)
                    break
            # check for column wrapping
            for s in succs:
                _, sc = new_dag.nodes[s]['pos']
                dc = sc - c
                if dc > 1:  # wrapped rightward
                    for anc in nx.ancestors(new_dag, n):
                        anc_r, anc_c = new_dag.nodes[anc]['pos']
                        new_dag.nodes[anc]['pos'] = (anc_r, anc_c + dims[1])
                    new_dag.nodes[n]['pos'] = (r, c + dims[1])
                    break
                elif dc < -1:  # wrapped leftward
                    for anc in nx.ancestors(new_dag, n):
                        anc_r, anc_c = new_dag.nodes[anc]['pos']
                        new_dag.nodes[anc]['pos'] = (anc_r, anc_c - dims[1])
                    new_dag.nodes[n]['pos'] = (r, c - dims[1])
                    break
    # Adjust positions to be non-negative
    positions = np.array(list(nx.get_node_attributes(new_dag, 'pos').values()))
    row_off, col_off = positions.min(axis=0)
    for n in new_dag.nodes:
        r, c = new_dag.nodes[n]['pos']
        new_dag.nodes[n]['pos'] = (r - row_off, c - col_off)
    return new_dag



[docs]
def assign_subwatersheds(dag: nx.DiGraph) -> None:
    """Assign a 'watershed_id' attribute to each node in the DAG. 
    The resulting watershed_ids will be of the highest order possible,
    meaning that ids are assigned based on watersheds that drain directly into the 
    root nodes of the graph. To assign ids to lower order watersheds, consider first
    partitioning the graph into smaller subgraphs using the `get_subwatersheds` function.

    Parameters
    ----------
    dag : nx.DiGraph
        The input directed acyclic graph. Each node must have a 'pos' attribute
        indicating its (row, col) position.

    Returns
    -------
    None
        The function modifies the input graph in place by adding a 'watershed_id'
        attribute to each node.

    Raises
    ------
    ValueError
        If any node in the input graph lacks a 'pos' attribute.

    Note
    ----
    A subwatershed is defined as the set of nodes that drain to a common outlet,
    where an outlet is a node with out-degree zero. Each subwatershed is assigned
    a unique integer ID, starting from 0. Nodes that are outlets themselves are
    assigned a watershed ID of -1.
    """
    roots = [n for n, d in dag.out_degree() if d==0]
    subwatershed_outlets = [n for root in roots for n in dag.predecessors(root)]
    subwatersheds = list(set(nx.ancestors(dag, outlet)) | {outlet} for outlet in subwatershed_outlets)
    subwatersheds = [dag.subgraph(wshd) for wshd in subwatersheds]
    for i, wshd in enumerate(subwatersheds):
        nx.set_node_attributes(wshd, i + 1, 'watershed_id')
    for r in roots:
        nx.set_node_attributes(dag, {r: -1}, 'watershed_id')



[docs]
def get_subwatersheds(dag : nx.DiGraph, node : Any) -> set[nx.DiGraph]:
    """Extract subwatershed subgraphs from the main DAG. Each subwatershed drains to a common outlet node `node`.
    Node `node` is not included in the returned subwatershed graphs.

    Parameters
    ----------
    dag : nx.DiGraph
        The input directed acyclic graph. Each node must have a 'pos' attribute
        indicating its (row, col) position.
    node : Any
        A node in the graph representing the outlet of a subwatershed.

    Returns
    -------
    set of nx.DiGraph
        A set of directed acyclic graphs, each representing a subwatershed.

    Danger
    ------
    The returned subwatersheds are subgraph views of the input graph and share node
    and edge data with the original graph. Unless copied, any changes to node or edge attributes
    in the subwatersheds will affect the original graph.
    """
    subwatershed_outlets = [n for n in dag.predecessors(node)]
    subwatersheds = (nx.ancestors(dag, outlet) | {outlet} for outlet in subwatershed_outlets)
    subwatersheds = set(dag.subgraph(wshd) for wshd in subwatersheds)
    return subwatersheds


# # deferring stream order calculations for now.
# def assign_strahler_orders(dag: nx.DiGraph) -> None:
#     """Assign Strahler order to each node in the DAG as a 'strahler_order' attribute.
#     Modifies the input graph in place.

#     Parameters
#     ----------
#     dag : nx.DiGraph
#         The input directed acyclic graph.
#     """
#     # Initialize Strahler order for leaf nodes
#     leaf_nodes = [n for n, d in dag.in_degree() if d == 0]
#     nx.set_node_attributes(dag, {n: 1 for n in leaf_nodes}, 'strahler_order')

#     # Compute Strahler order for other nodes
#     strahler_orders = dict(nx.get_node_attributes(dag, 'strahler_order'))
#     for n in nx.topological_sort(dag):
#         if dag.in_degree(n):
#             in_orders = [strahler_orders[p] for p in dag.predecessors(n)]
#             max_order = max(in_orders)
#             if sum(o == max_order for o in in_orders) > 1:
#                 order = max_order + 1
#             else:
#                 order = max_order
#             strahler_orders[n] = order
#     nx.set_node_attributes(dag, strahler_orders, 'strahler_order')

# def assign_shreve_orders(dag: nx.DiGraph) -> None:
#     """Assign Shreve order to each node in the DAG as a 'shreve_order' attribute.
#     Shreve order is defined as the total number of upstream sources that contribute to a node.

#     Parameters
#     ----------
#     dag : nx.DiGraph
#         The input directed acyclic graph.
#     """
#     # Initialize Shreve order for leaf nodes
#     leaf_nodes = [n for n, d in dag.in_degree() if d == 0]
#     nx.set_node_attributes(dag, {n: 1 for n in leaf_nodes}, 'shreve_order')

#     # Compute Shreve order for other nodes
#     shreve_orders = dict(nx.get_node_attributes(dag, 'shreve_order'))
#     for n in nx.topological_sort(dag):
#         if dag.in_degree(n):
#             in_orders = [shreve_orders[p] for p in dag.predecessors(n)]
#             order = sum(in_orders)
#             shreve_orders[n] = order
#     nx.set_node_attributes(dag, shreve_orders, 'shreve_order')
    

def parallel_fit(
    ocn:OCN|list[OCN], 
    n_runs=5, 
    n_threads=None, 
    fit_method:Literal["fit", "fit_custom_cooling"]|list[Literal["fit", "fit_custom_cooling"]]|None=None, 
    increment_rng:bool=True, 
    pbar:bool=False, 
    fit_kwargs:dict|list[dict]=None
) -> tuple[list[Any], list[OCN]]:
    """Convenience function to perform multiple OCN fitting operations in parallel using multithreading. 
    Useful for doing sensitivity analysis or ensemble fitting.

    Parameters
    ----------
    ocn : OCN | list[OCN]
        The OCN instance(s) to fit. If a list of OCNs is provided, each OCN will be fitted independently.
        If a single OCN is provided, it will be copied `n_runs` times.
        Not modified during fitting.
    n_runs : int, default 5
        The number of fitting runs to perform. Must be equal to the length of `ocn` if `ocn` is a list.
    n_threads : int, default None
        The number of worker threads to use for parallel execution. If None, defaults to the number of CPU cores, times 2.
    fit_method : {"fit", "fit_custom_cooling"} | list[{"fit", "fit_custom_cooling"} | None], default None
        The fitting method to use. If None, defaults to "fit". If a list is provided, it must be of length `n_runs`,
        and each element specifies the fitting method for the corresponding fit.
    increment_rng : bool, default True
        If True, each fit's random seed is set to `ocn.rng + i`, where `i` is the thread index.
    pbar : bool, default False
        If True, display a master progress bar that tracks the completion of each thread.
    fit_kwargs : dict | list[dict], optional
        Additional keyword arguments to pass to the `OCN.fit` method. If a list of dicts is provided,
        it must be of length `n_runs`, and each dict will be used for the corresponding fit.

    Returns
    -------
    tuple[list[Any], list[OCN]]
        A tuple containing two lists:
        - A list of results from each fitting operation.
        - A list of fitted OCN instances corresponding to each fitting operation.
    """

    if isinstance(ocn, list):
        if len(ocn) != n_runs:
            raise ValueError(f"When ocn is a list, its length must equal n_runs. Got len(ocn)={len(ocn)} and n_runs={n_runs}.")
        ocn = [o.copy() for o in ocn]
    else:
        ocn = [ocn.copy() for _ in range(n_runs)]

    if isinstance(fit_kwargs, list):
        if len(fit_kwargs) != n_runs:
            raise ValueError(f"When fit_kwargs is a list, its length must equal n_runs. Got len(fit_kwargs)={len(fit_kwargs)} and n_runs={n_runs}.")
        if not all(isinstance(k, dict) for k in fit_kwargs):
            raise ValueError("All elements of fit_kwargs list must be dictionaries.")
    elif not isinstance(fit_kwargs, dict) and fit_kwargs is not None:
        raise ValueError(f"fit_kwargs must be a dict or a list of dicts. Got {type(fit_kwargs)}.")
    else: 
        fit_kwargs = [fit_kwargs or dict() for _ in range(n_runs)]

    if isinstance(fit_method, list):
        if len(fit_method) != n_runs:
            raise ValueError(f"When fit_method is a list, its length must equal n_runs. Got len(fit_method)={len(fit_method)} and n_runs={n_runs}.")
        elif not all(m is None or m in {"fit", "fit_custom_cooling"} for m in fit_method):
            raise ValueError("All elements of fit_method list must be one of 'fit', 'fit_custom_cooling', or None.")
    else:
        if fit_method is not None and fit_method not in {"fit", "fit_custom_cooling"}:
            raise ValueError(f"Invalid fit_method {fit_method}. Must be one of 'fit', 'fit_custom_cooling', or None.")
        fit_method = [fit_method for _ in range(n_runs)]

    def fit(ocn, i, fit_method, fit_kwargs):
        if increment_rng:
            ocn.rng  = ocn.rng + i
        if fit_method is None or fit_method == "fit":
            res = ocn.fit(**fit_kwargs)
        elif fit_method == "fit_custom_cooling":
            res = ocn.fit_custom_cooling(**fit_kwargs)
        else:
            raise ValueError(f"Invalid fit_method {fit_method}. Must be one of 'fit', 'fit_custom_cooling', or None.")
        return res, i  # return index to place result correctly, in case of out-of-order completion.
    
    if n_threads is None:
        n_threads = os.cpu_count()*2
    n_threads = min(os.cpu_count()*2, n_threads)

    with ThreadPoolExecutor(max_workers=n_threads) as executor:
        futures = []
        for i in range(n_runs):
            futures.append(executor.submit(fit, ocn[i], i, fit_method[i], fit_kwargs[i]))
        results = [None] * n_runs
        pbar = tqdm(futures, disable=not pbar, desc="Fitting OCNs")
        for future in futures:
            res, idx = future.result()
            results[idx] = res
            pbar.update(1)
    return results, ocn

# # Commenting out for now. May decide to re-introduce later
# def ancestors(ocn:OCN, pos:tuple[int, int]) -> set[tuple[int, int]]:
#     """Returns all nodes that drain into the node at position `pos` in the OCN.

#     Parameters
#     ----------
#     ocn : OCN
#         The OCN instance.
#     pos : tuple[int, int]
#         The (row, col) position of the node whose predecessors are to be found.

#     Returns
#     -------
#     set()
#         A set of (row, col) tuples representing the positions of all ancestor nodes
#         that eventually drain into the specified node, not including the node itself.

#     See Also
#     --------
#     :meth:`OCN.predecessors`
#     :meth:`OCN.successors`
#     :meth:`utils.descendants`
#     """

#     pos = tuple(pos)
#     if len(pos) != 2 or not all(isinstance(p, int) for p in pos):
#         raise TypeError(f"Position must be a tuple of two integers. Got {pos}.")
#     if (pos[0] < 0 or pos[0] >= ocn.dims[0]) or (pos[1] < 0 or pos[1] >= ocn.dims[1]):
#         raise IndexError(f"Position {pos} is out of bounds for OCN with dimensions {ocn.dims}.")

#     a = _bindings.libocn.fg_cart_to_lin(
#         _bindings.CartPair_C(row=pos[0], col=pos[1]),
#         _bindings.CartPair_C(row=ocn.dims[0], col=ocn.dims[1])
#     )
#     upstream_indices = (_bindings.linidx_t * (ocn.dims[0]*ocn.dims[1]))()
#     nupstream = _bindings.linidx_t(0)
#     check_status(_bindings.libocn.fg_dfs_iterative(
#         upstream_indices, 
#         byref(nupstream), 
#         (_bindings.linidx_t * (ocn.dims[0]*ocn.dims[1]))(), 
#         ocn._OCN__p_c_graph, 
#         a
#     ))

#     return set(
#         (int(c.row), int(c.col)) 
#         for c in (
#             _bindings.libocn.fg_lin_to_cart(
#                 idx, 
#                 _bindings.CartPair_C(row=ocn.dims[0], col=ocn.dims[1])
#             ) 
#             for idx in upstream_indices[:nupstream.value]
#         )
#     )

# # TODO write tests for the traversal functions
# def descendants(ocn:OCN, pos:tuple[int, int]) -> set[tuple[int, int]]:
#     """Returns all nodes that are reachable from the node at position `pos` in the OCN.
#     Mirrors the functionality of `networkx.descendants`.

#     Parameters
#     ----------
#     ocn : OCN
#         The OCN instance.
#     pos : tuple[int, int]
#         The (row, col) position of the node whose successors are to be found.

#     Returns
#     -------
#     set()
#         A set of (row, col) tuples representing the positions of all descendant nodes
#         that the specified node eventually drains into, not including the node itself.

#     See Also
#     --------
#     :meth:`OCN.predecessors`
#     :meth:`OCN.successors`
#     :meth:`utils.ancestors`
#     """

#     pos = tuple(pos)
#     if len(pos) != 2 or not all(isinstance(p, int) for p in pos):
#         raise TypeError(f"Position must be a tuple of two integers. Got {pos}.")
#     if (pos[0] < 0 or pos[0] >= ocn.dims[0]) or (pos[1] < 0 or pos[1] >= ocn.dims[1]):
#         raise IndexError(f"Position {pos} is out of bounds for OCN with dimensions {ocn.dims}.")

#     a = _bindings.libocn.fg_cart_to_lin(
#         _bindings.CartPair_C(row=pos[0], col=pos[1]),
#         _bindings.CartPair_C(row=ocn.dims[0], col=ocn.dims[1])
#     )
#     downstream_indices = (_bindings.linidx_t * (ocn.dims[0]*ocn.dims[1]))()
#     ndownstream = _bindings.linidx_t(0)
#     check_status(_bindings.libocn.flow_downstream(
#         downstream_indices,
#         byref(ndownstream),
#         ocn._OCN__p_c_graph,
#         a
#     ))

#     return set(
#         (int(c.row), int(c.col))
#         for c in (
#             _bindings.libocn.fg_lin_to_cart(
#                 idx,
#                 _bindings.CartPair_C(row=ocn.dims[0], col=ocn.dims[1])
#             )
#             for idx in downstream_indices[:ndownstream.value]
#         )
#     )

__all__ = [
    "net_type_to_dag",
    "simulated_annealing_schedule",
    "unwrap_digraph",
    "assign_subwatersheds",
    "get_subwatersheds",
    "parallel_fit",
    "assign_strahler_orders",
    "assign_shreve_orders",
]