stDiGraph

stDiGraph(
    base_graph: DiGraph,
    additional_starts: list = [],
    additional_ends: list = [],
)

Bases: DiGraph

Source code in flowpaths/stdigraph.py

def __init__(
    self,
    base_graph: nx.DiGraph,
    additional_starts: list = [],
    additional_ends: list = [],
):
    """
    Initialize the graph from `base_graph`.

    Parameters
    ----------
    - base_graph (nx.DiGraph): The graph to wrap. Every node must be a string.
    - additional_starts (list): Stored on the instance as the set `self.additional_starts`.
            The default list is never mutated, only copied into a set.
    - additional_ends (list): Stored on the instance as the set `self.additional_ends`.
            The default list is never mutated, only copied into a set.

    Raises
    ----------
    - ValueError: If some node of `base_graph` is not a string.
    """
    has_non_string_node = any(
        not isinstance(node, str) for node in base_graph.nodes()
    )
    if has_non_string_node:
        utils.logger.error(f"{__name__}: Every node of the graph must be a string.")
        raise ValueError("Every node of the graph must be a string.")

    super().__init__()

    self.base_graph = base_graph
    # Reuse the id stored in the base graph's attributes when there is one;
    # otherwise fall back to the identity of this object.
    self.id = base_graph.graph["id"] if "id" in base_graph.graph else id(self)

    self.additional_starts = set(additional_starts)
    self.additional_ends = set(additional_ends)

    # The global source / sink names embed id(self) (not self.id).
    self.source = f"source_{id(self)}"
    self.sink = f"sink_{id(self)}"

    # NOTE(review): _build_graph is defined outside this view; presumably it
    # populates this graph from base_graph and the source / sink — confirm.
    self._build_graph()

    nx.freeze(self)

compute_max_edge_antichain

compute_max_edge_antichain(
    get_antichain=False,
    weight_function=None,
)

Computes the maximum edge antichain in a directed graph.

Parameters

get_antichain (bool): If True, the function also returns the antichain along with its cost. Default is False.
weight_function (dict): A dictionary where keys are edges (tuples) and values are weights. If None, weight 1 is used for original graph edges, and weight 0 is used for global source / global sink edges. If given, the antichain weight is computed as the sum of the weights of the edges in the antichain, where edges missing from the dictionary get weight 0. Default is None.

Returns

If get_antichain is False, returns the size of maximum edge antichain.
If get_antichain is True, returns a tuple containing the size of maximum edge antichain and the antichain.

Source code in flowpaths/stdigraph.py

def compute_max_edge_antichain(self, get_antichain=False, weight_function=None):
    """
    Computes the maximum edge antichain in a directed graph.

    The value is obtained as the cost of a minimum-cost flow from the global source
    to the global sink, in which every edge carries its weight as a demand on the flow
    and only the edges leaving the global source have cost 1.

    Parameters
    ----------
    - get_antichain (bool): If True, the function also returns the antichain along with its cost. Default is False.
    - weight_function (dict): A dictionary where keys are edges (tuples) and values are weights.
            If None, weight 1 is used for original graph edges, and weight 0 is used for global source / global sink edges.
            If given (even if empty), the antichain weight is computed as the sum of the weights of the edges in the antichain,
            where edges missing from the dictionary get weight 0.
            Default is None.

    Returns
    ----------
    - If get_antichain is False, returns the size of maximum edge antichain.
    - If get_antichain is True, returns a tuple containing the
            size of maximum edge antichain and the antichain.
    """

    # Test against None rather than truthiness: an explicitly given empty
    # dictionary means "every edge has weight 0" and must not silently fall
    # back to the default weights.
    use_custom_weights = weight_function is not None

    G_nx = nx.DiGraph()
    demand = dict()

    G_nx.add_nodes_from(self.nodes())

    for u, v in self.edges():
        # the cost of each path is 1 (paid on the edge leaving the global source)
        cost = 1 if u == self.source else 0

        if use_custom_weights:
            edge_demand = weight_function.get((u, v), 0)
        else:
            edge_demand = int(u != self.source and v != self.sink)

        demand[(u, v)] = edge_demand
        # adding the edge
        # NOTE(review): l / u / c are presumably the lower bound, upper bound and
        # cost attributes expected by graphutils.min_cost_flow — confirm there.
        G_nx.add_edge(u, v, l=edge_demand, u=graphutils.bigNumber, c=cost)

    minFlowCost, minFlow = graphutils.min_cost_flow(G_nx, self.source, self.sink)

    if not get_antichain:
        return minFlowCost

    # Node marks used by the two traversals below:
    #   0 = not reached, 1 = reached by the first pass, 2 = processed by the second pass.
    antichain = []
    visited = {node: 0 for node in self.nodes()}

    def DFS_find_reachable_from_source(start_node, visited):
        # Iterative, stack-based traversal (replaces an earlier recursive version).
        # From a node u it moves forward along edges whose flow exceeds their demand,
        # and backward along every incoming edge, marking each reached node with 1.
        stack = [start_node]

        while stack:
            u = stack.pop()
            if visited[u] != 0:
                continue

            assert u != self.sink
            visited[u] = 1

            for v in self.successors(u):
                if minFlow[u][v] > demand[(u, v)] and visited[v] == 0:
                    stack.append(v)

            for v in self.predecessors(u):
                if visited[v] == 0:
                    stack.append(v)

    def DFS_find_saturating(start_node, visited):
        # Iterative, stack-based traversal (replaces an earlier recursive version).
        # Walks again over the nodes marked 1 (re-marking them 2) and collects the
        # edges (u, v) that leave this set towards an unmarked node and whose flow
        # equals a demand of at least 1.
        stack = [start_node]

        while stack:
            u = stack.pop()

            if visited[u] != 1:
                continue

            visited[u] = 2

            # Process successors
            for v in self.successors(u):
                if minFlow[u][v] > demand[(u, v)]:
                    if visited[v] == 1:  # Only visit nodes marked as reachable (1)
                        stack.append(v)
                elif (
                    minFlow[u][v] == demand[(u, v)]
                    and demand[(u, v)] >= 1
                    and visited[v] == 0
                ):
                    antichain.append((u, v))

            # Process predecessors
            for v in self.predecessors(u):
                if visited[v] == 1:  # Only visit nodes marked as reachable (1)
                    stack.append(v)

    DFS_find_reachable_from_source(self.source, visited)
    DFS_find_saturating(self.source, visited)

    # Internal sanity check: the weight of the antichain found must equal the flow cost.
    if use_custom_weights:
        assert minFlowCost == sum(
            map(lambda edge: weight_function[edge], antichain)
        )
    else:
        assert minFlowCost == len(antichain)

    return minFlowCost, antichain

decompose_using_max_bottleneck

decompose_using_max_bottleneck(
    flow_attr: str,
)

Decomposes the flow greedily into paths using the maximum bottleneck algorithm. This method iteratively finds the path with the maximum bottleneck capacity in the graph and decomposes the flow along that path. The process continues until no more paths can be found.

Note

The decomposition paths do not contain the global source or the global sink.

Returns

tuple: A tuple containing two lists:
- paths (list of lists): A list of paths, where each path is represented as a list of nodes.
- weights (list): A list of weights (bottleneck capacities) corresponding to each path.

Source code in flowpaths/stdigraph.py

def decompose_using_max_bottleneck(self, flow_attr: str):
    """
    Greedily decomposes the flow into paths with the maximum bottleneck algorithm.
    At every step, the path of maximum bottleneck capacity is extracted and its
    bottleneck is subtracted from the flow of each edge on that path. The loop
    stops as soon as no further path is found.

    !!! note "Note"
        The decomposition paths do not contain the global source or the global sink.

    Parameters
    ----------
    - flow_attr (str): The name of the edge attribute holding the flow values.

    Returns
    ----------
    - tuple: A tuple containing two lists:
        - paths (list of lists): A list of paths, where each path is represented
            as a list of nodes.
        - weights (list): A list of weights (bottleneck capacities) corresponding to each path.
    """

    # Working graph: same nodes and edges (with data) as this graph, minus the
    # global source and sink. Flow values are decremented on this working graph.
    residual = nx.DiGraph()
    residual.add_nodes_from(self.nodes())
    residual.add_edges_from(self.edges(data=True))
    residual.remove_nodes_from([self.source, self.sink])

    paths, weights = [], []

    bottleneck, path = graphutils.max_bottleneck_path(residual, flow_attr)
    while path is not None:
        # Subtract the bottleneck from every consecutive edge of the path.
        for tail, head in zip(path, path[1:]):
            residual[tail][head][flow_attr] -= bottleneck

        paths.append(path)
        weights.append(bottleneck)

        bottleneck, path = graphutils.max_bottleneck_path(residual, flow_attr)

    return (paths, weights)

get_flow_width

get_flow_width(
    flow_attr: str,
    edges_to_ignore: list = None,
) -> int

Calculate, store, and return the flow-width of the graph. The flow-width is computed as the minimum number of paths needed to cover all the edges, with the constraint that an edge cannot be covered more times than the flow value given as flow_attr in the edge data.

If the flow-width has already been computed, the stored value is returned.

Returns

int: The flow-width of the graph.

Source code in flowpaths/stdigraph.py

def get_flow_width(self, flow_attr: str, edges_to_ignore: list = None) -> int:
    """
    Calculate and return the [flow-width](https://arxiv.org/abs/2409.20278) of the graph.
    The flow-width is computed as the minimum number of paths needed to cover all the edges
    (except those in `edges_to_ignore`), with the constraint that an edge cannot be covered
    more times than the flow value given as `flow_attr` in the edge data.

    If the flow-width has already been computed and `edges_to_ignore` is empty,
    the stored value is returned. A value computed with a non-empty `edges_to_ignore`
    is returned but never stored, so it cannot be served to later calls.

    !!! note "Note"
        The stored value is not keyed by `flow_attr`.

    Parameters
    ----------
    - flow_attr (str): The name of the edge attribute holding the flow values.
            Edges lacking this attribute are given unbounded capacity.
    - edges_to_ignore (list): Edges (tuples) that need not be covered. Default is None.

    Returns
    ----------
    - int: The flow-width of the graph.
    """

    edges_to_ignore_set = set(edges_to_ignore or [])

    # Only the unrestricted flow-width is cached (same policy as get_width).
    use_cache = not edges_to_ignore_set

    if use_cache and self.flow_width is not None:
        return self.flow_width

    G_nx = nx.DiGraph()
    G_nx.add_nodes_from(self.nodes())

    for u, v in self.edges():
        # the cost of each path is 1 (paid on the edge leaving the global source)
        cost = 1 if u == self.source else 0

        # Original graph edges must be covered at least once, unless ignored;
        # global source / sink edges carry no demand.
        if (u, v) in edges_to_ignore_set:
            edge_demand = 0
        else:
            edge_demand = int(u != self.source and v != self.sink)
        edge_capacity = self[u][v].get(flow_attr, float('inf'))

        # adding the edge
        G_nx.add_edge(u, v, l=edge_demand, u=edge_capacity, c=cost)

    flow_width, _ = graphutils.min_cost_flow(G_nx, self.source, self.sink)

    if use_cache:
        self.flow_width = flow_width

    return flow_width

get_max_flow_value_and_check_non_negative_flow

get_max_flow_value_and_check_non_negative_flow(
    flow_attr: str,
    edges_to_ignore: set,
) -> float

Determines the maximum flow value in the graph and checks that all flow values are non-negative.

This method iterates over all edges in the graph, ignoring the edges given in edges_to_ignore. It checks if each edge has the required flow attribute given by flow_attr. If an edge does not have this attribute, a ValueError is raised. If an edge has a negative flow value, a ValueError is raised. The method returns the maximum flow value found among all edges.

Returns

float: The maximum flow value among all edges in the graph.

Raises

ValueError: If an edge does not have the required flow attribute.
ValueError: If an edge has a negative flow value.

Source code in flowpaths/stdigraph.py

def get_max_flow_value_and_check_non_negative_flow(
    self, flow_attr: str, edges_to_ignore: set
) -> float:
    """
    Determines the maximum flow value in the graph and checks that all flow values
    are non-negative.

    Every edge of the graph is inspected, except those in `edges_to_ignore`.
    An inspected edge must carry the attribute `flow_attr` and its value must not
    be negative; otherwise the problem is logged and a ValueError is raised.

    Parameters
    ----------
    - flow_attr (str): The name of the edge attribute holding the flow values.
    - edges_to_ignore (set): Edges (tuples) to skip. None is treated as the empty set.

    Returns
    -------
    - float: The maximum flow value among all inspected edges
        (`float("-inf")` if no edge was inspected).

    Raises
    -------
    - ValueError: If an edge does not have the required flow attribute.
    - ValueError: If an edge has a negative flow value.
    """

    ignored = set() if edges_to_ignore is None else edges_to_ignore
    largest = float("-inf")

    for tail, head, attrs in self.edges(data=True):
        if (tail, head) in ignored:
            continue

        if flow_attr not in attrs:
            message = f"Edge ({tail},{head}) does not have the required flow attribute '{flow_attr}'. Check that the attribute passed under 'flow_attr' is present in the edge data."
            utils.logger.error(message)
            raise ValueError(message)

        flow_value = attrs[flow_attr]
        if flow_value < 0:
            message = f"Edge ({tail},{head}) has negative flow value {flow_value}. All flow values must be >=0."
            utils.logger.error(message)
            raise ValueError(message)

        largest = max(largest, flow_value)

    return largest

get_non_zero_flow_edges

get_non_zero_flow_edges(
    flow_attr: str,
    edges_to_ignore: set = set(),
) -> set

Get all edges with non-zero flow values.

Returns

set: A set of edges (tuples) that have non-zero flow values.

Source code in flowpaths/stdigraph.py

def get_non_zero_flow_edges(
    self, flow_attr: str, edges_to_ignore: set = set()
) -> set:
    """
    Get all edges with non-zero flow values.

    Parameters
    ----------
    flow_attr : str
        The name of the edge attribute holding the flow values.
        Edges lacking this attribute are treated as having flow 0.
    edges_to_ignore : set
        Edges (tuples) to leave out of the result. None is accepted and
        treated as "ignore nothing". The default set is never mutated.

    Returns
    -------
    set
        A set of edges (tuples) that have non-zero flow values.
    """

    # Accept None like the other methods taking `edges_to_ignore`,
    # instead of failing on the membership test below.
    ignored = edges_to_ignore if edges_to_ignore is not None else ()

    return {
        (u, v)
        for u, v, data in self.edges(data=True)
        if (u, v) not in ignored and data.get(flow_attr, 0) != 0
    }

get_width

get_width(
    edges_to_ignore: list = None,
) -> int

Calculate and return the width of the graph. The width is computed as the minimum number of paths needed to cover all the edges of the graph, except those in the edges_to_ignore list.

If the width has already been computed and edges_to_ignore is empty, the stored value is returned.

Returns

int: The width of the graph.

Source code in flowpaths/stdigraph.py

def get_width(self, edges_to_ignore: list = None) -> int:
    """
    Calculate and return the width of the graph.
    The width is computed as the minimum number of paths needed to cover all the edges of the graph, 
    except those in the `edges_to_ignore` list. 

    If the width has already been computed and `edges_to_ignore` is empty,
    the stored value is returned. A width computed with a non-empty
    `edges_to_ignore` is returned but never stored, so that it cannot later be
    mistaken for the width of the whole graph.

    Parameters
    ----------
    - edges_to_ignore (list): Edges (tuples) that need not be covered. Default is None.

    Returns
    ----------
    - int: The width of the graph.
    """

    edges_to_ignore_set = set(edges_to_ignore or [])

    # Only the unrestricted width may be read from / written to the cache.
    use_cache = not edges_to_ignore_set

    if use_cache and self.width is not None:
        return self.width

    # Weight 1 for every edge that must be covered; ignored edges are left out
    # of the dictionary.
    weight_function = {e: 1 for e in self.edges() if e not in edges_to_ignore_set}
    width = self.compute_max_edge_antichain(get_antichain=False, weight_function=weight_function)

    if use_cache:
        self.width = width

    return width