Directed acyclic graphs with global source and global sink

This class is used in AbstractPathModelDAG as a wrapper (with unique global source and unique global sink) to pass the DAG to the ILP models.

stDAG

stDAG(
    base_graph: DiGraph,
    additional_starts: (
        list | None
    ) = None,
    additional_ends: (
        list | None
    ) = None,
)

Bases: AbstractSourceSinkGraph

Augmented DAG with global source/sink.

This class derives from AbstractSourceSinkGraph, which centralises the creation of a unique global source and sink and the shared flow utility helpers. Only DAG specific validation (acyclicity) and derived DAG-only structures (topological orders and reachability caches) remain here.

Source code in flowpaths/stdag.py

def __init__(
    self,
    base_graph: nx.DiGraph,
    additional_starts: list | None = None,
    additional_ends: list | None = None,
) -> None:
    """
    Initialise the augmented DAG from `base_graph`.

    All arguments are forwarded unchanged, by keyword, to the parent class
    initialiser; no additional work is performed here.

    Parameters
    ----------
    - base_graph (nx.DiGraph): The graph to wrap.
    - additional_starts (list | None): Forwarded as-is to the parent class.
            Presumably extra nodes to attach to the global source -- TODO confirm against the parent class.
            Default is None.
    - additional_ends (list | None): Forwarded as-is to the parent class.
            Presumably extra nodes to attach to the global sink -- TODO confirm against the parent class.
            Default is None.
    """
    super().__init__(
        base_graph=base_graph,
        additional_starts=additional_starts,
        additional_ends=additional_ends,
    )

compute_max_edge_antichain

compute_max_edge_antichain(
    get_antichain=False,
    weight_function=None,
)

Computes the maximum edge antichain in a directed graph.

Parameters

get_antichain (bool): If True, the function also returns the antichain along with its cost. Default is False.
weight_function (dict): A dictionary where keys are edges (tuples) and values are weights. If None, weight 1 is used for original graph edges, and weight 0 is used for global source / global sink edges. If given, the antichain weight is computed as the sum of the weights of the edges in the antichain, where edges missing from the dictionary get weight 0. Default is None.

Returns

If get_antichain is False, returns the size of the maximum edge antichain.
If get_antichain is True, returns a tuple containing the size of the maximum edge antichain and the antichain itself.

Source code in flowpaths/stdag.py

def compute_max_edge_antichain(self, get_antichain=False, weight_function=None):
    """
    Computes the maximum edge antichain in a directed graph.

    The value is obtained as the cost of a minimum-cost flow from the global source
    to the global sink in which every edge has a lower bound (its weight) and every
    edge leaving the global source costs 1.

    Parameters
    ----------
    - get_antichain (bool): If True, the function also returns the antichain along with its cost. Default is False.
    - weight_function (dict): A dictionary where keys are edges (tuples) and values are weights.
            If None, weight 1 is used for original graph edges, and weight 0 is used for global source / global sink edges.
            If given (even if empty), the antichain weight is computed as the sum of the weights of the edges
            in the antichain, where edges missing from the dictionary get weight 0.
            Default is None.

    Returns
    ----------
    - If get_antichain is False, returns the size of the maximum edge antichain.
    - If get_antichain is True, returns a tuple containing the
            size of the maximum edge antichain and the antichain (a list of edges).
    """

    # An empty dict is a legitimate weight function ("every edge has weight 0"),
    # so distinguish it from None explicitly instead of relying on truthiness.
    has_weights = weight_function is not None

    G_nx = nx.DiGraph()
    demand = dict()

    G_nx.add_nodes_from(self.nodes())

    for u, v in self.edges():
        # the cost of each path is 1, charged on its first edge (the one leaving the source)
        cost = 1 if u == self.source else 0

        if has_weights:
            edge_demand = weight_function.get((u, v), 0)
        else:
            edge_demand = int(u != self.source and v != self.sink)

        demand[(u, v)] = edge_demand
        # l = lower bound (demand), u = capacity, c = cost
        G_nx.add_edge(u, v, l=edge_demand, u=graphutils.bigNumber, c=cost)

    minFlowCost, minFlow = graphutils.min_cost_flow(G_nx, self.source, self.sink)

    if not get_antichain:
        return minFlowCost

    antichain = []
    # Node states: 0 = untouched, 1 = marked by the first pass, 2 = processed by the second pass.
    visited = {node: 0 for node in self.nodes()}

    # Both traversals use an explicit stack rather than recursion,
    # so that long paths cannot hit the interpreter's recursion limit.
    def DFS_find_reachable_from_source(start_node, visited):
        # Marks with 1 every node reachable from start_node by moving forward along
        # edges whose flow strictly exceeds their demand, or backward along any edge.
        stack = [start_node]

        while stack:
            u = stack.pop()
            if visited[u] != 0:
                continue

            assert u != self.sink
            visited[u] = 1

            for v in self.successors(u):
                if minFlow[u][v] > demand[(u, v)] and visited[v] == 0:
                    stack.append(v)

            for v in self.predecessors(u):
                if visited[v] == 0:
                    stack.append(v)

    def DFS_find_saturating(start_node, visited):
        # Walks the nodes marked 1 and collects the edges leaving the marked set
        # whose flow equals a positive demand; these edges form the antichain.
        stack = [start_node]

        while stack:
            u = stack.pop()

            if visited[u] != 1:
                continue

            visited[u] = 2

            for v in self.successors(u):
                if minFlow[u][v] > demand[(u, v)]:
                    if visited[v] == 1:  # only continue through nodes marked by the first pass
                        stack.append(v)
                elif (
                    minFlow[u][v] == demand[(u, v)]
                    and demand[(u, v)] >= 1
                    and visited[v] == 0
                ):
                    antichain.append((u, v))

            for v in self.predecessors(u):
                if visited[v] == 1:  # only continue through nodes marked by the first pass
                    stack.append(v)

    DFS_find_reachable_from_source(self.source, visited)
    DFS_find_saturating(self.source, visited)

    # Internal consistency check: the flow cost must equal the antichain weight.
    if has_weights:
        assert minFlowCost == sum(weight_function[edge] for edge in antichain)
    else:
        assert minFlowCost == len(antichain)

    return minFlowCost, antichain

decompose_using_max_bottleneck

decompose_using_max_bottleneck(
    flow_attr: str,
)

Decomposes the flow greedily into paths using the maximum bottleneck algorithm. This method iteratively finds the path with the maximum bottleneck capacity in the graph and decomposes the flow along that path. The process continues until no more paths can be found.

Note

The decomposition paths do not contain the global source or the global sink.

Returns

tuple: A tuple containing two lists:
- paths (list of lists): A list of paths, where each path is represented as a list of nodes.
- weights (list): A list of weights (bottleneck capacities) corresponding to each path.

Source code in flowpaths/stdag.py

def decompose_using_max_bottleneck(self, flow_attr: str):
    """
    Greedily decomposes the flow into weighted paths with the maximum bottleneck heuristic.

    A separate graph is built from this graph's nodes and edges (including edge data),
    with the global source and sink removed. Repeatedly, a maximum-bottleneck path is
    requested from `graphutils.max_bottleneck_path`, its bottleneck value is subtracted
    from `flow_attr` on every edge of the path, and the path is recorded. The loop stops
    as soon as no path is returned.

    !!! note "Note"
        The decomposition paths do not contain the global source or the global sink.

    Parameters
    ----------
    - flow_attr (str): Name of the edge attribute holding the flow values.

    Returns
    ----------
    - tuple: A tuple containing two lists:
        - paths (list of lists): The extracted paths, each given as a list of nodes.
        - weights (list): The bottleneck value of each path, in the same order as `paths`.
    """

    residual = nx.DiGraph()
    residual.add_nodes_from(self.nodes())
    residual.add_edges_from(self.edges(data=True))
    residual.remove_nodes_from([self.source, self.sink])

    paths = []
    weights = []

    bottleneck, path = graphutils.max_bottleneck_path(residual, flow_attr)
    while path is not None:
        # Remove the extracted flow from every consecutive pair of nodes on the path.
        for tail, head in zip(path, path[1:]):
            residual[tail][head][flow_attr] -= bottleneck

        paths.append(path)
        weights.append(bottleneck)

        bottleneck, path = graphutils.max_bottleneck_path(residual, flow_attr)

    return (paths, weights)

get_flow_width

get_flow_width(
    flow_attr: str,
    edges_to_ignore: list = None,
) -> int

Calculate, store, and return the flow-width of the graph. The flow-width is computed as the minimum number of paths needed to cover all the edges, with the constraint that an edge cannot be covered more times than the flow value given as flow_attr in the edge data.

If the flow-width has already been computed, the stored value is returned.

Returns

int: The flow-width of the graph.

Source code in flowpaths/stdag.py

def get_flow_width(self, flow_attr: str, edges_to_ignore: list = None) -> int:
    """
    Calculate and return the [flow-width](https://arxiv.org/abs/2409.20278) of the graph.
    The flow-width is computed as the minimum number of paths needed to cover all the edges
    (except those in `edges_to_ignore`), with the constraint that an edge cannot be covered
    more times than the flow value given as `flow_attr` in the edge data.

    If the flow-width has already been computed and `edges_to_ignore` is empty,
    the stored value is returned. A result computed with a non-empty `edges_to_ignore`
    is returned but not stored, so that it can never be handed back to a later call
    made with a different set of ignored edges (same policy as `get_width`).

    Parameters
    ----------
    - flow_attr (str): Name of the edge attribute holding the flow values. Edges without
            this attribute are treated as having unbounded capacity.
    - edges_to_ignore (list): Edges that do not need to be covered. Default is None.

    Returns
    ----------
    - int: The flow-width of the graph.
    """

    edges_to_ignore_set = set(edges_to_ignore or [])
    # NOTE(review): the stored value is not keyed on `flow_attr`; calling this with two
    # different attributes and no ignored edges still returns the first result -- confirm
    # whether callers ever do that.
    use_cache = not edges_to_ignore_set

    if use_cache and self.flow_width is not None:
        return self.flow_width

    G_nx = nx.DiGraph()
    G_nx.add_nodes_from(self.nodes())

    for u, v in self.edges():
        # the cost of each path is 1, charged on its first edge (the one leaving the source)
        cost = 1 if u == self.source else 0

        # Ignored edges and edges touching the global source / sink need not be covered.
        if (u, v) in edges_to_ignore_set:
            edge_demand = 0
        else:
            edge_demand = int(u != self.source and v != self.sink)
        edge_capacity = self[u][v].get(flow_attr, float('inf'))

        # l = lower bound (demand), u = capacity, c = cost
        G_nx.add_edge(u, v, l=edge_demand, u=edge_capacity, c=cost)

    minFlowCost, _ = graphutils.min_cost_flow(G_nx, self.source, self.sink)

    if use_cache:
        self.flow_width = minFlowCost

    return minFlowCost

get_width

get_width(
    edges_to_ignore: list = None,
) -> int

Calculate and return the width of the graph. The width is computed as the minimum number of paths needed to cover all the edges of the graph, except those in the edges_to_ignore list.

If the width has already been computed and edges_to_ignore is empty, the stored value is returned.

Returns

int: The width of the graph.

Source code in flowpaths/stdag.py

def get_width(self, edges_to_ignore: list = None) -> int:
    """
    Calculate and return the width of the graph.
    The width is the minimum number of paths needed to cover all the edges of the graph,
    except those in the `edges_to_ignore` list. It is obtained from
    `compute_max_edge_antichain`, giving weight 1 to every edge that is not ignored.

    The result is stored, and a stored result is reused, only when `edges_to_ignore`
    is None or empty.

    Parameters
    ----------
    - edges_to_ignore (list): Edges that do not need to be covered. Default is None.

    Returns
    ----------
    - int: The width of the graph.
    """

    nothing_ignored = edges_to_ignore is None or len(edges_to_ignore) == 0

    if nothing_ignored and self.width is not None:
        return self.width

    ignored = set(edges_to_ignore or [])

    unit_weights = {}
    for edge in self.edges():
        if edge not in ignored:
            unit_weights[edge] = 1

    result = self.compute_max_edge_antichain(get_antichain=False, weight_function=unit_weights)

    # Only the unrestricted width is cached; a restricted one depends on the ignore list.
    if nothing_ignored:
        self.width = result

    return result