Source code for flowno.core.flow.flow

"""
Flow execution and graph resolution module for Flowno.

This module contains the Flow class, which is the core execution engine for dataflow graphs.
It manages node scheduling, dependency resolution, cycle breaking, and concurrent execution.

Key components:
    - Flow: The main dataflow graph execution engine
    - FlowEventLoop: A custom event loop for handling Flow-specific commands
    - NodeTaskStatus: State tracking for node execution
"""

from contextvars import ContextVar
import logging
from collections import defaultdict, deque
from collections.abc import AsyncGenerator, Awaitable, Coroutine, Generator
from dataclasses import dataclass
from types import coroutine
from typing import Any, Callable, NamedTuple, Optional, TypeAlias, cast

from flowno.core.event_loop.commands import Command, StreamCancelCommand
from flowno.core.event_loop.event_loop import EventLoop
from flowno.core.event_loop.instrumentation import EventLoopInstrument
from flowno.core.event_loop.queues import AsyncQueue, AsyncSetQueue, QueueClosedError
from flowno.core.event_loop.types import RawTask, TaskHandlePacket
from flowno.core.flow.instrumentation import get_current_flow_instrument
from flowno.core.node_base import (
    DraftInputPortRef,
    DraftNode,
    FinalizedInputPort,
    FinalizedInputPortRef,
    FinalizedNode,
    MissingDefaultError,
    NodeContextFactoryProtocol,
    Nothing,
    Some,
    Stream,
    StreamCheckCommand,
    StreamWaitCommand,
    SuperNode,
    StreamCancelled,
)
from flowno.core.types import DataGeneration, Generation, InputPortIndex, OutputPortIndex
from flowno.utilities.helpers import cmp_generation, clip_generation, inc_generation, main_generation, parent_generation, stitched_generation
from flowno.utilities.logging import log_async
from typing_extensions import Never, Unpack, override

logger = logging.getLogger(__name__)

AnyFinalizedNode: TypeAlias = FinalizedNode[Unpack[tuple[Any, ...]], tuple[Any, ...]]
ObjectFinalizedNode: TypeAlias = FinalizedNode[
    Unpack[tuple[object, ...]], tuple[object, ...]]

# Key for stream consumer state: (consumer_node, input_port, producer_node, output_port, run_level)
# This is stable across RL0 cycles unlike Stream object identity
StreamStateKey: TypeAlias = tuple[
    FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],  # consumer
    int,  # consumer input port index
    FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],  # producer
    int,  # producer output port index
    int,  # run level
]

_current_flow: "Flow | None" = None


[docs]
def current_flow() -> "Flow | None":
    """Get the currently executing Flow instance.
    
    Returns:
        The current Flow instance, or None if not in a Flow context.
    """
    global _current_flow

    return _current_flow



[docs]
def current_node() -> AnyFinalizedNode | None:
    """Get the current node from the FlowEventLoop's task context."""
    from flowno.core.event_loop import current_task

    task = current_task()
    flow = current_flow()
    if flow is None:
        return None

    # TODO: replace the data structure with a more efficient reversible mapping
    for node, task_and_status in flow.node_tasks.items():
        if task_and_status.task is task:
            return node

    return None


# Near the top with other module-level functions

[docs]
def current_context() -> Any:
    """Get the context for the currently executing node. Calls the context factory provided to run_until_complete().
    
    Returns:
        The NodeContext for the current node.
        
    Raises:
        RuntimeError: If called outside a flow, outside a node, or if no context factory was provided.
    """
    flow = current_flow()
    if flow is None:
        raise RuntimeError("current_context() called outside of a flow")
    
    node = current_node()
    if node is None:
        raise RuntimeError("current_context() called outside of a node")

    if flow._context_factory is None:
        raise RuntimeError("No context factory provided to run_until_complete()")

    return flow._context_factory(node)



[docs]
@dataclass
class WaitForStartNextGenerationCommand(Command):
    """Command to wait for a node to start its next generation.
    
    .. warning::
        If this command is handled before the resolution queue is pushed with new nodes,
        and the resolution queue is empty, the resolution queue will be closed, causing the flow to terminate.
    """

    node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    run_level: int = 0




[docs]
@coroutine
def _wait_for_start_next_generation(
    node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
    run_level: int = 0,
) -> Generator[WaitForStartNextGenerationCommand, None, None]:
    """Coroutine that yields a command to wait for a node's next generation."""
    return (yield WaitForStartNextGenerationCommand(node, run_level))




[docs]
@dataclass
class TerminateWithExceptionCommand(Command):
    """Command to terminate the flow with an exception."""

    node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    exception: Exception




[docs]
@coroutine
def _terminate_with_exception(
    node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
    exception: Exception,
) -> Generator[TerminateWithExceptionCommand, None, None]:
    """Coroutine that yields a command to terminate with an exception."""
    return (yield TerminateWithExceptionCommand(node, exception))




[docs]
@dataclass
class TerminateReachedLimitCommand(Command):
    """Command to terminate the flow because a node reached its generation limit."""

    pass




[docs]
@coroutine
def _terminate_reached_limit() -> Generator[TerminateReachedLimitCommand, None, None]:
    """Coroutine that yields a command to terminate when a generation limit is reached."""
    return (yield TerminateReachedLimitCommand())




[docs]
class TerminateLimitReached(Exception):
    """Exception raised when a node reaches its generation limit."""

    pass




[docs]
class NodeExecutionError(Exception):
    """Exception raised when a node execution fails."""

    node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]

    def __init__(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        super().__init__(f"Exception in node {node}")
        self.node = node




[docs]
@dataclass
class ResumeNodesCommand(Command):
    """Command to resume execution of one or more nodes."""

    nodes: list[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]]




[docs]
@coroutine
def _resume_nodes(
    nodes: list[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]],
) -> Generator[ResumeNodesCommand, None, None]:
    """Resume the concurrent node tasks. Does not guarantee that the nodes will resume if already running."""
    return (yield ResumeNodesCommand(nodes))




[docs]
class NodeTaskStatus:
    """
    Represents the possible states of a node's task within the flow execution.

    States:
        - Queued: The node is queued to be executed (in the event loop task queue).
        - Executing: The node task is currently executing (task.send/throw is being called).
        - WaitingForStartNextGeneration: The node is waiting to start its next generation.
        - Error: The node encountered an error during execution.
        - Stalled: The node is blocked waiting on input data.
    """


[docs]
    @dataclass(frozen=True)
    class Queued:
        """Node is queued to be executed."""

        pass



[docs]
    @dataclass(frozen=True)
    class Executing:
        """Node is currently being executed (task.send/throw is being called)."""

        pass



[docs]
    @dataclass(frozen=True)
    class WaitingForStartNextGeneration:
        """Node is waiting to start its next generation."""

        run_level: int



[docs]
    @dataclass(frozen=True)
    class Error:
        """Node encountered an error during execution."""

        pass



[docs]
    @dataclass(frozen=True)
    class Stalled:
        """Node is stalled waiting for input data."""

        stalling_input: FinalizedInputPortRef[object]


    Type: TypeAlias = Queued | Executing | WaitingForStartNextGeneration | Error | Stalled




[docs]
class NodeTaskAndStatus(NamedTuple):
    """Container for a node's task and its current status."""

    task: RawTask[Command, object, Never]
    status: NodeTaskStatus.Type




[docs]
@dataclass
class StreamConsumerState:
    """Tracks the consumption state of a stream consumer.

    This state is used to determine when to return data, stall waiting
    for the producer, or raise StopAsyncIteration (stream complete).
    """
    last_consumed_generation: Generation | None = None
    cancelled_after_consuming_generation: Optional[Generation] = None




[docs]
class Flow:
    """
    Dataflow graph execution engine.

    The Flow class manages the execution of a dataflow graph, handling dependency
    resolution, node scheduling, and cycle breaking. It uses a custom event loop
    to execute nodes concurrently while respecting data dependencies.

    Key features:
        - Automatic dependency-based scheduling
        - Cycle detection and resolution
        - Support for streaming data (run levels)
        - Concurrency management

    Attributes:
        unvisited: List of nodes that have not yet been visited during execution
        visited: Set of nodes that have been visited
        node_tasks: Dictionary mapping nodes to their tasks and status
        resolution_queue: Queue of nodes waiting to be resolved
    """

    # Classvar as instance init
    counter: int = 0

    # Instance attribute types
    unvisited: list[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]]
    visited: set[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]]
    _stop_at_node_generation: (
        dict[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], Generation]
        | Generation
    )

    node_tasks: dict[
        FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], NodeTaskAndStatus
    ]
    resolution_queue: AsyncSetQueue[
        FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ]
    _defaulted_inputs: defaultdict[
        FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        list[InputPortIndex],
    ]
    _cancelled_streams: defaultdict[
        FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], set[Stream]
    ]
    _stream_consumer_state: defaultdict[StreamStateKey, "StreamConsumerState"]
    _stalled_stream_consumers: dict[
        tuple[FinalizedNode[Any, Any], int],
        list[tuple[RawTask[Command, Any, Any], StreamStateKey]],
    ]
    # Track which specific stream connections have been cancelled
    # Key is the StreamStateKey tuple: (consumer, input_port, producer, output_port, run_level)
    # This is cleared when the stream resets (new generation)
    _cancelled_stream_connections: set["StreamStateKey"]
    _context_factory: Callable[["FinalizedNode"], Any] | None

    resumable: bool
    event_loop: "FlowEventLoop"

    def __init__(self, is_finalized: bool = True):
        """
        Initialize a new Flow instance.

        Args:
            is_finalized: Whether the nodes in this flow are already finalized.
        """
        self.resumable = False
        self.event_loop = FlowEventLoop(self)

        self.counter = Flow.counter
        Flow.counter += 1

        self._active_nodes = set()
        self._processing_queue_item = False
        self._pending_node_completions = 0  # Nodes resumed but not yet yielded WaitForStartNextGeneration
        self._main_loop_has_item = False  # True while main loop has gotten an item but not finished processing

        self.unvisited = []
        self.visited = set()
        self._stop_at_node_generation = None
        self.node_tasks = {}
        self.resolution_queue = AsyncSetQueue()
        self._defaulted_inputs = defaultdict(list)
        self._cancelled_streams = defaultdict(set)
        self._stream_consumer_state = defaultdict(StreamConsumerState)
        self._stalled_stream_consumers = defaultdict(list)
        self._cancelled_stream_connections = set()
        self._context_factory = None

    @property
    def active_nodes(self) -> int:
        return len(self._active_nodes)


[docs]
    def set_node_status(
        self,
        node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        status: NodeTaskStatus.Type,
    ) -> None:
        """
        Update the status of a node and notify instrumentation.

        Args:
            node: The node whose status is being updated
            status: The new status to set
        """
        old_status = self.node_tasks[node].status
        get_current_flow_instrument().on_node_status_change(
            self, node, old_status, status
        )
        self.node_tasks[node] = self.node_tasks[node]._replace(status=status)



[docs]
    def set_defaulted_inputs(
        self,
        node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        defaulted_inputs: list[InputPortIndex],
    ) -> None:
        """
        Mark specific inputs of a node as using default values.

        When a node uses default values for inputs that are part of a cycle,
        this method records that information and increments the stitch level
        to prevent infinite recursion.

        Args:
            node: The node with defaulted inputs
            defaulted_inputs: List of input port indices using default values
        """
        self._defaulted_inputs[node] = defaulted_inputs
        for input_port_index in defaulted_inputs:
            node._input_ports[input_port_index].stitch_level_0 += 1
        get_current_flow_instrument().on_defaulted_inputs_set(
            self, node, defaulted_inputs
        )



[docs]
    def clear_defaulted_inputs(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ) -> None:
        """
        Remove defaulted input information for a node.

        Args:
            node: The node to clear defaulted inputs for
        """
        _ = self._defaulted_inputs.pop(node, None)



[docs]
    def is_input_defaulted(
        self,
        node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        input_port: InputPortIndex,
    ) -> bool:
        """
        Check if a specific input port is using a default value.

        Args:
            node: The node to check
            input_port: The input port index to check

        Returns:
            True if the input port is using a default value, False otherwise
        """
        return input_port in self._defaulted_inputs[node]



[docs]
    async def _terminate_if_reached_limit(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        """
        Check if a node has reached its generation limit and terminate if so.

        Args:
            node: The node to check

        Raises:
            TerminateLimitReached: If the node reached its generation limit
        """
        if isinstance(self._stop_at_node_generation, dict):
            stop_generation = self._stop_at_node_generation.get(node, ())
        else:
            stop_generation = self._stop_at_node_generation

        if cmp_generation(node.generation, stop_generation) >= 0:
            get_current_flow_instrument().on_node_generation_limit(
                self, node, stop_generation
            )
            await _terminate_reached_limit()



[docs]
    def _stall_stream_consumer(
        self,
        consumer_node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        producer_node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        stream: Stream[object],
        consumer_task: Generator[object, object, object],
        state_key: StreamStateKey,
        event_loop: EventLoop,
    ) -> None:
        """
        Stall a stream consumer and potentially wake the producer.
        
        Called when a consumer requests stream data that isn't available yet.
        Updates consumer status, registers it for notification when data arrives,
        and enqueues the producer if it's idle.
        
        PRODUCER STATUS → ACTION:
        - WaitingForStartNextGeneration: Enqueue (producer is idle)
        - Stalled: Enqueue (producer blocked, needs cycle resolution)
        - Queued: No action (already pending)
        - Executing: No action (will push data when it yields)
        - Error: End stream with StopAsyncIteration
        """
        # Mark consumer as stalled
        self.set_node_status(consumer_node, NodeTaskStatus.Stalled(stream.input))
        self._active_nodes.discard(consumer_node)
        logger.debug(f"Active nodes: {self.active_nodes} (Stall {consumer_node})")
        get_current_flow_instrument().on_node_stalled(self, consumer_node, stream.input)
        
        # Register for notification when producer pushes data
        self._stalled_stream_consumers[(producer_node, stream.output.port_index)].append(
            (consumer_task, state_key)
        )
        
        # Check producer status and take appropriate action
        producer_status = self.node_tasks[producer_node].status

        match producer_status:
            case NodeTaskStatus.WaitingForStartNextGeneration() | NodeTaskStatus.Stalled():
                # Producer idle or blocked - enqueue to wake it up
                # Don't change status here - let ResumeNodesCommand handler do it
                # when it actually adds the task to the event loop queue
                self.resolution_queue.put_nowait(producer_node, event_loop)
                    
            case NodeTaskStatus.Queued() | NodeTaskStatus.Executing():
                # Producer already active - it will push data when it yields
                pass
                
            case NodeTaskStatus.Error():
                # Producer failed - Raise a runtime exception in the consumer?
                # TODO
                raise NotImplementedError("Handling producer error not implemented yet.")



[docs]
    async def _handle_coroutine_node(
        self,
        node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        returned: Awaitable[tuple[object, ...]],
    ):
        """
        Handle a node that returns a coroutine (single output).

        This awaits the result of the node's coroutine and stores the
        result in the node's data.

        Args:
            node: The node to handle
            returned: The coroutine returned by the node's call
        """
        # this is already part of run_level 0 lifecyce instrumentation context
        # in evaluate_node
        result = await returned

        # Wait for the last output data to have been read before overwriting
        with get_current_flow_instrument().on_barrier_node_write(self, node, result, 0):
            await node._barrier0.wait()
        node.push_data(result, 0)
        # Remember how many times output data must be read
        node._barrier0.set_count(len(node.get_output_nodes_by_run_level(0)))

        get_current_flow_instrument().on_node_emitted_data(self, node, result, 0)



[docs]
    async def _handle_async_generator_node(
        self,
        node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        returned: AsyncGenerator[tuple[object, ...], None],
    ):
        """
        Handle a node that returns an async generator (streaming output).

        This processes each yielded item from the generator, storing them
        as run level 1 data, and accumulates them for the final run level 0
        result when the generator completes.

        Args:
"""
        """
        Handle a node that returns an async generator (streaming output).

        This processes each yielded item from the generator, storing them
        as run level 1 data, and accumulates them for the final run level 0
        result when the generator completes.

        Args:
            node: The node to handle
            returned: The async generator returned by the node's call
        """
        acc: tuple[object, ...] | None = None

        # Clear any cancelled stream connections where this node is the producer.
        # This ensures cancellations from previous generations don't affect the new generation.
        if self._cancelled_stream_connections:  # Quick check before iterating
            for state_key in list(self._cancelled_stream_connections):
                # state_key = (consumer, input_port, producer, output_port, run_level)
                if state_key[2] is node:  # producer is this node
                    logger.debug(f"🧹 Clearing cancelled stream connection {state_key} for new generation of {node}")
                    self._cancelled_stream_connections.discard(state_key)

        try:
            while True:
                cancelled_streams = self._cancelled_streams.get(node, set())
                logger.debug(f"_node_gen_lifecycle loop start for {node}, cancelled_streams={cancelled_streams}")
                if cancelled_streams:
                    logger.info(f"Cancelling streams for {node}: {cancelled_streams}", extra={"tag": "flow"})
                    # Make a copy before clearing so the local variable remains truthy
                    cancelled_streams = cancelled_streams.copy()
                    self._cancelled_streams[node].clear()

                    # this node has a set of output streams that have been cancelled
                    # currently, there can only be one output stream, but I'm trying
                    # to think ahead to multiple output streams.

                # already part of run_level 0 lifecycle
                    
                with get_current_flow_instrument().node_lifecycle(
                    self, node, run_level=1
                ):
                    if cancelled_streams:
                        # inform the async generator of the cancelled stream
                        # (assumes one output stream for now)
                        try:
                            result = await returned.athrow(
                                StreamCancelled(stream=next(iter(cancelled_streams)))
                            )
                            # If the generator yields after a stream cancellation,
                            # that just means the node wants to disregard the consumer's
                            # cancellation request and continue producing data.
                        except StopAsyncIteration as e:
                            raise
                    else:
                        result = await anext(returned)

                if acc is None:
                    acc = result
                else:
                    try:
                        acc = tuple(
                            node._draft_node.accumulate_streamed_data(acc, result)
                        )
                    except NotImplementedError:
                        acc = None

                # Push this iteration's data
                node.push_data(result, 1)

                node._barrier1.set_count(len(node.get_output_nodes_by_run_level(1)))

                get_current_flow_instrument().on_node_emitted_data(
                    self, node, result, 1
                )

                await self._terminate_if_reached_limit(node)
                await self._enqueue_output_nodes(node)

                # Wait for this iteration's data to be consumed before proceeding
                with get_current_flow_instrument().on_barrier_node_write(
                    self, node, result, 1
                ):
                    await node._barrier1.wait()

                await _wait_for_start_next_generation(node, 1)

        except (StreamCancelled, StopAsyncIteration) as e:
            # Stream completed (either cancelled or naturally finished)
            # If StopAsyncIteration has args, use that as the final value (from explicit raise)
            # Otherwise use the accumulated run level 0 value
            # Note: The last run level 1 chunk's barrier was already waited on in the loop above

            # If StreamCancelled, propagate cancellation to all streaming input ports.
            # This ensures that when an intermediate node receives StreamCancelled and
            # either reraises it or leaves it unhandled, the cancellation automatically
            # propagates upstream through the entire pipeline.
            if isinstance(e, StreamCancelled):
                logger.info(f"Propagating StreamCancelled from {node} to input streams", extra={"tag": "flow"})
                for input_port_index, input_port in node._input_ports.items():
                    if input_port.minimum_run_level > 0 and input_port.connected_output is not None:
                        # This is a streaming input - cancel it to propagate upstream
                        input_stream = Stream(node.input(input_port_index), input_port.connected_output)
                        logger.debug(f"Cancelling input stream {input_stream} for {node}")
                        await input_stream.cancel()

            if isinstance(e, StopAsyncIteration) and e.args:
                # User explicitly passed a final value via raise StopAsyncIteration(value)
                # The wrapper should have already wrapped it in a tuple
                data = e.args[0] if isinstance(e.args[0], tuple) else (e.args[0],)
            elif acc is None:
                data = None
            else:
                data = acc

            # Wait for the last output data to have been read before overwriting
            with get_current_flow_instrument().on_barrier_node_write(self, node, data, 0):
                await node._barrier0.wait()

            node.push_data(data, 0)

            # Clear cancelled stream connections for this producer now that it's completed,
            # but ONLY for consumers that are stalled waiting for StopAsyncIteration.
            # Consumers that already completed (not stalled) shouldn't be re-enqueued.
            if self._cancelled_stream_connections:
                for state_key in list(self._cancelled_stream_connections):
                    if state_key[2] is node:  # producer is this node
                        consumer_node = state_key[0]
                        consumer_status = self.node_tasks[consumer_node].status
                        if isinstance(consumer_status, NodeTaskStatus.Stalled):
                            logger.debug(f"🧹 Clearing cancelled stream connection {state_key} for stalled consumer")
                            self._cancelled_stream_connections.discard(state_key)
                        else:
                            logger.debug(f"🔒 Keeping cancelled stream connection {state_key} (consumer not stalled)")

            # Remember how many times output data must be read
            node._barrier0.set_count(len(node.get_output_nodes_by_run_level(0)))

            get_current_flow_instrument().on_node_emitted_data(self, node, data, 0)

        except Exception as e:
            # python reraises any exception raised in the async generator as RuntimeError
            # `Exception.__cause__` is the original exception
            if isinstance(e.__cause__, StopAsyncIteration):
                # completion with explicit `raise StopAsyncIteration("final value")`
                # Note: The last run level 1 chunk's barrier was already waited on in the loop above
                if not isinstance(e.__cause__.args[0], tuple):
                    raise ValueError(
                        (
                            "The final value of a node async generator must ",
                            f"be a tuple. Got: {e.__cause__.args[0]}. If ",
                            "you use the @node.tuple decorator you are ",
                            "responsible for wrapping the final value in ",
                            "a tuple.",
                        )
                    )
                data: tuple[object, ...] = e.__cause__.args[0]

                # Wait for the last output data to have been read before overwriting
                with get_current_flow_instrument().on_barrier_node_write(self, node, data, 0):
                    await node._barrier0.wait()
                node.push_data(data, 0)

                # Clear cancelled stream connections for stalled consumers only.
                if self._cancelled_stream_connections:
                    for state_key in list(self._cancelled_stream_connections):
                        if state_key[2] is node:
                            consumer_node = state_key[0]
                            consumer_status = self.node_tasks[consumer_node].status
                            if isinstance(consumer_status, NodeTaskStatus.Stalled):
                                logger.debug(f"🧹 Clearing cancelled stream connection {state_key} for stalled consumer")
                                self._cancelled_stream_connections.discard(state_key)

                # Remember how many times output data must be read
                node._barrier0.set_count(len(node.get_output_nodes_by_run_level(0)))

                get_current_flow_instrument().on_node_emitted_data(self, node, data, 0)
            else:
                raise



[docs]
    @log_async
    async def evaluate_node(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ) -> Never:
        """
        The persistent task that evaluates a node.

        This is the main execution function for a node. It:
            1. Waits for the node to be ready to run
            2. Gathers inputs and handles defaulted values
            3. Calls the node with its inputs
            4. Processes the result (either coroutine or async generator)
            5. Propagates outputs to dependent nodes
            6. Repeats

        Args:
            node: The node to evaluate

        Returns:
            Never returns; runs as a persistent coroutine

        Raises:
            NotImplementedError: If the node does not return a coroutine or async generator
        """
        while True:
            await _wait_for_start_next_generation(node, 0)
            with get_current_flow_instrument().node_lifecycle(self, node, run_level=0):
                positional_arg_values, defaulted_inputs = node.gather_inputs()

                await node.count_down_upstream_latches(defaulted_inputs)

                try:
                    self.set_defaulted_inputs(node, defaulted_inputs)
                    returned = node.call(*positional_arg_values)

                    # make sure the user used async def.
                    if not isinstance(returned, (Coroutine, AsyncGenerator)):
                        raise NotImplementedError(
                            "Node must be a coroutine (async def) or an AsyncGenerator (async def with yield)"
                        )

                    if isinstance(returned, Coroutine):
                        await self._handle_coroutine_node(node, returned)
                    else:
                        await self._handle_async_generator_node(node, returned)
                except Exception as e:
                    get_current_flow_instrument().on_node_error(self, node, e)
                    # if self.node_unhandled_exception_terminates:
                    await _terminate_with_exception(node, e)
                finally:
                    self.clear_defaulted_inputs(node)
                    await self._terminate_if_reached_limit(node)
                    await self._enqueue_output_nodes(node)



[docs]
    def add_node(self, node: FinalizedNode[Unpack[tuple[Any, ...]], tuple[Any, ...]]):
        """
        Add a node to the flow.

        Args:
            node: The node to add
        """
        if node in self.unvisited:
            return

        get_current_flow_instrument().on_node_registered(self, node)
        self.unvisited.append(node)
        self._register_node(node)



[docs]
    def _register_node(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        """
        Register a node's task with the flow.

        This creates the persistent task for the node and adds it to the node_tasks dictionary.

        Args:
            node: The node to register
        """
        task: RawTask[Command, object, Never] = self.evaluate_node(node)
        # prime the coroutine. I choose to structure the evaluate_node while loop this way so
        # it needs to be primed once to get rid of the unawaited coroutine warning
        _ = task.send(None)
        self.node_tasks[node] = NodeTaskAndStatus(task, NodeTaskStatus.WaitingForStartNextGeneration(-1))



[docs]
    def _mark_node_as_visited(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        """
        Mark a node as visited during the resolution process.

        Args:
            node: The node to mark as visited
        """
        get_current_flow_instrument().on_node_visited(self, node)

        if node in self.unvisited:
            # this proves that the node is connected to the graph
            self.unvisited.remove(node)
            self.visited.add(node)
        elif node not in self.visited:
            # current node has not been registered by .add_node()
            self.visited.add(node)
            self._register_node(node)



[docs]
    def add_nodes(
        self, nodes: list[FinalizedNode[Unpack[tuple[Any, ...]], tuple[Any, ...]]]
    ):
        """
        Add multiple nodes to the flow.

        Args:
            nodes: The nodes to add
        """
        for node in nodes:
            self.add_node(node)



[docs]
    async def _enqueue_output_nodes(
        self, out_node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        """
        Enqueue all nodes that depend on the given node.

        Args:
            out_node: The node whose dependents should be enqueued
        """
        logger.debug(f"🔍 _enqueue_output_nodes called for {out_node}, queue {id(self.resolution_queue)} closed={self.resolution_queue.closed}, active_nodes={self.active_nodes}")
        if not self.resolution_queue.closed:
            nodes_to_enqueue = []
            all_output_nodes = out_node.get_output_nodes()
            logger.debug(f"🔍 Output nodes of {out_node}: {all_output_nodes}")

            for output_node in all_output_nodes:
                # Check if this specific stream connection was cancelled
                # Only skip if THIS specific (consumer, producer, stream) was cancelled
                should_skip = False
                if self._cancelled_stream_connections:  # Quick check before iterating
                    for input_port_idx, input_port in output_node._input_ports.items():
                        if (input_port.connected_output is not None and
                            input_port.connected_output.node is out_node and
                            input_port.minimum_run_level == 1):
                            # This is a streaming connection from out_node to output_node
                            state_key: StreamStateKey = (
                                output_node,
                                input_port_idx,
                                out_node,
                                input_port.connected_output.port_index,
                                1,  # run_level
                            )
                            if state_key in self._cancelled_stream_connections:
                                logger.debug(f"🔍 Skipping enqueue of {output_node} - this specific stream was cancelled")
                                should_skip = True
                                break

                if should_skip:
                    continue

                nodes_to_enqueue.append(output_node)
                get_current_flow_instrument().on_resolution_queue_put(self, output_node)

            logger.debug(f"🔍 Enqueueing {len(nodes_to_enqueue)} nodes: {nodes_to_enqueue}")
            await self.resolution_queue.putAll(nodes_to_enqueue)
        else:
            logger.debug(f"🔍 Skipping enqueue because queue is closed")



[docs]
    async def _enqueue_node(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ):
        """
        Enqueue a single node for resolution.

        Args:
            node: The node to enqueue
        """
        get_current_flow_instrument().on_resolution_queue_put(self, node)
        await self.resolution_queue.put(node)



[docs]
    def run_until_complete(
        self,
        stop_at_node_generation: (
            dict[
                FinalizedNode[Unpack[tuple[Any, ...]], tuple[Any, ...]]
                | DraftNode[Unpack[tuple[Any, ...]], tuple[Any, ...]],
                Generation,
            ]
            | Generation
        ) = (),
        terminate_on_node_error: bool = False,
        _debug_max_wait_time: float | None = None,
        context_factory: Callable[["FinalizedNode"], Any] | None = None,
    ):
        """
        Execute the flow until completion or until a termination condition is met.

        This is the main entry point for running a flow. It starts the resolution
        process and runs until all nodes have completed or a termination condition
        (like reaching a generation limit or an error) is met.

        Args:
            stop_at_node_generation: Generation limit for nodes, either as a global
                limit or as a dict mapping nodes to their individual limits
            terminate_on_node_error: Whether to terminate the flow if a node raises an exception
            _debug_max_wait_time: Maximum time in seconds to wait for I/O operations
                (useful for debugging)

        Raises:
            Exception: Any exception raised by nodes and not caught
            TerminateLimitReached: When a node reaches its generation limit
        """
        global _current_flow
        _current_flow = self

        if context_factory:
            self._context_factory = context_factory
        else:
            self._context_factory = None

        self.event_loop.run_until_complete(
            self._node_resolve_loop(
                cast(
                    dict[
                        FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
                        Generation,
                    ]
                    | Generation,
                    stop_at_node_generation,
                ),
                terminate_on_node_error,
            ),
            join=True,
            _debug_max_wait_time=_debug_max_wait_time,
        )

        _current_flow = None



[docs]
    @log_async
    async def _node_resolve_loop(
        self,
        stop_at_node_generation: (
            dict[
                FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
                Generation,
            ]
            | Generation
        ),
        terminate_on_node_error: bool,
    ):
        """
        Main resolution loop for the flow.

        This function implements the core algorithm for resolving node dependencies
        and executing nodes in the correct order. It:

        1. Picks an initial node
        2. For each node in the resolution queue:
            a. Finds the set of nodes that must be executed first
            b. Marks those nodes as visited
            c. Resumes their execution
        3. Continues until the resolution queue is empty

        Args:
            stop_at_node_generation: Generation limit for nodes
            terminate_on_node_error: Whether to terminate on node errors
        """
        get_current_flow_instrument().on_flow_start(self)
        self._stop_at_node_generation = stop_at_node_generation

        if not self.unvisited:
            logger.warning("No nodes to run.")

        logger.debug(f"🔍 Initial unvisited list: {self.unvisited}")

        flow = self

        class ResolutionQueueInstrument(EventLoopInstrument):
            def on_queue_get(
                self, queue: AsyncQueue[Any], item: Any, immediate: bool
            ) -> None:
                if queue is flow.resolution_queue:
                    flow._main_loop_has_item = True

        while self.unvisited:
            initial_node = self.unvisited.pop(0)
            logger.debug(f"🔍 Processing unvisited node: {initial_node}, remaining: {self.unvisited}")
            if self.resolution_queue.closed:
                logger.debug(f"🔍 Reopening closed resolution queue for {initial_node}")
                self.resolution_queue = AsyncSetQueue()

            # Manually mark as executing so active_nodes > 0, preventing immediate closure
            # by _handle_command when processing intermediate commands.
            if isinstance(self.node_tasks[initial_node].status, NodeTaskStatus.WaitingForStartNextGeneration):
                self._active_nodes.add(initial_node)
                self.set_node_status(initial_node, NodeTaskStatus.Executing())

            get_current_flow_instrument().on_resolution_queue_put(self, initial_node)
            await self.resolution_queue.put(initial_node)

            # blocks until a node is available or the queue is closed
            with ResolutionQueueInstrument():
                while True:
                    # Clear the flag - we're about to try to get a new item
                    self._main_loop_has_item = False

                    try:
                        current_node = await self.resolution_queue.get()
                    except QueueClosedError:
                        break

                    # The hook already set _main_loop_has_item = True when the item was popped
                    logger.debug(f"Got item {current_node} from queue")

                    get_current_flow_instrument().on_resolution_queue_get(
                        self, current_node
                    )

                    solution_nodes = self._find_node_solution(current_node)
                    get_current_flow_instrument().on_solving_nodes(
                        self, current_node, solution_nodes
                    )

                    for leaf_node in solution_nodes:
                        self._mark_node_as_visited(leaf_node)
                        if leaf_node in self.resolution_queue:
                            logger.debug(f"Leaf node {leaf_node} already in resolution queue, skipping resume")
                            continue
                        
                        # Check status to avoid resuming already queued/running nodes
                        status = self.node_tasks[leaf_node].status
                        if isinstance(status, (NodeTaskStatus.WaitingForStartNextGeneration, NodeTaskStatus.Stalled)):
                            # Node is waiting to run or stalled waiting for data - resume it
                            await _resume_nodes([leaf_node])
                        elif isinstance(status, (NodeTaskStatus.Queued, NodeTaskStatus.Executing)):
                            # Already queued or running, skip
                            logger.debug(f"Skipping resume for {leaf_node} with status {status}")
                        else:
                            # Error or unknown status
                            logger.debug(f"Skipping resume for {leaf_node} with status {status}")

        # self.event_loop.clean_up()
        get_current_flow_instrument().on_flow_end(self)



[docs]
    def _find_node_solution(
        self, node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ) -> list[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]]:
        """
        Find the nodes that are ultimately preventing the given node from running.

        This method is key to Flowno's cycle resolution algorithm. It:
            1. Builds a condensed graph of strongly connected components (SCCs)
            2. Finds the leaf SCCs in this condensed graph
            3. For each leaf SCC, picks a node to force evaluate based on default values

        Args:
            node: The node whose dependencies need to be resolved

        Returns:
            A list of nodes that should be forced to evaluate to unblock the given node

        Raises:
            MissingDefaultError: If a cycle is detected with no default values to break it
        """
        supernode_root = self._condensed_tree(node)

        nodes_to_force_evaluate: list[
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
        ] = []
        for supernode in self._find_leaf_supernodes(supernode_root):
            selected_node = self._pick_node_to_force_evaluate(supernode)
            nodes_to_force_evaluate.append(selected_node)

        return nodes_to_force_evaluate



[docs]
    def _condensed_tree(
        self, head: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
    ) -> SuperNode:
        """
        Build a condensed graph of strongly connected components (SCCs) from stale connections.

        This method implements Tarjan's algorithm to find strongly connected components
        (cycles) in the dependency graph, but only following connections that are "stale"
        (where the input's generation is <= the node's generation).

        Args:
            head: The starting point for building the condensed graph

        Returns:
            A SuperNode representing the root of the condensed graph
        """
        visited: set[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]] = (
            set()
        )
        current_scc_stack: list[
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
        ] = []
        on_stack: set[FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]] = (
            set()
        )
        id_counter = 0
        ids: dict[
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], int
        ] = {}
        low_links: dict[
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], int
        ] = {}
        all_sccs: list[SuperNode] = []
        scc_for_node: dict[
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]], SuperNode
        ] = {}

        def get_subgraph_edges(
            node: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        ) -> Generator[FinalizedInputPort[object], None, None]:
            """
            Return the inputs (edges) from `node` to its upstream dependencies that
            belong in the stale subgraph.

            1) Gather all inputs that are stale according to
               get_inputs_with_le_generation_clipped_to_minimum_run_level().

            2) If the node is stalled, we only yield the single stalled input
               (if and only if it is also stale and not defaulted).

            3) Otherwise, we yield all stale, non-defaulted inputs.
            """
            # 1) Collect all stale inputs
            stale_inputs = (
                node.get_inputs_with_le_generation_clipped_to_minimum_run_level()
            )

            # 2) Check node's status
            match self.node_tasks[node].status:
                case NodeTaskStatus.Stalled(stalling_input):
                    # logger.debug(f"{node} is stalled on input port {stalling_input.port_index}")
                    assert stalling_input.node == node

                    # Grab exactly that one input port:
                    single_port = node._input_ports[stalling_input.port_index]

                    # Only yield it if:
                    #   - it's in the stale set
                    #   - it's not defaulted
                    if single_port in stale_inputs and not self.is_input_defaulted(
                        node, single_port.port_index
                    ):
                        yield single_port

                case _:
                    # 3) Normal case: yield all stale, non-defaulted inputs
                    for port in stale_inputs:
                        if self.is_input_defaulted(node, port.port_index):
                            continue
                        yield port

        def tarjan_dfs(
            v: FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]],
        ):
            """
            Tarjan's algorithm for finding strongly connected components.

            This is a depth-first search that identifies strongly connected
            components (cycles) in the graph.

            Args:
                v: The current node being processed
            """
            nonlocal id_counter

            ids[v] = low_links[v] = id_counter
            id_counter += 1
            current_scc_stack.append(v)
            on_stack.add(v)
            visited.add(v)

            for v_input_ports in get_subgraph_edges(v):
                if v_input_ports.connected_output is None:
                    continue
                dependency: FinalizedNode[
                    Unpack[tuple[object, ...]], tuple[object, ...]
                ] = v_input_ports.connected_output.node
                if dependency not in visited:
                    tarjan_dfs(dependency)
                    low_links[v] = min(low_links[v], low_links[dependency])
                elif dependency in on_stack:
                    low_links[v] = min(low_links[v], ids[dependency])

            if low_links[v] == ids[v]:
                scc_nodes: set[
                    FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]
                ] = set()
                while True:
                    w = current_scc_stack.pop()
                    on_stack.remove(w)
                    scc_nodes.add(w)
                    if w == v:
                        break

                members_dict = {
                    node: [
                        port.port_index
                        for port in get_subgraph_edges(node)
                        if port.connected_output
                        and port.connected_output.node in scc_nodes
                    ]
                    for node in scc_nodes
                }
                super_node = SuperNode(head=v, members=members_dict, dependencies=[])
                for member in scc_nodes:
                    scc_for_node[member] = super_node
                all_sccs.append(super_node)

        tarjan_dfs(head)

        # build the condensed graph
        for super_node in all_sccs:
            for member in super_node.members:
                for port in get_subgraph_edges(member):
                    if not port.connected_output:
                        continue
                    dependency: FinalizedNode[
                        Unpack[tuple[object, ...]], tuple[object, ...]
                    ] = port.connected_output.node
                    if scc_for_node[dependency] != super_node:
                        super_node.dependencies.append(scc_for_node[dependency])
                        scc_for_node[dependency].dependent = super_node

        return scc_for_node[head]



[docs]
    def _find_leaf_supernodes(self, root: SuperNode) -> list[SuperNode]:
        """
        Identify all leaf supernodes in the condensed DAG.
        Leaf supernodes are those with no dependencies.

        Returns:
            list[SuperNode]: A list of all leaf supernodes in the graph.
        """
        final_leaves: list[SuperNode] = []

        def dfs(current: SuperNode):
            if not current.dependencies:
                final_leaves.append(current)
                return
            for dep in current.dependencies:
                dfs(dep)

        dfs(root)
        return final_leaves



[docs]
    def _pick_node_to_force_evaluate(
        self, leaf_supernode: SuperNode
    ) -> "FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]":
        """Pick a node to force evaluate according to the cycle breaking heuristic.

        Args:
            leaf_supernode (SuperNode): The leaf Super-Node of the Condensed subgraph.

        Returns:
            FinalizedNode[Unpack[tuple[object, ...]], tuple[object, ...]]: The node to force evaluate.

        Undefined Behavior:
            If the argument is not a leaf in the condensed graph, the behavior is undefined.
        """
        for node, input_ports in leaf_supernode.members.items():
            if all(
                node.has_default_for_input(input_port) for input_port in input_ports
            ):
                return node
        raise MissingDefaultError(leaf_supernode)


    @override
    def __repr__(self):
        return f"<Flow#{self.counter}>"




[docs]
class FlowEventLoop(EventLoop):
    def __init__(self, flow: Flow):
        super().__init__()
        self.flow = flow


[docs]
    @override
    def _on_task_before_send(
        self, task: RawTask[Command, Any, Any], value: Any
    ) -> None:
        """Set node status to Executing when the task is about to be executed."""
        super()._on_task_before_send(task, value)
        
        # Check if this task corresponds to a node task
        for node, task_and_status in self.flow.node_tasks.items():
            if task_and_status.task is task:
                self.flow.set_node_status(node, NodeTaskStatus.Executing())
                break



[docs]
    @override
    def _on_task_before_throw(
        self, task: RawTask[Command, Any, Any], exception: Exception
    ) -> None:
        """Set node status to Executing when the task is about to receive an exception."""
        super()._on_task_before_throw(task, exception)
        
        # Check if this task corresponds to a node task
        for node, task_and_status in self.flow.node_tasks.items():
            if task_and_status.task is task:
                self.flow.set_node_status(node, NodeTaskStatus.Executing())
                break



[docs]
    @override
    def _handle_command(
        self,
        current_task_packet: TaskHandlePacket[Command, Any, Any, Exception],
        command: Command,
    ) -> bool:
        if super()._handle_command(current_task_packet, command):
            return True

        if isinstance(command, WaitForStartNextGenerationCommand):
            node = command.node
            old_status = self.flow.node_tasks[node].status
            self.flow.set_node_status(node, NodeTaskStatus.WaitingForStartNextGeneration(command.run_level))
            
            if isinstance(old_status, NodeTaskStatus.Executing):
                self.flow._active_nodes.discard(node)
                # Only decrement pending for nodes that were in the resolution loop
                self.flow._pending_node_completions -= 1
                logger.debug(f"Active nodes: {self.flow.active_nodes} (Wait {node}), pending now {self.flow._pending_node_completions}")
            else:
                logger.debug(f"Node {node} yielded WaitForStartNextGenerationCommand but was in status {old_status} (not decrementing pending)")

            # Close the queue if there's no more work:
            # - Queue is empty (no pending items)
            # - No nodes are actively executing
            # - No items being processed by the main loop (pending_node_completions == 0)
            # - Main loop doesn't have an unconsumed item (would indicate a race where
            #   the queue looks empty but main loop is about to process an item)
            if (len(self.flow.resolution_queue) == 0 and
                self.flow.active_nodes == 0 and
                self.flow._pending_node_completions == 0 and
                not self.flow._main_loop_has_item):
                logger.debug("Closing resolution queue (no more work)")
                self.flow.resolution_queue.close_nowait(self)

        elif isinstance(command, TerminateWithExceptionCommand):
            node = command.node
            old_status = self.flow.node_tasks[node].status
            self.flow.set_node_status(node, NodeTaskStatus.Error())
            
            if isinstance(old_status, NodeTaskStatus.Executing):
                self.flow._active_nodes.discard(node)
                logger.debug(f"Active nodes: {self.flow.active_nodes} (Terminate {node})")
            else:
                logger.warning(f"Node {node} terminated but was in status {old_status}")

            # The exception will terminate the flow, no need to close the queue
            raise command.exception

        elif isinstance(command, TerminateReachedLimitCommand):
            raise TerminateLimitReached()

        elif isinstance(command, ResumeNodesCommand):
            nodes = command.nodes
            current_task = current_task_packet[0]

            for node in nodes:
                status = self.flow.node_tasks[node].status

                if isinstance(status, NodeTaskStatus.WaitingForStartNextGeneration):
                    self.flow._active_nodes.add(node)
                    # Track pending completions: increment when resuming a node
                    self.flow._pending_node_completions += 1
                    logger.debug(f"Active nodes: {self.flow.active_nodes} (Resume {node}), pending now {self.flow._pending_node_completions}")
                    self.flow.set_node_status(node, NodeTaskStatus.Queued())
                    self.tasks.append((self.flow.node_tasks[node][0], None, None))
                elif isinstance(status, NodeTaskStatus.Stalled):
                    # Node was stalled waiting for stream data - wake it up
                    # The task is at `yield StreamWaitCommand`, will receive None and loop to re-check
                    self.flow._active_nodes.add(node)
                    # Don't increment _pending_node_completions - the node was never "completed"
                    # when it stalled, so pending is still counted from the original resume
                    logger.debug(f"Active nodes: {self.flow.active_nodes} (Resume stalled {node}), pending still {self.flow._pending_node_completions}")
                    self.flow.set_node_status(node, NodeTaskStatus.Queued())
                    self.tasks.append((self.flow.node_tasks[node][0], None, None))
                elif isinstance(status, NodeTaskStatus.Queued):
                    # Already queued, do nothing
                    logger.debug(f"Node {node} already queued, skipping resume")
                    pass
                else:
                    raise RuntimeError(
                        f"Cannot resume node {node} because it is in status {status}"
                    )
                    # may not actually require a full exception - could just skip resuming

            self.tasks.append((current_task, None, None))

        elif isinstance(command, StreamCheckCommand):
            # Non-blocking check for stream data availability
            # Returns: Some(value), Nothing, or throws StopAsyncIteration
            stream = command.stream
            consumer_node = stream.input.node
            producer_node = stream.output.node
            current_task = current_task_packet[0]

            state_key: StreamStateKey = (
                consumer_node,
                stream.input.port_index,
                producer_node,
                stream.output.port_index,
                stream.run_level,
            )
            state = self.flow._stream_consumer_state[state_key]

            assert stream.run_level == 1, "Only run level 1 streams are supported currently"

            # === 1. COMPUTE GENERATIONS ===
            # Use main_generation (not clip_generation) to get the run-level-0 generation.
            # clip_generation finds "highest gen <= input at target length", which is wrong here.
            # We need "which main generation does this streaming generation belong to?"
            producer_parent = main_generation(producer_node.generation)
            desired_generation = inc_generation(state.last_consumed_generation, 1)
            desired_parent = main_generation(desired_generation)

            # === 2. CHECK FOR STREAM RESET ===
            if cmp_generation(producer_parent, desired_parent) > 0:
                state.last_consumed_generation = None
                # Clear cancellation state for this stream - new generation starts fresh
                self.flow._cancelled_stream_connections.discard(state_key)
                if len(producer_node.generation) == 1:
                    self.tasks.insert(0, (current_task, None, StopAsyncIteration()))
                    return True
                elif len(producer_node.generation) == 2:
                    state.last_consumed_generation = producer_node.generation
                    value = producer_node._data[cast("DataGeneration", producer_node.generation)][0]
                    producer_node._barrier1.countdown_nowait(self)
                    self.tasks.insert(0, (current_task, Some(value), None))
                    return True

            # === 3. CHECK IF DESIRED DATA IS AVAILABLE ===
            if cast("DataGeneration", desired_generation) in producer_node._data:
                state.last_consumed_generation = desired_generation
                value = producer_node._data[cast("DataGeneration", desired_generation)][0]
                producer_node._barrier1.countdown_nowait(self)
                self.tasks.insert(0, (current_task, Some(value), None))
                return True

            # === 4. CHECK IF STREAM IS COMPLETE ===
            completion_marker = cast("DataGeneration", desired_parent)
            if completion_marker in producer_node._data:
                self.tasks.insert(0, (current_task, None, StopAsyncIteration()))
                return True

            # === 5. DATA NOT READY - return Nothing ===
            # Don't stall here - just return Nothing and let the caller decide to wait
            self.tasks.insert(0, (current_task, Nothing(), None))
            return True

        elif isinstance(command, StreamWaitCommand):
            # Stall until the resolver decides to wake this node
            stream = command.stream
            consumer_node = stream.input.node
            producer_node = stream.output.node
            current_task = current_task_packet[0]

            state_key: StreamStateKey = (
                consumer_node,
                stream.input.port_index,
                producer_node,
                stream.output.port_index,
                stream.run_level,
            )

            # Mark consumer as stalled and enqueue producer if needed
            self.flow._stall_stream_consumer(
                consumer_node, producer_node, stream, current_task, state_key, self
            )
            # Note: _stall_stream_consumer does NOT add the task back to the queue
            # The task will be resumed by ResumeNodesCommand when the resolver wakes it
            return True

        elif isinstance(command, StreamCancelCommand):
            # _node = command.node
            producer_node = command.producer_node
            stream = command.stream
            consumer_node = stream.input.node
            current_task = current_task_packet[0]

            self.flow._cancelled_streams[producer_node].add(stream)

            # Track this specific stream connection as cancelled
            # This is more precise than tracking the consumer node globally
            state_key: StreamStateKey = (
                consumer_node,
                stream.input.port_index,
                producer_node,
                stream.output.port_index,
                stream.run_level,
            )
            self.flow._cancelled_stream_connections.add(state_key)

            # Decrement the producer's barrier to unblock it.
            # The producer may be blocked on `await node._barrier1.wait()` waiting
            # for consumers to read. Since this consumer is cancelling instead of
            # reading, we need to decrement the barrier so the producer can proceed
            # to check `_cancelled_streams` and throw StreamCancelled.
            producer_node._barrier1.countdown_nowait(self)

            # Resume the producer node so it can check for cancelled streams
            # and call athrow(StreamCancelled) on its internal generator.
            # This is critical: if we don't resume the producer, the flow may
            # terminate before the producer sees the cancellation.
            #
            # BUT: Don't resume if the producer has already completed this generation
            # (has run_level=0 data). Cancelling after completion is a no-op.
            producer_gen = producer_node.generation
            producer_has_completed = (len(producer_gen) == 1 and
                                      cast("DataGeneration", producer_gen) in producer_node._data)

            if producer_has_completed:
                logger.debug(f"🔒 Producer {producer_node} already completed, not resuming for cancel")
            elif producer_node in self.flow.node_tasks:
                status = self.flow.node_tasks[producer_node].status
                if isinstance(status, NodeTaskStatus.WaitingForStartNextGeneration):
                    # Producer is waiting for the next generation - resume it with cancel intent
                    # The producer will check _cancelled_streams and call athrow
                    producer_task = self.flow.node_tasks[producer_node][0]

                    # Update bookkeeping like ResumeNodesCommand does
                    self.flow._active_nodes.add(producer_node)
                    self.flow._pending_node_completions += 1
                    logger.debug(f"Active nodes: {self.flow.active_nodes} (Cancel-resume {producer_node}), pending now {self.flow._pending_node_completions}")
                    self.flow.set_node_status(producer_node, NodeTaskStatus.Queued())

                    # Add producer to task queue - it will see cancelled_streams and call athrow
                    self.tasks.append((producer_task, None, None))

            # Immediately resume the current task. The order probably doesn't matter here, but
            # I'm worried about nodes in the resolution queue being executed in a surprising order.
            self.tasks.insert(0, (current_task, None, None))

        else:
            return False
        return True