Workflow

Workflow #

An event-driven abstraction used to orchestrate the execution of different components called "steps".

Each step is responsible for handling certain event types and possibly emitting new events. Steps can be "bound" when they are defined as methods of the Workflow class itself, or "unbound" when they are defined as free functions. To define a step, the method or function must be decorated with the @step decorator.

Workflows provide basic validation to catch potential runtime errors as soon as possible. Validation happens once, when the workflow starts, and does not produce much overhead. It can be disabled in any case.

Use an instance of a Workflow class to run a workflow and stream events produced during execution. Workflows can be run step-by-step, by calling the run_step function multiple times until completion.

Source code in workflows/workflow.py

class Workflow(metaclass=WorkflowMeta):
    """
    An event-driven abstraction used to orchestrate the execution of different components called "steps".

    Each step is responsible for handling certain event types and possibly emitting new events. Steps can be "bound"
    when they are defined as methods of the `Workflow` class itself, or "unbound" when they are defined as free
    functions. To define a step, the method or function must be decorated with the `@step` decorator.

    Workflows provide basic validation to catch potential runtime errors as soon as possible. Validation happens once,
    when the workflow starts, and does not produce much overhead. It can be disabled in any case.

    Use an instance of a `Workflow` class to run a workflow and stream events produced during execution. Workflows
    can be run step-by-step, by calling the `run_step` function multiple times until completion.
    """

    def __init__(
        self,
        timeout: float | None = 10.0,
        disable_validation: bool = False,
        verbose: bool = False,
        service_manager: ServiceManager | None = None,
        resource_manager: ResourceManager | None = None,
        num_concurrent_runs: int | None = None,
    ) -> None:
        """
        Create an instance of the workflow.

        Args:
            timeout:
                Number of seconds after the workflow execution will be halted, raising a `WorkflowTimeoutError`
                exception. If set to `None`, the timeout will be disabled.
            disable_validaton:
                Whether or not the workflow should be validated before running. In case the workflow is
                misconfigured, a call to `run` will raise a `WorkflowValidationError` exception explaining the details
                of the problem.
            verbose:
                Whether or not the workflow should print additional informative messages during execution.
            service_manager:
                The instance of the `ServiceManager` used to make nested workflows available to this
                workflow instance. The default value is the best choice unless you're customizing the workflow runtime.
            num_concurrent_runs:
                maximum number of .run() executions occurring simultaneously. If set to `None`, there
                is no limit to this number.

        """
        # Configuration
        self._timeout = timeout
        self._verbose = verbose
        self._disable_validation = disable_validation
        self._num_concurrent_runs = num_concurrent_runs
        self._stop_event_class = self._ensure_stop_event_class()
        self._start_event_class = self._ensure_start_event_class()
        self._sem = (
            asyncio.Semaphore(num_concurrent_runs) if num_concurrent_runs else None
        )
        # Broker machinery
        self._contexts: WeakSet[Context] = WeakSet()
        self._stepwise_context: Context | None = None
        # Services management
        self._service_manager = service_manager or ServiceManager()
        # Resource management
        self._resource_manager = resource_manager or ResourceManager()
        # Instrumentation
        self._dispatcher = dispatcher

    def _ensure_start_event_class(self) -> type[StartEvent]:
        """
        Returns the StartEvent type used in this workflow.

        It works by inspecting the events received by the step methods.
        """
        start_events_found: set[type[StartEvent]] = set()
        for step_func in self._get_steps().values():
            step_config: StepConfig = getattr(step_func, "__step_config")
            for event_type in step_config.accepted_events:
                if issubclass(event_type, StartEvent):
                    start_events_found.add(event_type)

        num_found = len(start_events_found)
        if num_found == 0:
            msg = "At least one Event of type StartEvent must be received by any step."
            raise WorkflowConfigurationError(msg)
        elif num_found > 1:
            msg = f"Only one type of StartEvent is allowed per workflow, found {num_found}: {start_events_found}."
            raise WorkflowConfigurationError(msg)
        else:
            return start_events_found.pop()

    def _ensure_stop_event_class(self) -> type[RunResultT]:
        """
        Returns the StopEvent type used in this workflow.

        It works by inspecting the events returned.
        """
        stop_events_found: set[type[StopEvent]] = set()
        for step_func in self._get_steps().values():
            step_config: StepConfig = getattr(step_func, "__step_config")
            for event_type in step_config.return_types:
                if issubclass(event_type, StopEvent):
                    stop_events_found.add(event_type)

        num_found = len(stop_events_found)
        if num_found == 0:
            msg = "At least one Event of type StopEvent must be returned by any step."
            raise WorkflowConfigurationError(msg)
        elif num_found > 1:
            msg = f"Only one type of StopEvent is allowed per workflow, found {num_found}: {stop_events_found}."
            raise WorkflowConfigurationError(msg)
        else:
            return stop_events_found.pop()

    async def stream_events(self) -> AsyncGenerator[Event, None]:
        """
        Returns an async generator to consume any event that workflow steps decide to stream.

        To be able to use this generator, the usual pattern is to wrap the `run` call in a background task using
        `asyncio.create_task`, then enter a for loop like this:

            wf = StreamingWorkflow()
            r = asyncio.create_task(wf.run())

            async for ev in wf.stream_events():
                print(ev)

            await r
        """
        # In the typical streaming use case, `run()` is not awaited but wrapped in a asyncio.Task. Since we'll be
        # consuming events produced by `run()`, we must give its Task the chance to run before entering the dequeueing
        # loop.
        await asyncio.sleep(0)

        if len(self._contexts) > 1:
            # We can't possibly know from what session we should stream events, raise an error.
            msg = (
                "This workflow has multiple concurrent runs in progress and cannot stream events. "
                "To be able to stream events, make sure you call `run()` on this workflow only once."
            )
            raise WorkflowRuntimeError(msg)

        # Enter the dequeuing loop.
        ctx = next(iter(self._contexts))
        while True:
            ev = await ctx.streaming_queue.get()
            if isinstance(ev, StopEvent):
                break

            yield ev

        # remove context to free up room for the next stream_events call
        self._contexts.remove(ctx)

    @classmethod
    def add_step(cls, func: Callable) -> None:
        """
        Adds a free function as step for this workflow instance.

        It raises an exception if a step with the same name was already added to the workflow.
        """
        step_config: StepConfig | None = getattr(func, "__step_config", None)
        if not step_config:
            msg = f"Step function {func.__name__} is missing the `@step` decorator."
            raise WorkflowValidationError(msg)

        if func.__name__ in {**get_steps_from_class(cls), **cls._step_functions}:
            msg = f"A step {func.__name__} is already part of this workflow, please choose another name."
            raise WorkflowValidationError(msg)

        cls._step_functions[func.__name__] = func

    def add_workflows(self, **workflows: "Workflow") -> None:
        """
        Adds one or more nested workflows to this workflow.

        This method only accepts keyword arguments, and the name of the parameter
        will be used as the name of the workflow.
        """
        for name, wf in workflows.items():
            self._service_manager.add(name, wf)

    def _get_steps(self) -> dict[str, Callable]:
        """Returns all the steps, whether defined as methods or free functions."""
        return {**get_steps_from_instance(self), **self._step_functions}  # type: ignore[attr-defined]

    def _start(
        self,
        stepwise: bool = False,
        ctx: Context | None = None,
        checkpoint_callback: CheckpointCallback | None = None,
    ) -> Tuple[Context, str]:
        """
        sets up the queues and tasks for each declared step.

        This method also launches each step as an async task.
        """
        run_id = str(uuid.uuid4())
        if ctx is None:
            ctx = Context(self, stepwise=stepwise)
            self._contexts.add(ctx)
        else:
            # clean up the context from the previous run
            ctx._tasks = set()
            ctx._retval = None
            ctx._step_events_holding = None
            ctx._cancel_flag.clear()

        for name, step_func in self._get_steps().items():
            if name not in ctx._queues:
                ctx._queues[name] = asyncio.Queue()

            if name not in ctx._step_flags:
                ctx._step_flags[name] = asyncio.Event()

            # At this point, step_func is guaranteed to have the `__step_config` attribute
            step_config: StepConfig = getattr(step_func, "__step_config")

            # Make the system step "_done" accept custom stop events
            if (
                name == "_done"
                and self._stop_event_class not in step_config.accepted_events
            ):
                step_config.accepted_events.append(self._stop_event_class)

            for _ in range(step_config.num_workers):
                ctx.add_step_worker(
                    name=name,
                    step=step_func,
                    config=step_config,
                    stepwise=stepwise,
                    verbose=self._verbose,
                    checkpoint_callback=checkpoint_callback,
                    run_id=run_id,
                    service_manager=self._service_manager,
                    resource_manager=self._resource_manager,
                )

        # add dedicated cancel task
        ctx.add_cancel_worker()

        return ctx, run_id

    def send_event(self, message: Event, step: str | None = None) -> None:
        msg = (
            "Use a Context instance to send events from a step. "
            "Make sure your step method or function takes a parameter of type Context like `ctx: Context` and "
            "replace `self.send_event(...)` with `ctx.send_event(...)` in your code."
        )

        if len(self._contexts) > 1:
            # We can't possibly know to what session we should send this event, raise an error.
            raise WorkflowRuntimeError(msg)

        # Emit a warning as this won't work for multiple run()s.
        warnings.warn(msg)
        ctx = next(iter(self._contexts))
        ctx.send_event(message=message, step=step)

    def _get_start_event_instance(
        self, start_event: StartEvent | None, **kwargs: Any
    ) -> StartEvent:
        if start_event is not None:
            # start_event was used wrong
            if not isinstance(start_event, StartEvent):
                msg = "The 'start_event' argument must be an instance of 'StartEvent'."
                raise ValueError(msg)

            # start_event is ok but point out that additional kwargs will be ignored in this case
            if kwargs:
                msg = (
                    "Keyword arguments are not supported when 'run()' is invoked with the 'start_event' parameter."
                    f" These keyword arguments will be ignored: {kwargs}"
                )
                logger.warning(msg)
            return start_event

        # Old style start event creation, with kwargs used to create an instance of self._start_event_class
        try:
            return self._start_event_class(**kwargs)
        except ValidationError as e:
            ev_name = self._start_event_class.__name__
            msg = f"Failed creating a start event of type '{ev_name}' with the keyword arguments: {kwargs}"
            logger.debug(e)
            raise WorkflowRuntimeError(msg)

    @dispatcher.span
    def run(
        self,
        ctx: Context | None = None,
        stepwise: bool = False,
        checkpoint_callback: CheckpointCallback | None = None,
        start_event: StartEvent | None = None,
        **kwargs: Any,
    ) -> WorkflowHandler:
        """Runs the workflow until completion."""
        # Validate the workflow and determine HITL usage
        uses_hitl = self._validate()
        if uses_hitl and stepwise:
            raise WorkflowRuntimeError(
                "Human-in-the-loop is not supported with stepwise execution"
            )

        # Start the machinery in a new Context or use the provided one
        ctx, run_id = self._start(
            ctx=ctx, stepwise=stepwise, checkpoint_callback=checkpoint_callback
        )

        result = WorkflowHandler(ctx=ctx, run_id=run_id)

        async def _run_workflow() -> None:
            if self._sem:
                await self._sem.acquire()
            try:
                if not ctx.is_running:
                    # Send the first event
                    start_event_instance = self._get_start_event_instance(
                        start_event, **kwargs
                    )
                    ctx.send_event(start_event_instance)

                    # the context is now running
                    ctx.is_running = True

                done, unfinished = await asyncio.wait(
                    ctx._tasks,
                    timeout=self._timeout,
                    return_when=asyncio.FIRST_EXCEPTION,
                )

                we_done = False
                exception_raised = None
                for task in done:
                    e = task.exception()
                    if type(e) is WorkflowDone:
                        we_done = True
                    elif e is not None:
                        exception_raised = e
                        break

                # Cancel any pending tasks
                for t in unfinished:
                    t.cancel()

                # wait for cancelled tasks to cleanup
                # prevents any tasks from being stuck
                try:
                    await asyncio.wait_for(
                        asyncio.gather(*unfinished, return_exceptions=True),
                        timeout=0.5,
                    )
                except asyncio.TimeoutError:
                    logger.warning("Some tasks did not clean up within timeout")

                # the context is no longer running
                ctx.is_running = False

                if exception_raised:
                    # cancel the stream
                    ctx.write_event_to_stream(StopEvent())

                    raise exception_raised

                if not we_done:
                    # cancel the stream
                    ctx.write_event_to_stream(StopEvent())

                    msg = f"Operation timed out after {self._timeout} seconds"
                    raise WorkflowTimeoutError(msg)

                result.set_result(ctx._retval)
            except Exception as e:
                result.set_exception(e)
            finally:
                if self._sem:
                    self._sem.release()
                await ctx.shutdown()

        asyncio.create_task(_run_workflow())
        return result

    @dispatcher.span
    def run_from(
        self,
        checkpoint: Checkpoint,
        ctx_serializer: BaseSerializer | None = None,
        checkpoint_callback: CheckpointCallback | None = None,
        **kwargs: Any,
    ) -> WorkflowHandler:
        """
        Run from a specified Checkpoint.

        The `Context` snapshot contained in the checkpoint is loaded and used
        to execute the `Workflow`.
        """
        # load the `Context` from the checkpoint
        ctx_serializer = ctx_serializer or JsonSerializer()
        ctx = Context.from_dict(self, checkpoint.ctx_state, serializer=ctx_serializer)
        handler: WorkflowHandler = self.run(
            ctx=ctx, checkpoint_callback=checkpoint_callback, **kwargs
        )

        # only kick off the workflow if there are no in-progress events
        # in-progress events are already started in self.run()
        num_in_progress = sum(len(v) for v in ctx._in_progress.values())
        if (
            num_in_progress == 0
            and handler.ctx is not None
            and checkpoint.output_event is not None
        ):
            handler.ctx.send_event(checkpoint.output_event)

        return handler

    def is_done(self) -> bool:
        """Checks if the workflow is done."""
        return self._stepwise_context is None

    @step(num_workers=1)
    async def _done(self, ctx: Context, ev: StopEvent) -> None:
        """Tears down the whole workflow and stop execution."""
        if self._stop_event_class is StopEvent:
            ctx._retval = ev.result
        else:
            ctx._retval = ev

        ctx.write_event_to_stream(ev)

        # Signal we want to stop the workflow. Since we're about to raise, delete
        # the reference to ctx explicitly to avoid it becoming dangling
        del ctx
        raise WorkflowDone

    def _validate(self) -> bool:
        """
        Validate the workflow to ensure it's well-formed.

        Returns True if the workflow uses human-in-the-loop, False otherwise.
        """
        if self._disable_validation:
            return False

        produced_events: set[type] = {self._start_event_class}
        consumed_events: set[type] = set()
        requested_services: set[ServiceDefinition] = set()

        # Collect steps that incorrectly accept StopEvent
        steps_accepting_stop_event: list[str] = []

        for name, step_func in self._get_steps().items():
            step_config: StepConfig | None = getattr(step_func, "__step_config")
            # At this point we know step config is not None, let's make the checker happy
            assert step_config is not None

            # Check that no user-defined step accepts StopEvent (only _done step should)
            if name != "_done":
                for event_type in step_config.accepted_events:
                    if issubclass(event_type, StopEvent):
                        steps_accepting_stop_event.append(name)
                        break

            for event_type in step_config.accepted_events:
                consumed_events.add(event_type)

            for event_type in step_config.return_types:
                if event_type is type(None):
                    # some events may not trigger other events
                    continue

                produced_events.add(event_type)

            requested_services.update(step_config.requested_services)

        # Raise error if any steps incorrectly accept StopEvent
        if steps_accepting_stop_event:
            step_names = "', '".join(steps_accepting_stop_event)
            plural = "" if len(steps_accepting_stop_event) == 1 else "s"
            msg = f"Step{plural} '{step_names}' cannot accept StopEvent. StopEvent signals the end of the workflow. Use a different Event type instead."
            raise WorkflowValidationError(msg)

        # Check if no StopEvent is produced
        stop_ok = False
        for ev in produced_events:
            if issubclass(ev, StopEvent):
                stop_ok = True
                break
        if not stop_ok:
            msg = "No event of type StopEvent is produced."
            raise WorkflowValidationError(msg)

        # Check if all consumed events are produced (except specific built-in events)
        unconsumed_events = consumed_events - produced_events
        unconsumed_events = {
            x
            for x in unconsumed_events
            if not issubclass(x, (InputRequiredEvent, HumanResponseEvent, StopEvent))
        }
        if unconsumed_events:
            names = ", ".join(ev.__name__ for ev in unconsumed_events)
            raise WorkflowValidationError(
                f"The following events are consumed but never produced: {names}"
            )

        # Check if there are any unused produced events (except specific built-in events)
        unused_events = produced_events - consumed_events
        unused_events = {
            x
            for x in unused_events
            if not issubclass(
                x, (InputRequiredEvent, HumanResponseEvent, self._stop_event_class)
            )
        }
        if unused_events:
            names = ", ".join(ev.__name__ for ev in unused_events)
            raise WorkflowValidationError(
                f"The following events are produced but never consumed: {names}"
            )

        # Check all the requested services are available
        required_service_names = {
            sd.name for sd in requested_services if sd.default_value is None
        }
        if required_service_names:
            avail_service_names = set(self._service_manager._services.keys())
            missing = required_service_names - avail_service_names
            if missing:
                msg = f"The following services are not available: {', '.join(str(m) for m in missing)}"
                raise WorkflowValidationError(msg)

        # Check if the workflow uses human-in-the-loop
        return (
            InputRequiredEvent in produced_events
            or HumanResponseEvent in consumed_events
        )

init #

__init__(timeout: float | None = 10.0, disable_validation: bool = False, verbose: bool = False, service_manager: ServiceManager | None = None, resource_manager: ResourceManager | None = None, num_concurrent_runs: int | None = None) -> None

Parameters:

Name	Type	Description	Default
`timeout`	`float \| None`	Number of seconds after the workflow execution will be halted, raising a `WorkflowTimeoutError` exception. If set to `None`, the timeout will be disabled.	`10.0`
`disable_validaton`		Whether or not the workflow should be validated before running. In case the workflow is misconfigured, a call to `run` will raise a `WorkflowValidationError` exception explaining the details of the problem.	required
`verbose`	`bool`	Whether or not the workflow should print additional informative messages during execution.	`False`
`service_manager`	`ServiceManager \| None`	The instance of the `ServiceManager` used to make nested workflows available to this workflow instance. The default value is the best choice unless you're customizing the workflow runtime.	`None`
`num_concurrent_runs`	`int \| None`	maximum number of .run() executions occurring simultaneously. If set to `None`, there is no limit to this number.	`None`

Source code in workflows/workflow.py

def __init__(
    self,
    timeout: float | None = 10.0,
    disable_validation: bool = False,
    verbose: bool = False,
    service_manager: ServiceManager | None = None,
    resource_manager: ResourceManager | None = None,
    num_concurrent_runs: int | None = None,
) -> None:
    """
    Create an instance of the workflow.

    Args:
        timeout:
            Number of seconds after the workflow execution will be halted, raising a `WorkflowTimeoutError`
            exception. If set to `None`, the timeout will be disabled.
        disable_validaton:
            Whether or not the workflow should be validated before running. In case the workflow is
            misconfigured, a call to `run` will raise a `WorkflowValidationError` exception explaining the details
            of the problem.
        verbose:
            Whether or not the workflow should print additional informative messages during execution.
        service_manager:
            The instance of the `ServiceManager` used to make nested workflows available to this
            workflow instance. The default value is the best choice unless you're customizing the workflow runtime.
        num_concurrent_runs:
            maximum number of .run() executions occurring simultaneously. If set to `None`, there
            is no limit to this number.

    """
    # Configuration
    self._timeout = timeout
    self._verbose = verbose
    self._disable_validation = disable_validation
    self._num_concurrent_runs = num_concurrent_runs
    self._stop_event_class = self._ensure_stop_event_class()
    self._start_event_class = self._ensure_start_event_class()
    self._sem = (
        asyncio.Semaphore(num_concurrent_runs) if num_concurrent_runs else None
    )
    # Broker machinery
    self._contexts: WeakSet[Context] = WeakSet()
    self._stepwise_context: Context | None = None
    # Services management
    self._service_manager = service_manager or ServiceManager()
    # Resource management
    self._resource_manager = resource_manager or ResourceManager()
    # Instrumentation
    self._dispatcher = dispatcher

stream_events `async` #

stream_events() -> AsyncGenerator[Event, None]

Returns an async generator to consume any event that workflow steps decide to stream.

To be able to use this generator, the usual pattern is to wrap the run call in a background task using asyncio.create_task, then enter a for loop like this:

wf = StreamingWorkflow()
r = asyncio.create_task(wf.run())

async for ev in wf.stream_events():
    print(ev)

await r

Source code in workflows/workflow.py

async def stream_events(self) -> AsyncGenerator[Event, None]:
    """
    Returns an async generator to consume any event that workflow steps decide to stream.

    To be able to use this generator, the usual pattern is to wrap the `run` call in a background task using
    `asyncio.create_task`, then enter a for loop like this:

        wf = StreamingWorkflow()
        r = asyncio.create_task(wf.run())

        async for ev in wf.stream_events():
            print(ev)

        await r
    """
    # In the typical streaming use case, `run()` is not awaited but wrapped in a asyncio.Task. Since we'll be
    # consuming events produced by `run()`, we must give its Task the chance to run before entering the dequeueing
    # loop.
    await asyncio.sleep(0)

    if len(self._contexts) > 1:
        # We can't possibly know from what session we should stream events, raise an error.
        msg = (
            "This workflow has multiple concurrent runs in progress and cannot stream events. "
            "To be able to stream events, make sure you call `run()` on this workflow only once."
        )
        raise WorkflowRuntimeError(msg)

    # Enter the dequeuing loop.
    ctx = next(iter(self._contexts))
    while True:
        ev = await ctx.streaming_queue.get()
        if isinstance(ev, StopEvent):
            break

        yield ev

    # remove context to free up room for the next stream_events call
    self._contexts.remove(ctx)

add_step `classmethod` #

add_step(func: Callable) -> None

Adds a free function as step for this workflow instance.

It raises an exception if a step with the same name was already added to the workflow.

Source code in workflows/workflow.py

@classmethod
def add_step(cls, func: Callable) -> None:
    """
    Adds a free function as step for this workflow instance.

    It raises an exception if a step with the same name was already added to the workflow.
    """
    step_config: StepConfig | None = getattr(func, "__step_config", None)
    if not step_config:
        msg = f"Step function {func.__name__} is missing the `@step` decorator."
        raise WorkflowValidationError(msg)

    if func.__name__ in {**get_steps_from_class(cls), **cls._step_functions}:
        msg = f"A step {func.__name__} is already part of this workflow, please choose another name."
        raise WorkflowValidationError(msg)

    cls._step_functions[func.__name__] = func

add_workflows #

add_workflows(**workflows: 'Workflow') -> None

Adds one or more nested workflows to this workflow.

This method only accepts keyword arguments, and the name of the parameter will be used as the name of the workflow.

Source code in workflows/workflow.py

def add_workflows(self, **workflows: "Workflow") -> None:
    """
    Adds one or more nested workflows to this workflow.

    This method only accepts keyword arguments, and the name of the parameter
    will be used as the name of the workflow.
    """
    for name, wf in workflows.items():
        self._service_manager.add(name, wf)

run #

run(ctx: Context | None = None, stepwise: bool = False, checkpoint_callback: CheckpointCallback | None = None, start_event: StartEvent | None = None, **kwargs: Any) -> WorkflowHandler

Runs the workflow until completion.

Source code in workflows/workflow.py

@dispatcher.span
def run(
    self,
    ctx: Context | None = None,
    stepwise: bool = False,
    checkpoint_callback: CheckpointCallback | None = None,
    start_event: StartEvent | None = None,
    **kwargs: Any,
) -> WorkflowHandler:
    """Runs the workflow until completion."""
    # Validate the workflow and determine HITL usage
    uses_hitl = self._validate()
    if uses_hitl and stepwise:
        raise WorkflowRuntimeError(
            "Human-in-the-loop is not supported with stepwise execution"
        )

    # Start the machinery in a new Context or use the provided one
    ctx, run_id = self._start(
        ctx=ctx, stepwise=stepwise, checkpoint_callback=checkpoint_callback
    )

    result = WorkflowHandler(ctx=ctx, run_id=run_id)

    async def _run_workflow() -> None:
        if self._sem:
            await self._sem.acquire()
        try:
            if not ctx.is_running:
                # Send the first event
                start_event_instance = self._get_start_event_instance(
                    start_event, **kwargs
                )
                ctx.send_event(start_event_instance)

                # the context is now running
                ctx.is_running = True

            done, unfinished = await asyncio.wait(
                ctx._tasks,
                timeout=self._timeout,
                return_when=asyncio.FIRST_EXCEPTION,
            )

            we_done = False
            exception_raised = None
            for task in done:
                e = task.exception()
                if type(e) is WorkflowDone:
                    we_done = True
                elif e is not None:
                    exception_raised = e
                    break

            # Cancel any pending tasks
            for t in unfinished:
                t.cancel()

            # wait for cancelled tasks to cleanup
            # prevents any tasks from being stuck
            try:
                await asyncio.wait_for(
                    asyncio.gather(*unfinished, return_exceptions=True),
                    timeout=0.5,
                )
            except asyncio.TimeoutError:
                logger.warning("Some tasks did not clean up within timeout")

            # the context is no longer running
            ctx.is_running = False

            if exception_raised:
                # cancel the stream
                ctx.write_event_to_stream(StopEvent())

                raise exception_raised

            if not we_done:
                # cancel the stream
                ctx.write_event_to_stream(StopEvent())

                msg = f"Operation timed out after {self._timeout} seconds"
                raise WorkflowTimeoutError(msg)

            result.set_result(ctx._retval)
        except Exception as e:
            result.set_exception(e)
        finally:
            if self._sem:
                self._sem.release()
            await ctx.shutdown()

    asyncio.create_task(_run_workflow())
    return result

run_from #

run_from(checkpoint: Checkpoint, ctx_serializer: BaseSerializer | None = None, checkpoint_callback: CheckpointCallback | None = None, **kwargs: Any) -> WorkflowHandler

Run from a specified Checkpoint.

The Context snapshot contained in the checkpoint is loaded and used to execute the Workflow.

Source code in workflows/workflow.py

@dispatcher.span
def run_from(
    self,
    checkpoint: Checkpoint,
    ctx_serializer: BaseSerializer | None = None,
    checkpoint_callback: CheckpointCallback | None = None,
    **kwargs: Any,
) -> WorkflowHandler:
    """
    Run from a specified Checkpoint.

    The `Context` snapshot contained in the checkpoint is loaded and used
    to execute the `Workflow`.
    """
    # load the `Context` from the checkpoint
    ctx_serializer = ctx_serializer or JsonSerializer()
    ctx = Context.from_dict(self, checkpoint.ctx_state, serializer=ctx_serializer)
    handler: WorkflowHandler = self.run(
        ctx=ctx, checkpoint_callback=checkpoint_callback, **kwargs
    )

    # only kick off the workflow if there are no in-progress events
    # in-progress events are already started in self.run()
    num_in_progress = sum(len(v) for v in ctx._in_progress.values())
    if (
        num_in_progress == 0
        and handler.ctx is not None
        and checkpoint.output_event is not None
    ):
        handler.ctx.send_event(checkpoint.output_event)

    return handler

is_done #

is_done() -> bool

Checks if the workflow is done.

Source code in workflows/workflow.py

def is_done(self) -> bool:
    """Checks if the workflow is done."""
    return self._stepwise_context is None

Workflow

Workflow #

__init__ #

stream_events async #

add_step classmethod #

add_workflows #

run #

run_from #

is_done #

init #

stream_events `async` #

add_step `classmethod` #