LlamaIndex 工作流核心组件与实战指南 | 极客日志

Python · AI · 算法

LlamaIndex 工作流核心组件与实战指南

LlamaIndex Workflows 是构建复杂大模型应用的轻量级事件驱动框架。它将应用拆解为独立步骤，通过事件通信，支持并行执行、状态共享及可视化调试。本文介绍 Event、Context 及 step 装饰器等核心组件，涵盖分支循环、流式处理、并发执行及嵌套工作流等高级用法；并结合智能客服实战案例，展示如何利用检查点机制保障长流程稳定性，帮助开发者在灵活性与可控性之间找到平衡，高效编排多智能体协作系统。

DataScient 发布于 2026/4/9 · 更新于 2026/7/20 · 44 浏览

LlamaIndex 工作流核心组件与实战指南

背景与概述

构建大语言模型（LLM）应用时，我们常面临复杂场景：需多次调用模型、查询多数据源、执行分支逻辑或人工介入。传统顺序代码耦合度高、难调试、扩展性差。

LlamaIndex Workflows 是专为解决这些问题设计的轻量级事件驱动框架。2025 年 6 月发布的 1.0 正式版作为独立 Python/TypeScript 包，核心理念是将 AI 应用拆解为独立'步骤'（Step），通过'事件'（Event）通信，由框架调度执行。这种设计带来模块化、易测试、支持并行及内置可视化调试等优势。

LlamaIndex 工作流

核心组件

理解核心概念前，把工作流比作智能工厂：事件是流转的'物料'，步骤是处理物料的'工位'，上下文则是共享的'信息白板'。

定义工作流事件

事件是基本通信单元。所有事件继承自 Event 类，本质是 Pydantic 模型，可携带结构化数据。

from llama_index.core.workflow import Event
from typing import List, Optional

# Simple event that carries a single message.
class MessageEvent(Event):
    """Event with one text field, ``content``."""

    content: str

# Richer event that carries several fields.
class AnalysisEvent(Event):
    """Event with a topic string, a list of keyword strings and a float confidence."""

    topic: str
    keywords: List[str]
    confidence: float

框架提供两个特殊内置事件：

StartEvent：工作流入口，调用 workflow.run() 时参数自动封装成它。
StopEvent：工作流出口，返回它时流程终止，并返回 result 字段。

from llama_index.core.workflow import StartEvent, StopEvent
# StartEvent 可携带任意字段
# StopEvent 需要传入 result 参数

设置工作流类

创建继承自 Workflow 的类，定义各个步骤。

from llama_index.core.workflow import Workflow, step
from llama_index.llms.openai import OpenAI

class MyWorkflow(Workflow):
    """Minimal workflow skeleton; steps are added as ``@step`` methods.

    NOTE(review): the class name and the model string were lost in the
    original snippet; they are reconstructed here from the ``JokeWorkflow``
    example in this file -- confirm against the article source.
    """

    # Class-level attributes, such as a shared LLM client, are declared here.
    llm = OpenAI(model="gpt-4o-mini")

from llama_index.core.workflow import step, StartEvent, StopEvent

class JokeWorkflow(Workflow):
    """Two-step workflow: write a joke about a topic, then analyse it."""

    llm = OpenAI(model="gpt-4o-mini")

    @step
    async def generate_joke(self, ev: StartEvent) -> JokeEvent:
        """Entry point: turn the StartEvent's ``topic`` into a JokeEvent."""
        topic = ev.topic
        completion = await self.llm.acomplete(f"讲一个关于{topic}的笑话")
        joke_text = str(completion)
        return JokeEvent(joke=joke_text)

    @step
    async def critique_joke(self, ev: JokeEvent) -> StopEvent:
        """Exit point: ask the LLM to analyse the joke and stop with its answer."""
        completion = await self.llm.acomplete(f"分析这个笑话的笑点：{ev.joke}")
        critique = str(completion)
        return StopEvent(result=critique)

class ConditionalWorkflow(Workflow):
    """Workflow whose first step either stops early or hands off to the next step."""

    @step
    async def step_one(self, ev: StartEvent) -> StopEvent | NextEvent:
        """Stop immediately when the input is "exit"; otherwise forward the input."""
        if ev.input != "exit":
            return NextEvent(data=ev.input)
        return StopEvent(result="流程提前结束")

pip install llama-index-utils-workflow

from llama_index.utils.workflow import (
    draw_all_possible_flows,
    draw_most_recent_execution,
)

# 1. Render the static flow diagram (derived from code analysis).
draw_all_possible_flows(JokeWorkflow, filename="workflow_structure.html")

# 2. Render the trace of the most recent run (useful for debugging).
# The top-level ``await`` presumes a notebook or another async context.
workflow = JokeWorkflow()
await workflow.run(topic="程序员")
draw_most_recent_execution(workflow, filename="recent_execution.html")

from llama_index.core.workflow import Context

class StatefulWorkflow(Workflow):
    """Shows two steps sharing data through the Context instead of event fields."""

    @step
    async def first_step(self, ctx: Context, ev: StartEvent) -> NextEvent:
        """Store the query and a start timestamp in the context, then emit NextEvent."""
        # Write data into the context.
        await ctx.set("user_query", ev.query)
        await ctx.set("start_time", datetime.now())
        return NextEvent()

    @step
    async def second_step(self, ctx: Context, ev: NextEvent) -> StopEvent:
        """Read the stored values back, print the elapsed time and stop."""
        # Read data from the context; it does not have to travel inside the event.
        query = await ctx.get("user_query")
        start_time = await ctx.get("start_time")
        print(f"处理查询：{query}, 耗时：{datetime.now() - start_time}")
        return StopEvent(result="完成")

class UserProfileEvent(Event):
    """Event carrying a user profile string; emitted by AggregationWorkflow.fetch_profile."""

    profile: str

class RecommendationEvent(Event):
    """Event carrying recommended item names; emitted by AggregationWorkflow.fetch_recommendations."""

    items: List[str]

class AggregationWorkflow(Workflow):
    """Fan-in example: two steps start from the same StartEvent and a third joins them.

    ``fetch_profile`` and ``fetch_recommendations`` both consume the
    StartEvent. ``aggregate`` consumes their output events and finishes once
    it has received one event of each type.
    """

    @step
    async def fetch_profile(self, ctx: Context, ev: StartEvent) -> UserProfileEvent:
        """Simulate a one-second profile lookup and emit the profile."""
        await asyncio.sleep(1)
        return UserProfileEvent(profile="科技爱好者")

    @step
    async def fetch_recommendations(self, ctx: Context, ev: StartEvent) -> RecommendationEvent:
        """Simulate a one-second recommendation lookup and emit the items."""
        await asyncio.sleep(1)
        return RecommendationEvent(items=["GPU", "机械键盘"])

    @step
    async def aggregate(
        self, ctx: Context, ev: UserProfileEvent | RecommendationEvent
    ) -> StopEvent | None:
        """Join the two upstream events into one recommendation message.

        The step must be annotated with the event types it joins; listening on
        StartEvent would never deliver them. Returns ``None`` (no event) until
        both have arrived.
        """
        # collect_events is a synchronous call: it buffers ``ev`` and returns
        # None until one event of every expected type has been received.
        events = ctx.collect_events(ev, [UserProfileEvent, RecommendationEvent])
        if events is None:
            return None
        # The result list follows the order of the expected-types list.
        profile_event, rec_event = events
        result = f"为用户 {profile_event.profile} 推荐 {rec_event.items}"
        return StopEvent(result=result)

class FanOutWorkflow(Workflow):
    """Fan-out example: one step emits several events through ``ctx.send_event``."""

    @step
    async def broadcast(
        self, ctx: Context, ev: StartEvent
    ) -> ProcessEvent | CompletionEvent | None:
        """Send five ProcessEvents followed by one CompletionEvent.

        The events are dispatched with ``ctx.send_event`` rather than returned,
        but they are still listed in the return annotation so the step graph
        (validation and visualization) knows this step produces them.
        """
        for i in range(5):
            ctx.send_event(ProcessEvent(index=i))
        # NOTE(review): CompletionEvent is sent right after the ProcessEvents,
        # so nothing here waits for the ``process`` steps to finish -- confirm
        # this ordering is intended.
        ctx.send_event(CompletionEvent())
        return None

    @step
    async def process(self, ctx: Context, ev: ProcessEvent) -> None:
        """Handle one fanned-out task; emits no follow-up event."""
        print(f"处理任务 {ev.index}")

    @step
    async def on_complete(self, ctx: Context, ev: CompletionEvent) -> StopEvent:
        """Stop the workflow when the completion marker arrives."""
        return StopEvent(result="所有任务完成")

# Human-in-the-loop: run step by step and answer input requests as they stream out.
# ``workflow``, ``HumanInputRequiredEvent``, ``HumanResponseEvent`` and
# ``get_user_input`` are not defined in this snippet.
handler = workflow.run(stepwise=True)
async for event in handler.stream_events():
    if isinstance(event, HumanInputRequiredEvent):
        # Ask the user, feed the answer back into the workflow, then advance one step.
        user_input = await get_user_input(event.question)
        handler.ctx.send_event(HumanResponseEvent(response=user_input))
        await handler.run_step()
# Awaiting the handler yields the final result.
result = await handler

async def debug_workflow():
    """Advance a workflow two steps by hand, printing what each step produced."""
    wf = MyComplexWorkflow()
    stepper = wf.run(stepwise=True)

    # First manual step.
    events = await stepper.run_step()
    print(f"第一步产出的事件：{events}")

    # Second manual step.
    events = await stepper.run_step()
    print(f"第二步产出的事件：{events}")

    # Awaiting the handler yields the final result.
    final_result = await stepper
    print(f"最终结果：{final_result}")

class CheckpointWorkflow(Workflow):
    """Sketch of saving a checkpoint after an expensive step."""

    @step
    async def critical_step(self, ctx: Context, ev: StartEvent) -> NextEvent:
        """Run the critical work, save a named checkpoint, then pass the result on."""
        # NOTE(review): ``do_something`` and ``save_checkpoint`` are not defined
        # in this file -- confirm they exist on the class or its base before use.
        result = await self.do_something()
        await self.save_checkpoint(ctx, "after_critical_step")
        return NextEvent(data=result)

# Run the workflow; on any failure, resume from the last saved checkpoint.
workflow = CheckpointWorkflow()
handler = workflow.run()
try:
    result = await handler
except Exception as e:
    # NOTE(review): ``get_last_checkpoint`` and ``run_from`` are called on the
    # workflow object here, but nothing in this file defines them -- verify
    # against the checkpointing API of the installed version.
    last_checkpoint = workflow.get_last_checkpoint()
    new_handler = workflow.run_from(checkpoint=last_checkpoint)
    result = await new_handler

import { Hono } from "hono";
import { createHonoHandler } from "@llamaindex/workflow-core/interrupter/hono";

// Expose a workflow over HTTP: POST /api/run turns the JSON request body into
// a start event and passes `stopEvent` to the handler factory.
// `myWorkflow`, `startEvent` and `stopEvent` are not defined in this snippet.
const app = new Hono();
app.post("/api/run", createHonoHandler(
    myWorkflow,
    async (ctx) => startEvent(await ctx.req.json()),
    stopEvent
));
// NOTE(review): `serve` is not imported here -- presumably from
// "@hono/node-server"; confirm.
serve(app);

from llama_index.core.workflow import Workflow, step, StartEvent, StopEvent, Event

class Step1Event(Event):
    """Event passed from LinearWorkflow.step_one to step_two; carries a string."""

    data: str

class LinearWorkflow(Workflow):
    """Straight-line workflow: upper-case the input, then wrap it in a result."""

    @step
    async def step_one(self, ev: StartEvent) -> Step1Event:
        """Log the raw input and forward its upper-cased form."""
        print(f"步骤 1 处理：{ev.input}")
        shouted = ev.input.upper()
        return Step1Event(data=shouted)

    @step
    async def step_two(self, ev: Step1Event) -> StopEvent:
        """Log the intermediate value and stop with the final message."""
        print(f"步骤 2 处理：{ev.data}")
        message = f"最终结果：{ev.data}"
        return StopEvent(result=message)

async def main():
    """Run LinearWorkflow once with a fixed input and print the result."""
    workflow = LinearWorkflow()
    outcome = await workflow.run(input="hello world")
    print(outcome)  # prints: 最终结果：HELLO WORLD

class RouteEvent(Event):
    """Event carrying the integer that BranchLoopWorkflow routes on."""

    value: int

class BranchAEvent(Event):
    """Event carrying the result text of the first branch."""

    result: str

class BranchBEvent(Event):
    """Event carrying the result text of the second branch."""

    result: str

class LoopEvent(Event):
    """Event that triggers the retry step; carries an attempt counter."""

    counter: int

class BranchLoopWorkflow(Workflow):
    """Branch-and-loop example: route a number by sign and retry when it is zero.

    Each step's return annotation lists every event type the step can emit,
    so the annotations match what the bodies actually return.
    """

    @step
    async def router(self, ev: StartEvent) -> RouteEvent:
        """Wrap the ``number`` run argument in a RouteEvent."""
        return RouteEvent(value=ev.number)

    @step
    async def handle_positive(
        self, ev: RouteEvent
    ) -> BranchAEvent | BranchBEvent | LoopEvent:
        """Pick a branch by sign: positive -> A, negative -> B, zero -> retry loop."""
        if ev.value > 0:
            return BranchAEvent(result=f"正数：{ev.value}")
        elif ev.value < 0:
            return BranchBEvent(result=f"负数：{ev.value}")
        else:
            return LoopEvent(counter=1)

    @step
    async def retry_zero(self, ev: LoopEvent) -> StartEvent | BranchAEvent:
        """Restart the flow while retries remain; otherwise force branch A."""
        if ev.counter < 3:
            print(f"遇到 0，第{ev.counter}次重试...")
            # NOTE(review): LoopEvent is only ever created with counter=1 and
            # the restart uses number=1, so the fallback below is not reached
            # as written -- confirm whether the counter should be carried over.
            return StartEvent(number=1)
        return BranchAEvent(result="重试次数用尽，强制视为正数")

    @step
    async def finalize(self, ev: BranchAEvent | BranchBEvent) -> StopEvent:
        """Stop with whichever branch result arrived."""
        return StopEvent(result=ev.result)

class StateMaintenanceWorkflow(Workflow):
    """Accumulates messages in the context and stops once five are collected."""

    @step
    async def accumulate(self, ctx: Context, ev: StartEvent) -> StopEvent | None:
        """Append ``ev.message`` to the stored history.

        Returns a StopEvent with the full history once it holds at least five
        messages; otherwise returns ``None`` (no event), which is why ``None``
        is part of the return annotation.
        """
        history = await ctx.get("history", default=[])
        history.append(ev.message)
        await ctx.set("history", history)
        if len(history) >= 5:
            return StopEvent(result=f"收集完毕：{history}")
        return None

class ProgressEvent(Event):
    """Event carrying one progress message string for the event stream."""

    msg: str

class StreamingWorkflow(Workflow):
    """Streams LLM output to the caller as ProgressEvents while it is generated."""

    llm = OpenAI(model="gpt-4o-mini")

    @step
    async def generate(self, ctx: Context, ev: StartEvent) -> StopEvent:
        """Complete ``ev.prompt``, streaming each text delta, and stop with the full text."""
        ctx.write_event_to_stream(ProgressEvent(msg="开始生成..."))

        # astream_complete is a coroutine that resolves to the async generator,
        # so it has to be awaited before it can be iterated.
        stream = await self.llm.astream_complete(ev.prompt)

        pieces = []
        async for chunk in stream:
            delta = chunk.delta
            # A chunk may carry no text delta; skip it so that neither the
            # join below nor ProgressEvent's ``msg: str`` field receives None.
            if not delta:
                continue
            pieces.append(delta)
            ctx.write_event_to_stream(ProgressEvent(msg=delta))

        ctx.write_event_to_stream(ProgressEvent(msg="生成完成!"))
        return StopEvent(result="".join(pieces))

async def main():
    """Run StreamingWorkflow, print progress as it streams, then print the result."""
    workflow = StreamingWorkflow()
    run_handle = workflow.run(prompt="写一首关于 AI 的诗")

    async for ev in run_handle.stream_events():
        # Only progress events are printed; everything else is ignored.
        if not isinstance(ev, ProgressEvent):
            continue
        print(f"进度：{ev.msg}", flush=True)

    final = await run_handle
    print(f"\n\n最终结果:\n{final}")

class ParallelWorkflow(Workflow):
    """Fan-out / fan-in example: dispatch several tasks and gather their results."""

    # Number of tasks dispatched by ``kickoff`` and awaited by ``collector``.
    NUM_TASKS = 3

    @step
    async def kickoff(self, ctx: Context, ev: StartEvent) -> ProcessEvent | None:
        """Dispatch one ProcessEvent per task through the context.

        The events are sent with ``ctx.send_event`` (as elsewhere in this
        file), so the step itself returns ``None``.
        """
        for i in range(self.NUM_TASKS):
            ctx.send_event(ProcessEvent(task_id=i, data=ev.data))
        return None

    @step
    async def worker(self, ev: ProcessEvent) -> ResultEvent:
        """Simulate one second of work for a single task."""
        await asyncio.sleep(1)
        return ResultEvent(task_id=ev.task_id, result=f"任务{ev.task_id}完成")

    @step
    async def collector(self, ctx: Context, ev: ResultEvent) -> StopEvent | None:
        """Accumulate results in the context; stop once every task has reported."""
        results = await ctx.get("results", default=[])
        results.append(ev.result)
        await ctx.set("results", results)
        if len(results) == self.NUM_TASKS:
            return StopEvent(result=f"全部完成：{results}")
        return None

class BaseWorkflow(Workflow):
    """Reusable two-step workflow: strip the input, then return it."""

    @step
    async def common_step(self, ev: StartEvent) -> IntermediateEvent:
        """Forward the input with surrounding whitespace removed."""
        cleaned = ev.input.strip()
        return IntermediateEvent(data=cleaned)

    @step
    async def final_step(self, ev: IntermediateEvent) -> StopEvent:
        """Stop with the intermediate data unchanged."""
        payload = ev.data
        return StopEvent(result=payload)

class CustomWorkflow(BaseWorkflow):
    """BaseWorkflow variant that overrides only the final step."""

    @step
    async def final_step(self, ev: IntermediateEvent) -> StopEvent:
        """Stop with the upper-cased data behind a custom prefix."""
        message = f"自定义结果：{ev.data.upper()}"
        return StopEvent(result=message)

class ReflectionWorkflow(Workflow):
    """Single-step workflow that returns a rewritten form of the query."""

    @step
    async def reflect(self, ev: StartEvent) -> StopEvent:
        """Stop with the query wrapped in the 'improved' template."""
        return StopEvent(result=f"改进后的查询：{ev.query} (经过反思优化)")

class MainWorkflow(Workflow):
    """Outer workflow that delegates query refinement to a nested workflow."""

    @step
    async def start(self, ctx: Context, ev: StartEvent, reflection_wf: Workflow) -> ProcessEvent:
        """Run the injected ``reflection_wf`` on the query and forward its result."""
        refined_query = await reflection_wf.run(query=ev.query)
        return ProcessEvent(query=refined_query)

    @step
    async def process(self, ev: ProcessEvent) -> StopEvent:
        """Stop with the refined query behind the final-processing prefix."""
        summary = f"最终处理：{ev.query}"
        return StopEvent(result=summary)

# Wire a ReflectionWorkflow instance into MainWorkflow under the name
# ``reflection_wf`` (the parameter name used by MainWorkflow.start), then run it.
main = MainWorkflow()
main.add_workflows(reflection_wf=ReflectionWorkflow())
result = await main.run(query="初始查询")
print(result)

from IPython.display import HTML

# Write the flow diagram to an HTML file, then show that file inline.
# NOTE(review): ``display`` is not imported in this snippet -- presumably the
# notebook-provided function; confirm.
draw_all_possible_flows(MyWorkflow, filename="temp.html")
with open("temp.html", "r") as f:
    display(HTML(f.read()))

from llama_index.core.workflow import Workflow, step, StartEvent, StopEvent, Event, Context
from enum import Enum
from datetime import datetime

class QuestionType(Enum):
    """Categories that CustomerServiceWorkflow.classify assigns to a question."""

    AFTER_SALES = "售后"  # chosen when the question mentions 退货 or 维修
    PRE_SALES = "售前"  # chosen when the question mentions 多少钱 or 价格
    COMPLAINT = "投诉"  # fallback for every other question

class ClassifyEvent(Event):
    """Event carrying a question together with its assigned QuestionType."""

    qtype: QuestionType
    question: str

class AfterSalesEvent(Event):
    """Event carrying a question routed to the after-sales flow."""

    question: str

class PreSalesEvent(Event):
    """Event carrying a question routed to the pre-sales flow."""

    question: str

class ComplaintEvent(Event):
    """Event carrying a question routed to the complaint flow."""

    question: str

class CustomerServiceWorkflow(Workflow):
    """Customer-service demo: classify a question, route it, and draft a reply.

    ``classify`` tags the question. The three ``handle_*`` steps all receive
    the ClassifyEvent and each returns ``None`` unless the tag is its own.
    ``generate_response`` turns whichever branch event arrives into the final
    reply. Every step appends a timestamped line to the "logs" list kept in
    the context.
    """

    async def _append_log(self, ctx: Context, message: str) -> list[str]:
        """Append a timestamped ``message`` to the context's "logs" list and return it."""
        logs = await ctx.get("logs", default=[])
        logs.append(f"[{datetime.now()}] {message}")
        await ctx.set("logs", logs)
        return logs

    @step
    async def classify(self, ctx: Context, ev: StartEvent) -> ClassifyEvent:
        """Assign a QuestionType by keyword matching on the lower-cased question."""
        await self._append_log(ctx, f"收到问题：{ev.question}")
        question = ev.question.lower()
        if "退货" in question or "维修" in question:
            qtype = QuestionType.AFTER_SALES
        elif "多少钱" in question or "价格" in question:
            qtype = QuestionType.PRE_SALES
        else:
            # Anything unmatched is treated as a complaint.
            qtype = QuestionType.COMPLAINT
        return ClassifyEvent(qtype=qtype, question=ev.question)

    @step
    async def handle_after_sales(self, ctx: Context, ev: ClassifyEvent) -> AfterSalesEvent | None:
        """Emit an AfterSalesEvent for after-sales questions; ``None`` otherwise."""
        if ev.qtype != QuestionType.AFTER_SALES:
            return None
        await self._append_log(ctx, "进入售后流程")
        return AfterSalesEvent(question=ev.question)

    @step
    async def handle_pre_sales(self, ctx: Context, ev: ClassifyEvent) -> PreSalesEvent | None:
        """Emit a PreSalesEvent for pre-sales questions; ``None`` otherwise."""
        if ev.qtype != QuestionType.PRE_SALES:
            return None
        await self._append_log(ctx, "进入售前流程")
        return PreSalesEvent(question=ev.question)

    @step
    async def handle_complaint(self, ctx: Context, ev: ClassifyEvent) -> ComplaintEvent | None:
        """Emit a ComplaintEvent for complaints; ``None`` otherwise."""
        if ev.qtype != QuestionType.COMPLAINT:
            return None
        await self._append_log(ctx, "进入投诉流程（升级处理）")
        return ComplaintEvent(question=ev.question)

    @step
    async def generate_response(self, ctx: Context, ev: AfterSalesEvent | PreSalesEvent | ComplaintEvent) -> StopEvent:
        """Draft the reply for the branch that fired, print the log, and stop."""
        if isinstance(ev, AfterSalesEvent):
            response = f"【售后】关于「{ev.question}」，请提供订单号，我们将为您安排退货/维修。"
        elif isinstance(ev, PreSalesEvent):
            response = f"【售前】关于「{ev.question}」，我们的产品售价为 299 元，当前有优惠活动。"
        else:
            response = f"【投诉】非常抱歉给您带来不便，关于「{ev.question}」，已转接人工客服，请稍候。"
        logs = await self._append_log(ctx, f"生成回复：{response}")
        # Dump the accumulated processing log before returning the reply.
        print("\n=== 处理日志 ===")
        for log in logs:
            print(log)
        print("===============\n")
        return StopEvent(result=response)

async def test():
    """Run CustomerServiceWorkflow on a sample return request and print the reply."""
    service = CustomerServiceWorkflow()
    result = await service.run(question="我的产品坏了，想退货")
    print(f"最终回复：{result}")