Human in the Loop

预览
代码
文档

/**
 * A LangGraph implementation of the human-in-the-loop agent.
 */

import { ChatOpenAI } from "@langchain/openai";
import { SystemMessage } from "@langchain/core/messages";
import { RunnableConfig } from "@langchain/core/runnables";
import {
  Command,
  interrupt,
  Annotation,
  StateGraph,
  END,
  START,
  MemorySaver,
} from "@langchain/langgraph";
import { ClientStateAnnotation } from "@ag-kit/adapter-langgraph";
import { ToolCall } from "@langchain/core/messages/tool";

/**
 * JSON schema of one entry in the `steps` array: an object with a
 * `description` string and a `status` string restricted to "enabled".
 */
const PLAN_STEP_SCHEMA = {
  type: "object",
  properties: {
    description: {
      type: "string",
      description: "The text of the step in imperative form",
    },
    status: {
      type: "string",
      enum: ["enabled"],
      description: "The status of the step, always 'enabled'",
    },
  },
  required: ["description", "status"],
};

/**
 * Function-tool definition for `plan_execution_steps`.
 *
 * The tool takes a single required argument, `steps`, which is an array of
 * objects shaped like {@link PLAN_STEP_SCHEMA}.
 */
const DEFINE_TASK_TOOL = {
  type: "function",
  function: {
    name: "plan_execution_steps",
    description:
      "Make up 10 steps (only a couple of words per step) that are required for a task. The step should be in imperative form (i.e. Dig hole, Open door, ...)",
    parameters: {
      type: "object",
      properties: {
        steps: {
          type: "array",
          items: PLAN_STEP_SCHEMA,
          description:
            "An array of 10 step objects, each containing text and status",
        },
      },
      required: ["steps"],
    },
  },
};

/**
 * State definition for the human-in-the-loop graph.
 *
 * - `steps`: list of `{ description, status }` objects, starting as `[]`.
 * - `user_response`: optional string, starting as `undefined`.
 * - everything contributed by `ClientStateAnnotation.spec`.
 *
 * Both locally declared channels use the same reducer: the incoming value
 * replaces the current one unless the incoming value is `null`/`undefined`,
 * in which case the current value is kept.
 */
export const AgentStateAnnotation = Annotation.Root({
  steps: Annotation<{ description: string; status: string }[]>({
    default: () => [],
    reducer: (current, incoming) => incoming ?? current,
  }),
  user_response: Annotation<string | undefined>({
    default: () => undefined,
    reducer: (current, incoming) => incoming ?? current,
  }),
  ...ClientStateAnnotation.spec,
});

/** Concrete state object type derived from {@link AgentStateAnnotation}. */
export type AgentState = typeof AgentStateAnnotation.State;

/**
 * Entry node of the flow.
 *
 * Forwards the current messages and steps unchanged and routes to
 * `chat_node`. If `state.steps` is missing, an empty list is written instead.
 * The incoming `state` object is not mutated.
 *
 * @param state - Current graph state.
 * @param config - Runnable configuration (unused by this node).
 * @returns A `Command` that jumps to `chat_node` with `messages` and `steps`.
 */
async function startFlow(
  state: AgentState,
  config?: RunnableConfig
): Promise<Command> {
  return new Command({
    goto: "chat_node",
    update: {
      messages: state.messages,
      // Fall back to an empty list without writing to the input state.
      steps: state.steps ?? [],
    },
  });
}

/**
 * Converts the raw `steps` argument of a `plan_execution_steps` tool call
 * into the step list stored in state.
 *
 * Accepted entries are plain strings and non-null objects with a truthy
 * `description`; every accepted entry gets status `"enabled"`. Anything else
 * (including `null` entries or a non-array argument) is ignored.
 */
function normalizePlanSteps(rawSteps: unknown): AgentState["steps"] {
  const steps: AgentState["steps"] = [];
  if (!Array.isArray(rawSteps)) {
    return steps;
  }

  for (const step of rawSteps) {
    if (typeof step === "string") {
      steps.push({ description: step, status: "enabled" });
    } else if (typeof step === "object" && step !== null && step.description) {
      // `typeof null === "object"`, so null must be excluded explicitly.
      steps.push({ description: step.description, status: "enabled" });
    }
  }
  return steps;
}

/**
 * Standard chat node: sends the conversation to the model and, when the model
 * calls `plan_execution_steps`, stores the planned steps and routes to
 * `process_steps_node`.
 *
 * @param state - Current graph state (messages, steps, client tools).
 * @param config - Optional runnable config. It is copied, not mutated; when
 *   omitted, `{ recursionLimit: 25 }` is used as the base.
 * @returns A `Command` that goes to `process_steps_node` with the new steps
 *   and a tool message, or to `END` with the model response appended when no
 *   usable `plan_execution_steps` call was produced.
 */
async function chatNode(
  state: AgentState,
  config?: RunnableConfig
): Promise<Command> {
  const systemPrompt = `
    You are a helpful assistant that can perform any task.
    You MUST call the \`plan_execution_steps\` function when the user asks you to perform a task.
    Always make sure you will provide tasks based on the user query
    `;

  // Define the model
  const model = new ChatOpenAI({
    model: process.env.OPENAI_MODEL || "gpt-4o-mini",
    apiKey: process.env.OPENAI_API_KEY,
    configuration: {
      baseURL: process.env.OPENAI_BASE_URL,
    },
  });

  // Build the model config on a copy so the caller's config object is left
  // untouched. The "predict_state" metadata maps the `steps` argument of the
  // plan_execution_steps tool onto the `steps` state key.
  const modelConfig: RunnableConfig = {
    ...(config ?? { recursionLimit: 25 }),
    metadata: {
      ...config?.metadata,
      predict_state: [
        {
          state_key: "steps",
          tool: "plan_execution_steps",
          tool_argument: "steps",
        },
      ],
    },
  };

  // Bind the client-provided tools plus the planning tool to the model
  const modelWithTools = model.bindTools(
    [...(state.client.tools || []), DEFINE_TASK_TOOL],
    {
      // Disable parallel tool calls to avoid race conditions
      parallel_tool_calls: false,
    }
  );

  // Run the model and generate a response
  const response = await modelWithTools.invoke(
    [new SystemMessage({ content: systemPrompt }), ...state.messages],
    modelConfig
  );

  // Conversation including the model response
  const messages = [...state.messages, response];

  // Prefer the already-parsed tool calls. Only when there are none, fall back
  // to the raw provider payload, skipping entries whose arguments are not
  // valid JSON instead of letting JSON.parse crash the node.
  const toolCalls: ToolCall[] = [...(response.tool_calls ?? [])];
  if (toolCalls.length === 0) {
    for (const rawCall of response.additional_kwargs.tool_calls ?? []) {
      try {
        toolCalls.push({
          name: rawCall.function.name,
          args: JSON.parse(rawCall.function.arguments),
          id: rawCall.id,
          type: "tool_call" as const,
        });
      } catch {
        // Malformed arguments: ignore this raw call.
      }
    }
  }

  // Only the first tool call is considered (parallel calls are disabled).
  const firstCall = toolCalls[0];
  const plannedSteps =
    firstCall?.name === "plan_execution_steps"
      ? normalizePlanSteps(firstCall.args?.steps)
      : [];

  // No tool call, a different tool, or no usable steps: finish this run with
  // the model response appended and the steps unchanged.
  // NOTE(review): when plan_execution_steps was called but yielded no usable
  // steps, no tool message is appended for that call — confirm the next turn
  // tolerates an unanswered tool call.
  if (firstCall === undefined || plannedSteps.length === 0) {
    return new Command({
      goto: END,
      update: {
        messages: messages,
        steps: state.steps,
      },
    });
  }

  // Add a tool response to satisfy OpenAI's requirements
  const toolResponse = {
    role: "tool" as const,
    content: "Task steps generated.",
    tool_call_id: firstCall.id,
  };

  // Move to the process_steps_node which will handle the interrupt and final response
  return new Command({
    goto: "process_steps_node",
    update: {
      messages: [...messages, toolResponse],
      steps: plannedSteps,
    },
  });
}

/**
 * Pauses for the user's decision on the planned steps, then asks the model
 * for a short description of how the task is being performed.
 *
 * If `state.user_response` is already set (truthy) it is used directly;
 * otherwise `interrupt({ steps })` is called and its return value is used.
 * NOTE(review): per the LangGraph interrupt docs the node is expected to
 * re-run from the top on resume, with `interrupt()` returning the resume
 * value — confirm against the installed version.
 *
 * @param state - Current graph state; `steps` is sent as the interrupt payload.
 * @param config - Optional runnable config forwarded to the model call.
 * @returns A `Command` that goes to `END` with the final model response
 *   appended to `messages` and `steps` passed through unchanged.
 */
async function processStepsNode(
  state: AgentState,
  config?: RunnableConfig
): Promise<Command> {
  // Nothing is written to `state` here: only the returned `update` is meant
  // to change graph state, and `user_response` is not part of that update.
  const userResponse: string = state.user_response
    ? state.user_response
    : interrupt({ steps: state.steps });

  // Generate the creative completion response
  const finalPrompt = `
    Provide a textual description of how you are performing the task.
    If the user has disabled a step, you are not allowed to perform that step.
    However, you should find a creative workaround to perform the task, and if an essential step is disabled, you can even use
    some humor in the description of how you are performing the task.
    Don't just repeat a list of steps, come up with a creative but short description (3 sentences max) of how you are performing the task.
    `;

  const finalResponse = await new ChatOpenAI({
    model: process.env.OPENAI_MODEL || "gpt-4o-mini",
    apiKey: process.env.OPENAI_API_KEY,
    configuration: {
      baseURL: process.env.OPENAI_BASE_URL,
    },
  }).invoke(
    [
      new SystemMessage({ content: finalPrompt }),
      { role: "user", content: userResponse },
    ],
    config
  );

  // Return to END with the final response appended to the conversation
  return new Command({
    goto: END,
    update: {
      messages: [...state.messages, finalResponse],
      steps: state.steps,
    },
  });
}

// Define the graph.
// Nodes: start_flow, chat_node, process_steps_node.
// Static edges: START -> start_flow -> chat_node, and process_steps_node -> END.
const workflow = new StateGraph(AgentStateAnnotation)
  .addNode("start_flow", startFlow)
  .addNode("chat_node", chatNode)
  .addNode("process_steps_node", processStepsNode)
  .addEdge(START, "start_flow")
  .addEdge("start_flow", "chat_node")
  .addEdge("process_steps_node", END)
  .addConditionalEdges(
    "chat_node",
    (state: AgentState) => {
      // This router ignores `state` and always returns "continue", which the
      // mapping below resolves to END; it never selects "process_steps_node".
      // NOTE(review): the hop to process_steps_node is presumably driven by the
      // Command `goto` returned from chatNode rather than by this router —
      // confirm that both routing mechanisms are intended to coexist.
      return "continue";
    },
    {
      process_steps_node: "process_steps_node",
      continue: END,
    }
  );

// Compile the graph with a MemorySaver instance as its checkpointer.
// NOTE(review): presumably needed so the interrupt in process_steps_node can be
// paused and resumed — confirm; MemorySaver state likely does not survive a restart.
export const humanInTheLoopGraph = workflow.compile({
  checkpointer: new MemorySaver(),
});

Human in the Loop - LangGraph

本演示展示

本演示展示了 AG-Kit 使用 LangGraph 的 Human in the Loop 功能：

任务规划：Agent 将复杂任务分解为 10 个可执行步骤
工作流中断：LangGraph 通过 interrupt() 暂停工作流，等待人工输入
交互式审批：用户可以在执行前启用/禁用单个步骤
上下文保持：在人工交互期间保持对话上下文
恢复功能：工作流继续执行人工批准的步骤

如何交互

尝试这些建议以触发 Human in the Loop 工作流：

“给我做个三明治”（触发 10 步三明治制作计划）
“送我去火星”（触发复杂的太空任务规划）
“规划一个生日派对”（生成派对规划步骤）

技术实现

后端 (LangGraph)：

plan_execution_steps 工具生成 10 步任务分解
interrupt() 暂停工作流以获取人工输入
AgentStateAnnotation（在 ClientStateAnnotation 基础上扩展）保存步骤列表与对话历史
resume() 继续执行批准的步骤
带有对话历史的状态管理

前端 (React)：

interrupt.renderWithResume 处理中断 UI
Steps 组件提供步骤选择界面
用于步骤启用/禁用的复选框状态管理
恢复 Agent 执行的确认流程

技术流程

用户请求：用户请求复杂任务
任务规划：Agent 调用 plan_execution_steps 工具
工作流中断：LangGraph 使用 interrupt() 中断
人工审查：前端显示交互式步骤选择 UI
审批：用户启用/禁用步骤并确认
恢复：工作流继续执行批准的步骤
执行：Agent 根据用户确认的步骤，生成一段简短的任务执行描述

这展示了 LangGraph 强大的工作流中断和人工审批能力！

AG-Kit TS

LangGraph TS

LangChain TS

LangGraph Py

LlamaIndex TS

Mastra TS

OpenAI Agent SDK TS

Human in the Loop - LangGraph

本演示展示

如何交互

技术实现

技术流程

AG-Kit TS

LangGraph TS

LangChain TS

LangGraph Py

LlamaIndex TS

Mastra TS

OpenAI Agent SDK TS

​Human in the Loop - LangGraph

​本演示展示

​如何交互

​技术实现

​技术流程

Human in the Loop - LangGraph

本演示展示

如何交互

技术实现

技术流程