agent_deply/pam_deploy_graph/interactive.py
dark d01c4d3d06 feat: 完善交互式部署与 MCP/LLM 配置能力
- 新增 MCP client 配置加载,支持 CLI/chat 通过配置文件接入 MCP
- 完善 chat 交互命令,支持参数查看、事件查看、checkpoint 列表与加载
- 增加 LLM action 后诊断能力,支持真实 LLM 和本地规则兜底
- 将 chat 人工确认点接入 LangGraph interrupt/checkpointer
- 更新 README、流程图、待办文档和打包说明
- 补充相关单元测试
2026-06-01 16:45:52 +08:00

593 lines
23 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

"""PAM 部署 Agent 的常驻式交互 CLI 会话。"""
from __future__ import annotations
import time
import json
import shlex
import builtins
from dataclasses import asdict
from pathlib import Path
from typing import Any, Callable
from .agent import PamDeployAgent
from .checkpoint_store import load_agent_state, redact_mapping
from .langgraph_runtime import LangGraphDeploymentRuntime, LangGraphRunResult
from .llm import build_llm_client
from .llm.rule_based import RuleBasedLlmClient
from .mcp_factory import build_mcp_runner_from_config
from .models import AgentState, ExecutionStrategy
InputFunc = Callable[[str], str]
OutputFunc = Callable[[str], None]
COMMAND_HELP = """可用命令:
help 显示帮助
preview 查看当前参数和执行策略
analyze <需求> 只做理解和计划,不执行
params 脱敏展示当前会话参数
events [数量] 查看最近 action 事件,默认 10 条
set KEY=VALUE 修改当前会话参数
llm config KEY=VALUE 配置真实 LLM支持 base_url/api_key/model
llm fallback 切回本地规则 fallback
llm action-analysis on|off 开关 action 后诊断
mcp config <路径> 加载 MCP client JSON 配置
run 创建部署任务并执行
status 查看当前运行状态
approve 确认待处理回滚
reject [原因] 拒绝待处理回滚
resume 从当前 checkpoint 续跑
list checkpoints 列出 checkpoint 目录下的 JSON 文件
load checkpoint <路径> 加载指定 checkpoint
checkpoint 显示 checkpoint 路径
exit 退出
也可以直接输入自然语言需求Agent 会先分析并更新会话参数;执行仍需输入 run。
"""
class InteractiveCliSession:
"""维护一次交互式 CLI 会话的参数、状态和命令处理逻辑。"""
def __init__(
self,
*,
agent: PamDeployAgent,
params: dict[str, Any],
strategy: ExecutionStrategy = "hybrid_node_mcp",
checkpoint_path: str | None = None,
target_ips: list[str] | None = None,
input_func: InputFunc = input,
output_func: OutputFunc = print,
) -> None:
"""初始化会话上下文和输入输出函数。"""
self.agent = agent
self.params = dict(params)
self.strategy = strategy
self.checkpoint_path = checkpoint_path or _default_checkpoint_path()
self.target_ips = list(target_ips or [])
self.input = _build_prompt_input(input_func)
self.output = _build_output_func(output_func)
self.state: AgentState | None = None
self.last_analysis: dict[str, Any] | None = None
self.llm_config: dict[str, str] = {}
self.mcp_config_path: str = ""
self.graph_runtime: LangGraphDeploymentRuntime | None = None
def run(self) -> None:
"""启动 REPL 循环,直到用户 exit 或输入流结束。"""
self.output("PAM 部署 Agent 交互式会话")
self.output("输入 help 查看命令,输入 exit 退出。")
self._load_existing_checkpoint_if_any()
while True:
try:
line = self.input("PAM> ")
except EOFError:
self.output("bye")
return
if not self.handle_line(line):
return
def handle_line(self, line: str) -> bool:
"""处理用户输入的一行命令;返回 False 表示退出会话。"""
text = line.strip()
if not text:
return True
command, _, rest = text.partition(" ")
normalized = command.lower()
if normalized in ("exit", "quit", "q"):
self.output("bye")
return False
if normalized in ("help", "?"):
self.output(COMMAND_HELP.rstrip())
return True
if normalized == "preview":
self.output(self.agent.preview(self.params, self.strategy))
return True
if normalized == "params":
self._show_params()
return True
if normalized == "events":
self._show_events(rest.strip())
return True
if normalized == "analyze":
self._analyze(rest.strip())
return True
if normalized == "set":
self._set_param(rest.strip())
return True
if normalized == "llm":
self._configure_llm(rest.strip())
return True
if normalized == "mcp":
self._configure_mcp(rest.strip())
return True
if normalized in ("run", "deploy", "execute"):
self._run_deploy()
return True
if normalized == "resume":
self._resume()
return True
if normalized == "status":
self._status()
return True
if normalized == "approve":
self._confirm(approved=True, note=rest.strip())
return True
if normalized == "reject":
self._confirm(approved=False, note=rest.strip())
return True
if normalized == "checkpoint":
self.output(f"checkpoint: {self.checkpoint_path}")
return True
if normalized == "list" and rest.strip().lower() == "checkpoints":
self._list_checkpoints()
return True
if normalized == "load" and rest.strip().lower().startswith("checkpoint"):
self._load_checkpoint(rest.strip()[len("checkpoint") :].strip())
return True
self._analyze(text)
return True
def _analyze(self, text: str) -> None:
"""分析自然语言需求,并更新会话中的参数、策略和目标 IP。"""
if not text:
self.output("请输入要分析的自然语言需求例如analyze 请用 MCP 预演部署 HET。")
return
result = self.agent.analyze_request(text, self.params)
self.last_analysis = result
param_result = result["params"]
intent_result = result["intent"]
plan = result["plan"]
self.params = dict(param_result.extracted_params)
self.strategy = _choose_strategy(intent_result.strategy_preference, self.strategy)
user_ips = param_result.extracted_control.get("user_specified_ips")
if isinstance(user_ips, list):
self.target_ips = [str(item) for item in user_ips]
safe_payload = redact_mapping({key: asdict(value) for key, value in result.items()})
self.output("已生成结构化理解:")
self.output(f"- intent: {intent_result.intent}")
self.output(f"- strategy: {self.strategy}")
self.output(f"- summary: {plan.summary}")
if param_result.missing_required_params:
self.output("- missing: " + ", ".join(param_result.missing_required_params))
if self.target_ips:
self.output("- target_ips: " + ", ".join(self.target_ips))
self.output("执行请输 run查看完整 JSON 可用一次性 analyze 命令。")
self.output(_format_redacted_params(safe_payload["params"]["extracted_params"]))
def _set_param(self, assignment: str) -> None:
"""处理 `set KEY=VALUE` 命令,更新当前会话参数。"""
if "=" not in assignment:
self.output("格式set KEY=VALUE")
return
key, value = assignment.split("=", 1)
key = key.strip()
if not key:
self.output("参数名不能为空。")
return
self.params[key] = value.strip()
self.output(f"已设置 {key}")
def _show_params(self) -> None:
"""脱敏展示当前会话参数。"""
self.output(_format_redacted_params(redact_mapping(self.params)))
def _show_events(self, count_text: str) -> None:
"""展示最近若干条事件。"""
if self.state is None or not self.state.events:
self.output("当前没有事件。")
return
try:
count = int(count_text) if count_text else 10
except ValueError:
self.output("格式events [数量]")
return
events = self.state.events[-max(count, 1) :]
self.output(json.dumps(redact_mapping(events), ensure_ascii=False, indent=2, default=str))
def _configure_llm(self, text: str) -> None:
"""热加载 LLM 配置,或开关 action 后诊断。"""
if not text:
self.output("格式llm config base_url=... api_key=... model=... | llm fallback | llm action-analysis on|off")
return
parts = shlex.split(text)
if parts[0] == "fallback":
self.agent.llm_client = RuleBasedLlmClient()
self.llm_config = {}
self.output("已切回本地规则 LLM fallback。")
return
if parts[0] == "action-analysis":
if len(parts) < 2 or parts[1] not in ("on", "off"):
self.output("格式llm action-analysis on|off")
return
self.agent.action_analysis_enabled = parts[1] == "on"
self.output(f"action 后诊断已{'开启' if self.agent.action_analysis_enabled else '关闭'}")
return
if parts[0] != "config":
self.output("未知 llm 命令。")
return
updates = _parse_key_values(parts[1:])
self.llm_config.update(updates)
try:
self.agent.llm_client = build_llm_client(
base_url=self.llm_config.get("base_url"),
api_key=self.llm_config.get("api_key"),
model=self.llm_config.get("model"),
)
except Exception as exc:
self.output(f"LLM 配置失败: {exc}")
return
safe = {**self.llm_config}
if safe.get("api_key"):
safe["api_key"] = "***"
self.output("LLM 配置已加载: " + json.dumps(safe, ensure_ascii=False))
def _configure_mcp(self, text: str) -> None:
"""热加载 MCP client 配置。"""
command, _, path = text.partition(" ")
if command != "config" or not path.strip():
self.output("格式mcp config <mcp_client.json>")
return
path = path.strip().strip('"')
try:
runner = build_mcp_runner_from_config(path)
except Exception as exc:
self.output(f"MCP 配置失败: {exc}")
return
self.agent.mcp_runner = runner
self.agent.router.mcp_runner = runner
self.mcp_config_path = path
self.output(f"MCP 配置已加载: {path}")
def _list_checkpoints(self) -> None:
"""列出当前 checkpoint 目录下的 JSON 文件。"""
checkpoint_dir = Path(self.checkpoint_path).parent
if not checkpoint_dir.exists():
self.output(f"checkpoint 目录不存在: {checkpoint_dir}")
return
files = sorted(checkpoint_dir.glob("*.json"), key=lambda item: item.stat().st_mtime, reverse=True)
if not files:
self.output(f"checkpoint 目录没有 JSON 文件: {checkpoint_dir}")
return
lines = ["checkpoint 列表:"]
for file in files[:20]:
lines.append(f"- {file}")
self.output("\n".join(lines))
def _load_checkpoint(self, path_text: str) -> None:
"""加载指定 checkpoint 文件。"""
if not path_text:
self.output("格式load checkpoint <路径>")
return
checkpoint = Path(path_text)
if not checkpoint.exists():
self.output(f"checkpoint 不存在: {checkpoint}")
return
self.state = load_agent_state(checkpoint)
self.state.checkpoint_path = str(checkpoint)
self.checkpoint_path = str(checkpoint)
self.params = dict(self.state.params)
self.strategy = self.state.execution_strategy
self.target_ips = list(self.state.target_ips)
self.graph_runtime = None
self.output(f"已加载 checkpoint: {checkpoint}")
if self.state.pending_confirmation:
self._print_confirmation()
def _run_deploy(self) -> None:
"""在用户确认后创建状态并执行完整部署流程。"""
if self.state and self.state.pending_confirmation:
self._print_confirmation()
return
if not self._confirm_params_and_scope():
self.output("已取消执行。")
return
if not self._ask_yes_no("即将执行真实 action确认执行请输入 yes: "):
self.output("已取消执行。")
return
self.state = self.agent.create_state(
params=self.params,
execution_strategy=self.strategy,
checkpoint_path=self.checkpoint_path,
target_ips=self.target_ips,
)
self.graph_runtime = None
self._execute_current_state()
def _confirm_params_and_scope(self) -> bool:
"""执行前确认参数和目标 IP 范围。"""
self.output(_format_redacted_params(redact_mapping(self.params)))
if not self._ask_yes_no("确认以上参数请输入 yes: "):
return False
if self.target_ips:
self.output("目标 IP: " + ", ".join(self.target_ips))
else:
self.output("目标 IP: 未指定,将在 get-online-ips 后使用全部在线 IP。")
return self._ask_yes_no("确认目标范围请输入 yes: ")
def _resume(self) -> None:
"""从内存状态或 checkpoint 文件继续执行部署流程。"""
if self.state is None:
checkpoint = Path(self.checkpoint_path)
if not checkpoint.exists():
self.output("当前没有可续跑的 checkpoint。")
return
self.state = load_agent_state(checkpoint)
self.state.checkpoint_path = self.state.checkpoint_path or str(checkpoint)
if self.graph_runtime and self.graph_runtime.waiting_confirmation:
self._print_confirmation()
return
self._execute_current_state()
def _execute_current_state(self) -> None:
"""执行当前 state并输出报告、确认提示和 checkpoint 路径。"""
if self.state is None:
self.output("当前没有运行状态。")
return
try:
if self.graph_runtime is None or not self.graph_runtime.waiting_confirmation:
self.graph_runtime = LangGraphDeploymentRuntime(agent=self.agent)
result = self.graph_runtime.start(self.state)
except RuntimeError as exc:
self.output(f"LangGraph 确认运行器不可用,降级为本地执行: {exc}")
self.graph_runtime = None
self.state = self.agent.run_deploy_flow(self.state)
self._print_state_report_and_checkpoint()
return
self._apply_graph_result(result)
def _apply_graph_result(self, result: LangGraphRunResult) -> None:
"""把 LangGraph 运行结果同步回 chat 会话并输出用户可见状态。"""
if result.state is not None:
self.state = result.state
if self.state is None:
self.output("当前没有运行状态。")
return
self.output(result.report or self.agent.render_report(self.state))
if result.interrupted and result.confirmation:
self._print_confirmation_request(result.confirmation)
elif self.state.pending_confirmation:
self._print_confirmation()
self.output(f"checkpoint: {self.state.checkpoint_path or self.checkpoint_path}")
def _print_state_report_and_checkpoint(self) -> None:
"""输出本地执行路径的状态报告和 checkpoint。"""
if self.state is None:
return
self.output(self.agent.render_report(self.state))
if self.state.pending_confirmation:
self._print_confirmation()
self.output(f"checkpoint: {self.state.checkpoint_path or self.checkpoint_path}")
def _status(self) -> None:
"""输出当前运行状态;没有 state 时输出 checkpoint 路径。"""
if self.state is None:
self.output("当前还没有运行状态。")
self.output(f"checkpoint: {self.checkpoint_path}")
return
self.output(self.agent.render_report(self.state))
if self.state.pending_confirmation:
self._print_confirmation()
def _confirm(self, *, approved: bool, note: str = "") -> None:
"""处理 approve/reject 命令。"""
if self.state is None:
checkpoint = Path(self.checkpoint_path)
if checkpoint.exists():
self.state = load_agent_state(checkpoint)
self.state.checkpoint_path = self.state.checkpoint_path or str(checkpoint)
else:
self.output("当前没有待确认任务。")
return
if not self.state.pending_confirmation:
self.output("当前没有待确认任务。")
return
if self.graph_runtime and self.graph_runtime.waiting_confirmation:
try:
result = self.graph_runtime.resume(approved=approved, note=note)
except RuntimeError as exc:
self.output(f"LangGraph 确认恢复失败,降级为本地确认: {exc}")
else:
self._apply_graph_result(result)
return
self.state = self.agent.confirm_pending(self.state, approved=approved, operator_note=note)
self.output(self.agent.render_report(self.state))
if self.state.pending_confirmation:
self._print_confirmation()
def _print_confirmation(self) -> None:
"""输出当前待人工确认事项。"""
if self.state is None:
return
request = self.agent.build_confirmation_request(self.state)
if not request:
return
self._print_confirmation_request(request)
def _print_confirmation_request(self, request: dict[str, Any]) -> None:
"""输出指定的人工确认请求。"""
self.output("需要人工确认:")
self.output(f"- type: {request.get('type')}")
if request.get("ip"):
self.output(f"- ip: {request['ip']}")
if request.get("failed_stage"):
self.output(f"- failed_stage: {request['failed_stage']}")
if request.get("failure_reason"):
self.output(f"- reason: {request['failure_reason']}")
self.output("输入 approve 执行回滚,或 reject [原因] 拒绝回滚。")
def _ask_yes_no(self, prompt: str) -> bool:
"""读取一次 yes/no 确认,只有 yes/y 视为确认。"""
try:
answer = self.input(prompt).strip().lower()
except EOFError:
return False
return answer in ("yes", "y")
def _load_existing_checkpoint_if_any(self) -> None:
"""会话启动时自动加载已存在的 checkpoint。"""
checkpoint = Path(self.checkpoint_path)
if not checkpoint.exists():
return
self.state = load_agent_state(checkpoint)
self.state.checkpoint_path = self.state.checkpoint_path or str(checkpoint)
self.output(f"已加载 checkpoint: {checkpoint}")
if self.state.pending_confirmation:
self._print_confirmation()
def run_interactive_chat(
*,
agent: PamDeployAgent,
params: dict[str, Any],
strategy: ExecutionStrategy,
checkpoint_path: str | None = None,
target_ips: list[str] | None = None,
input_func: InputFunc = input,
output_func: OutputFunc = print,
) -> InteractiveCliSession:
"""创建并运行交互式 CLI 会话,返回会话对象便于测试。"""
session = InteractiveCliSession(
agent=agent,
params=params,
strategy=strategy,
checkpoint_path=checkpoint_path,
target_ips=target_ips,
input_func=input_func,
output_func=output_func,
)
session.run()
return session
def _default_checkpoint_path() -> str:
"""生成默认 chat checkpoint 路径。"""
return str(Path("runtime") / "checkpoints" / f"chat_{time.strftime('%Y%m%d_%H%M%S')}.json")
def _choose_strategy(preference: str, default: ExecutionStrategy) -> ExecutionStrategy:
"""根据 LLM 偏好更新执行策略,非法值保留默认策略。"""
if preference in ("hybrid_node_mcp", "script_only", "fake"):
return preference # type: ignore[return-value]
return default
def _format_redacted_params(params: dict[str, Any]) -> str:
"""把脱敏后的参数字典格式化为多行文本。"""
lines = ["当前参数:"]
for key in sorted(params):
lines.append(f"- {key}: {params[key]}")
return "\n".join(lines)
def _parse_key_values(parts: list[str]) -> dict[str, str]:
"""解析 KEY=VALUE 参数列表。"""
values: dict[str, str] = {}
for part in parts:
if "=" not in part:
continue
key, value = part.split("=", 1)
if key:
values[key] = value
return values
def _build_prompt_input(input_func: InputFunc) -> InputFunc:
"""如果安装了 prompt_toolkit则启用历史记录和命令补全。"""
if input_func is not builtins.input:
return input_func
try:
from prompt_toolkit import PromptSession
from prompt_toolkit.completion import WordCompleter
from prompt_toolkit.history import FileHistory
except ImportError:
return input_func
commands = [
"help",
"preview",
"analyze",
"params",
"events",
"set",
"llm config",
"llm fallback",
"llm action-analysis on",
"llm action-analysis off",
"mcp config",
"run",
"status",
"approve",
"reject",
"resume",
"list checkpoints",
"load checkpoint",
"checkpoint",
"exit",
]
session = PromptSession(
history=FileHistory(str(Path("runtime") / "chat_history.txt")),
completer=WordCompleter(commands, ignore_case=True, sentence=True),
)
return session.prompt
def _build_output_func(output_func: OutputFunc) -> OutputFunc:
"""如果安装了 rich则使用 rich 输出;否则保持原输出函数。"""
if output_func is not builtins.print:
return output_func
try:
from rich.console import Console
from rich.markdown import Markdown
except ImportError:
return output_func
console = Console()
def rich_print(value: str) -> None:
text = str(value)
stripped = text.lstrip()
if stripped.startswith("{") or stripped.startswith("["):
try:
console.print_json(text)
return
except Exception:
pass
if text.startswith("## ") or "\n| ---" in text:
console.print(Markdown(text))
return
console.print(text)
return rich_print