""" E2E:知你客服12号 — 用户话术「在 D:\\aaa\\aiagent\\user_data 下创建 bbbb.md」 并校验:/health 内置工具、落盘路径必须在工作区内(user_data 子路径)、可选 node_results 中的 file_write 痕迹。 用法(在 backend 目录): .\\venv\\Scripts\\python.exe scripts\\e2e_zhini12_bbbb_md.py 环境变量:API_BASE、E2E_AGENT_NAME、E2E_RESTART_CELERY、E2E_LLM_TOOL_CHOICE。 注意:固定 user_data/bbbb.md 与正文/标记常量;不读取 E2E_REL_FILE、E2E_FILE_CONTENT、E2E_MARKER(避免 Shell 残留误测)。 默认 E2E_LLM_TOOL_CHOICE=auto。 """ from __future__ import annotations import json import os import subprocess import sys import time import uuid from pathlib import Path BACKEND_DIR = Path(__file__).resolve().parents[1] REPO_ROOT = BACKEND_DIR.parent USER_DATA_ROOT = (REPO_ROOT / "user_data").resolve() VENV_PY = BACKEND_DIR / "venv" / "Scripts" / "python.exe" API_BASE = os.environ.get("API_BASE", "http://127.0.0.1:8037") AGENT_NAME = os.environ.get("E2E_AGENT_NAME", "知你客服12号") # 固定测 bbbb.md,勿用 E2E_REL_FILE(PowerShell 里常残留 ccc/bbb) REL_PATH = "user_data/bbbb.md" # 固定内容与标记(不用 E2E_FILE_CONTENT / E2E_MARKER 环境变量,避免 PowerShell 残留旧值) FILE_CONTENT = "# bbbb\n\ne2e bbbb permission marker\n" E2E_MARKER = "e2e bbbb permission marker" def _restart_celery() -> None: ps = ( "Get-CimInstance Win32_Process | " "Where-Object { $_.CommandLine -match 'celery_app' } | " "ForEach-Object { Stop-Process -Id $_.ProcessId -Force -ErrorAction SilentlyContinue }" ) subprocess.run( ["powershell", "-NoProfile", "-Command", ps], cwd=str(BACKEND_DIR), capture_output=True, text=True, ) time.sleep(2) if not VENV_PY.is_file(): print("未找到 venv Python,跳过启动 Celery", file=sys.stderr) return kw: dict = {"cwd": str(BACKEND_DIR), "stdout": subprocess.DEVNULL, "stderr": subprocess.STDOUT} if sys.platform == "win32": kw["creationflags"] = subprocess.CREATE_NEW_PROCESS_GROUP # type: ignore[attr-defined] popen_env = os.environ.copy() if os.environ.get("E2E_LLM_TOOL_CHOICE", "auto").strip().lower() not in ( "0", "false", "no", "auto", ): popen_env["LLM_TOOL_CHOICE"] = "required" subprocess.Popen( [ str(VENV_PY), "-m", "celery", "-A", "app.core.celery_app", "worker", "--loglevel=info", "--pool=threads", "--concurrency=8", ], env=popen_env, **kw, ) print("已启动 Celery,等待就绪…") time.sleep(4) def _health_check(client) -> bool: r = client.get(f"{API_BASE.rstrip('/')}/health", timeout=15.0) r.raise_for_status() data = r.json() print("\n--- GET /health ---") print(json.dumps(data, ensure_ascii=False, indent=2)[:2500]) checks = data.get("checks") if not checks: print( "\n[INFO] /health 无 checks 字段(可能 API 未更新);请以 Worker 日志「内置工具就绪」为准。", file=sys.stderr, ) return True ok = checks.get("builtin_tools_ready") and checks.get("file_agent_core_ready") if not ok: print( "\n[WARN] API 进程 builtin_tools 未完全就绪。请同步重启 API 与 Celery。", file=sys.stderr, ) return bool(ok) def _path_allowed(abs_file: Path) -> tuple[bool, str]: """file_write 合法路径:须在仓库根下,且本次要求落在 user_data 下。""" try: f = abs_file.resolve() repo = REPO_ROOT.resolve() except OSError as e: return False, str(e) try: f.relative_to(repo) except ValueError: return False, f"文件不在仓库根内: {f} vs root {repo}" try: f.relative_to(USER_DATA_ROOT) except ValueError: return False, f"文件不在 user_data 下: {f} vs {USER_DATA_ROOT}" return True, "" def _scan_file_write_in_node_results(od: dict) -> None: nr = od.get("node_results") or {} hits = [] for nid, payload in nr.items(): if not isinstance(payload, dict): continue out = payload.get("output") s = json.dumps(out, ensure_ascii=False) if not isinstance(out, str) else out if "file_write" in s and ("success" in s.lower() or "file_path" in s): hits.append((nid, s[:400])) print("\n--- node_results 中含 file_write 线索的节点 ---") if not hits: print("(未扫到明显 JSON;可能结果只在 LLM 正文或日志中)") for nid, frag in hits: print(f" {nid}: {frag}...") def main() -> int: os.chdir(BACKEND_DIR) sys.path.insert(0, str(BACKEND_DIR)) if os.environ.get("E2E_LLM_TOOL_CHOICE", "auto").strip().lower() not in ("0", "false", "no", "auto"): os.environ["LLM_TOOL_CHOICE"] = "required" if os.environ.get("E2E_RESTART_CELERY", "1").strip().lower() not in ("0", "false", "no"): _restart_celery() import httpx from app.core.database import SessionLocal from app.core.security import create_access_token from app.models.agent import Agent from app.models.user import User db = SessionLocal() try: with httpx.Client(timeout=30.0) as hclient: _health_check(hclient) agent = db.query(Agent).filter(Agent.name == AGENT_NAME).first() if not agent: print(f"未找到「{AGENT_NAME}」", file=sys.stderr) return 1 owner = db.query(User).filter(User.id == agent.user_id).first() user = owner or db.query(User).first() if not user: print("无用户", file=sys.stderr) return 1 token = create_access_token(data={"sub": user.id, "username": user.username}) headers = {"Authorization": f"Bearer {token}"} uid = f"bbbb12_{uuid.uuid4().hex[:10]}" abs_win = str((REPO_ROOT / REL_PATH.replace("/", os.sep)).resolve()) _basename = os.path.basename(REL_PATH.replace("\\", "/")) q = ( f"请在 D:\\\\aaa\\\\aiagent\\\\user_data 目录下创建 {_basename}。" f"必须通过工具 file_write 写入:优先使用 相对路径 {REL_PATH}(相对工作区根);" f"content 为 {json.dumps(FILE_CONTENT, ensure_ascii=False)},mode 为 w。" f"file_write 返回的 JSON 必须原样体现在你最终 reply 的可读说明里(含 success 与 file_path)。" f"最后一行仍输出单行 JSON:intent、reply、user_profile。" ) print(f"\nagent={agent.id} ({AGENT_NAME}) user_id={uid}") print(f"目标文件(解析后): {abs_win}") print(f"权限校验: 须位于 {USER_DATA_ROOT}") def poll(client: httpx.Client, eid: str, timeout: float = 300.0) -> dict: t0 = time.time() while time.time() - t0 < timeout: r = client.get(f"/api/v1/executions/{eid}", headers=headers) r.raise_for_status() d = r.json() st = d.get("status") if st == "completed": return d if st == "failed": print("failed:", d.get("error_message"), file=sys.stderr) raise RuntimeError("执行失败") time.sleep(1.5) raise TimeoutError("超时") with httpx.Client(base_url=API_BASE, timeout=300.0) as client: r = client.post( "/api/v1/executions", json={"agent_id": str(agent.id), "input_data": {"query": q, "user_id": uid}}, headers=headers, ) if r.status_code >= 400: print(r.text, file=sys.stderr) r.raise_for_status() eid = r.json()["id"] print(f"\nexecution={eid}") out = poll(client, eid) od = out.get("output_data") or {} result = od.get("result", od) print("\n--- API output_data.result (截断 1500 字符) ---\n") print(str(result)[:1500]) _scan_file_write_in_node_results(od) abs_file = Path(abs_win).resolve() allowed, reason = _path_allowed(abs_file) if not allowed: print(f"\n[FAIL] 路径权限校验: {reason}", file=sys.stderr) return 3 if not abs_file.is_file(): print(f"\n[FAIL] 磁盘未找到: {abs_file}", file=sys.stderr) print("若 completed:可能未触发 file_write;查 Celery「执行工具 file_write」。", file=sys.stderr) return 2 body = abs_file.read_text(encoding="utf-8", errors="replace") print(f"\n[OK] 文件存在且路径合法: {abs_file}\n--- 内容 ---\n{body}\n---") if E2E_MARKER and E2E_MARKER not in body and FILE_CONTENT.strip() and E2E_MARKER in FILE_CONTENT: print(f"[WARN] 未在文件中发现标记「{E2E_MARKER}」", file=sys.stderr) finally: db.close() print("\n[OK] E2E bbbb.md + 路径权限 通过\n完成") return 0 if __name__ == "__main__": raise SystemExit(main())