Files
sanguo_moziplus_v2/tests/test_e2e_v27.py
T
2026-05-20 08:32:01 +08:00

1093 lines
41 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
"""v2.7 端到端测试 — 全链路真实环境
覆盖:项目管理 → Task CRUD → SubTask → Stage进度 → 状态聚合 → 依赖链 → 超时 → Mail → 真实Agent调度
"""
import asyncio
import json
import os
import sys
import time
import uuid
from datetime import datetime
from pathlib import Path
from typing import Any, Dict, List, Optional
import pytest
from fastapi.testclient import TestClient
# 指向部署目录
DEPLOY_DIR = Path.home() / ".sanguo_projects" / "sanguo_moziplus_v2"
sys.path.insert(0, str(DEPLOY_DIR))
from src.main import app
from src.blackboard.db import init_db, get_connection, VALID_TRANSITIONS, VALID_STATUSES
from src.blackboard.models import Task
from src.blackboard.operations import Blackboard
from src.blackboard.queries import Queries
from src.blackboard.registry import ProjectRegistry
from src.daemon.ticker import Ticker
from src.utils import get_data_root
# ── Fixtures ──
@pytest.fixture(scope="module")
def client():
return TestClient(app)
@pytest.fixture(scope="module")
def data_root():
return get_data_root()
def _pid() -> str:
"""生成唯一测试项目ID"""
return f"e2e-v27-{uuid.uuid4().hex[:8]}"
def _tid() -> str:
"""生成唯一任务ID"""
return f"e2e-task-{uuid.uuid4().hex[:8]}"
# ===================================================================
# E1: 项目管理
# ===================================================================
class TestE1ProjectManagement:
"""E1: 项目创建、列表、归档"""
def test_e11_create_and_get_project(self, client):
pid = _pid()
resp = client.post("/api/projects", json={
"id": pid,
"name": f"E2E测试-{pid}",
"description": "自动测试项目",
})
assert resp.status_code == 200
data = resp.json()
assert data.get("project_id") == pid or data.get("id") == pid
# 获取
resp = client.get(f"/api/projects/{pid}")
assert resp.status_code == 200
assert resp.json().get("id") == pid
def test_e12_list_projects(self, client):
resp = client.get("/api/projects")
assert resp.status_code == 200
data = resp.json()
assert "projects" in data
assert isinstance(data["projects"], dict)
def test_e13_archive_project(self, client):
pid = _pid()
client.post("/api/projects", json={"id": pid, "name": f"Archive-{pid}"})
resp = client.post(f"/api/projects/{pid}/archive")
assert resp.status_code == 200
# 验证状态
resp = client.get(f"/api/projects/{pid}")
assert resp.json()["status"] == "archived"
def test_e14_create_project_auto_discover(self, data_root):
"""创建含 blackboard.db 的目录,验证自动发现"""
pid = _pid()
project_dir = data_root / pid
project_dir.mkdir(parents=True, exist_ok=True)
init_db(project_dir / "blackboard.db")
# 注册
registry = ProjectRegistry(data_root)
registry.create_project(pid, f"Discover-{pid}", source="auto_discovered")
projects = registry.list_projects()
assert pid in projects
# 清理
import shutil
shutil.rmtree(project_dir, ignore_errors=True)
# ===================================================================
# E2: Task CRUD + 状态机
# ===================================================================
class TestE2TaskCRUD:
"""E2: Task 创建、查询、状态转换"""
@pytest.fixture(autouse=True)
def setup_project(self, client):
self.pid = _pid()
client.post("/api/projects", json={
"id": self.pid, "name": f"E2-{self.pid}",
})
def test_e21_create_task(self, client):
tid = _tid()
resp = client.post(f"/api/projects/{self.pid}/tasks", json={
"id": tid,
"title": "测试任务",
"description": "E2E测试",
"status": "pending",
})
assert resp.status_code == 200
assert resp.json().get("task_id") == tid or resp.json().get("id") == tid
self._tid = tid
def test_e22_get_task_expand(self, client):
tid = _tid()
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": tid, "title": "Expand测试", "status": "pending",
})
resp = client.get(f"/api/projects/{self.pid}/tasks/{tid}?expand=all")
assert resp.status_code == 200
data = resp.json()
assert data.get("id") == tid
assert "comments" in data or "outputs" in data
def test_e23_valid_transitions(self, client):
"""pending → claimed → working → review → done"""
tid = _tid()
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": tid, "title": "状态机测试", "status": "pending",
})
transitions = [
("claimed", {"agent": "zhangfei-dev"}),
("working", {"agent": "zhangfei-dev"}),
("review", {"agent": "zhangfei-dev"}),
("done", {"agent": "zhangfei-dev"}),
]
for new_status, body in transitions:
resp = client.post(
f"/api/projects/{self.pid}/tasks/{tid}/status",
json={"status": new_status, **body},
)
assert resp.status_code == 200, f"Failed at → {new_status}: {resp.text}"
def test_e24_invalid_transition_rejected(self, client):
"""pending → done 应被拒绝"""
tid = _tid()
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": tid, "title": "非法转换", "status": "pending",
})
resp = client.post(
f"/api/projects/{self.pid}/tasks/{tid}/status",
json={"status": "done", "agent": "test"},
)
assert resp.status_code == 409
assert "invalid_transition" in resp.text or "Cannot transition" in resp.text
def test_e25_list_tasks_filter(self, client):
"""按状态筛选"""
for st in ["pending", "pending"]:
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": _tid(), "title": "Filter", "status": st,
})
resp = client.get(f"/api/projects/{self.pid}/tasks?status=pending")
assert resp.status_code == 200
tasks = resp.json().get("tasks", resp.json())
assert len(tasks) >= 2
# ===================================================================
# E3: SubTask 父子关系
# ===================================================================
class TestE3SubTask:
"""E3: 父子 Task 关系"""
@pytest.fixture(autouse=True)
def setup(self, client):
self.pid = _pid()
client.post("/api/projects", json={
"id": self.pid, "name": f"E3-{self.pid}",
})
self.parent_id = "e3-parent-001"
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": self.parent_id,
"title": "父任务",
"status": "pending",
"stages_json": json.dumps([{"id": "setup", "label": "Setup"}, {"id": "run", "label": "Run"}, {"id": "verify", "label": "Verify"}]),
})
# 创建 3 个子 Task
self.child_ids = []
for i, stage in enumerate(["setup", "run", "verify"]):
cid = f"e3-child-{i}"
self.child_ids.append(cid)
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": cid,
"title": f"子任务-{stage}",
"status": "pending",
"parent_task": self.parent_id,
"stage": stage,
})
def test_e31_list_subtasks(self, client):
resp = client.get(f"/api/projects/{self.pid}/tasks?parent_task={self.parent_id}")
assert resp.status_code == 200
tasks = resp.json().get("tasks", resp.json())
assert len(tasks) == 3
ids = {t["id"] for t in tasks}
assert set(self.child_ids) == ids
def test_e32_top_level_excludes_children(self, data_root):
db_path = data_root / self.pid / "blackboard.db"
q = Queries(db_path)
top = q.top_level_tasks()
top_ids = {t.id for t in top}
assert self.parent_id in top_ids
for cid in self.child_ids:
assert cid not in top_ids
def test_e33_child_stage_field(self, data_root):
db_path = data_root / self.pid / "blackboard.db"
bb = Blackboard(db_path)
for i, stage in enumerate(["setup", "run", "verify"]):
t = bb.get_task(f"e3-child-{i}")
assert t is not None
assert t.stage == stage
# ===================================================================
# E4: Stage 进度
# ===================================================================
class TestE4StageProgress:
"""E4: stages_json + stage 分组统计"""
@pytest.fixture(autouse=True)
def setup(self, client):
self.pid = _pid()
client.post("/api/projects", json={
"id": self.pid, "name": f"E4-{self.pid}",
})
self.parent_id = "e4-parent-001"
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": self.parent_id,
"title": "Stage父任务",
"status": "pending",
"stages_json": json.dumps([{"id": "data", "label": "Data"}, {"id": "code", "label": "Code"}, {"id": "test", "label": "Test"}]),
})
# 每个stage一个子任务
for i, stage in enumerate(["data", "code", "test"]):
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": f"e4-child-{i}",
"title": f"Stage-{stage}",
"status": "pending",
"parent_task": self.parent_id,
"stage": stage,
})
def test_e41_progress_endpoint(self, client):
resp = client.get(f"/api/projects/{self.pid}/tasks/{self.parent_id}/progress")
assert resp.status_code == 200
data = resp.json()
assert "stages" in data
assert len(data["stages"]) == 3
def test_e42_progress_counts(self, data_root):
"""把 data stage 标记 done,验证进度"""
db_path = data_root / self.pid / "blackboard.db"
bb = Blackboard(db_path)
# data child → done
bb.update_task_status("e4-child-0", "claimed", agent="test")
bb.update_task_status("e4-child-0", "working", agent="test")
bb.update_task_status("e4-child-0", "review", agent="test")
bb.update_task_status("e4-child-0", "done", agent="test")
q = Queries(db_path)
progress = q.parent_task_progress(self.parent_id)
stages = {s["id"]: s for s in progress["stages"]}
assert stages["data"]["total"] == 1
assert stages["data"]["done"] == 1
assert stages["code"]["total"] == 1
assert stages["code"]["done"] == 0
def test_e43_empty_stages_progress(self, client):
"""无 stages_json 的 Task 进度"""
tid = _tid()
client.post(f"/api/projects/{self.pid}/tasks", json={
"id": tid, "title": "无Stage", "status": "pending",
})
db_path = get_data_root() / self.pid / "blackboard.db"
q = Queries(db_path)
progress = q.parent_task_progress(tid)
# 无子任务,应返回空或基本结构
assert progress is not None
# ===================================================================
# E5: 父 Task 状态聚合
# ===================================================================
class TestE5ParentAggregation:
"""E5: compute_parent_status 聚合逻辑"""
@pytest.fixture(autouse=True)
def setup(self, data_root):
self.pid = _pid()
db_path = data_root / self.pid / "blackboard.db"
db_path.parent.mkdir(parents=True, exist_ok=True)
init_db(db_path)
self.db_path = db_path
self.bb = Blackboard(db_path)
self.q = Queries(db_path)
# 创建父任务
self.parent_id = "e5-parent"
self.bb.create_task(Task(
id=self.parent_id, title="聚合父任务", status="pending",
))
def _create_child(self, cid: str, status: str = "pending", stage: str = None):
self.bb.create_task(Task(
id=cid, title=f"子-{cid}", status="pending",
parent_task=self.parent_id, stage=stage,
))
if status == "pending":
return
# Walk state machine to target status
path_map = {
"claimed": ["claimed"],
"working": ["claimed", "working"],
"review": ["claimed", "working", "review"],
"done": ["claimed", "working", "review", "done"],
"failed": ["claimed", "working", "failed"],
"blocked": ["claimed", "working", "blocked"],
"cancelled": ["cancelled"],
}
for s in path_map.get(status, []):
self.bb.update_task_status(cid, s, agent="test")
def test_e51_all_done_parent_done(self):
self._create_child("c1", "done")
self._create_child("c2", "done")
result = self.q.compute_parent_status(self.parent_id)
assert result == "done"
def test_e52_has_review_parent_review(self):
self._create_child("c3", "done")
self._create_child("c4", "review")
result = self.q.compute_parent_status(self.parent_id)
assert result == "review"
def test_e53_has_working_parent_working(self):
self._create_child("c5", "done")
self._create_child("c6", "working")
result = self.q.compute_parent_status(self.parent_id)
assert result == "working"
def test_e54_all_pending_parent_pending(self):
self._create_child("c7", "pending")
self._create_child("c8", "pending")
result = self.q.compute_parent_status(self.parent_id)
assert result == "pending"
def test_e55_cancelled_excluded(self):
"""cancelled 子 Task 不参与聚合"""
self._create_child("c9", "done")
self._create_child("c10", "cancelled")
# 只有 c9 有效 → done
result = self.q.compute_parent_status(self.parent_id)
assert result == "done"
def test_e56_cancelled_parent_not_overridden(self):
"""cancelled 的父 Task 不被聚合覆盖"""
# 先让所有子任务 done
self._create_child("c11", "done")
# 手动把父任务设为 cancelled
conn = get_connection(self.db_path)
try:
conn.execute("UPDATE tasks SET status='cancelled' WHERE id=?", (self.parent_id,))
conn.commit()
finally:
conn.close()
# _refresh_parent_statuses 应跳过 cancelled 父任务
ticker = Ticker.__new__(Ticker)
ticker._refresh_parent_statuses(self.db_path)
# 验证父任务仍是 cancelled
t = self.bb.get_task(self.parent_id)
assert t.status == "cancelled"
# ===================================================================
# E6: 依赖链
# ===================================================================
class TestE6DependencyChain:
"""E6: depends_on 依赖推进"""
@pytest.fixture(autouse=True)
def setup(self, data_root):
self.pid = _pid()
db_path = data_root / self.pid / "blackboard.db"
db_path.parent.mkdir(parents=True, exist_ok=True)
init_db(db_path)
self.db_path = db_path
self.bb = Blackboard(db_path)
def test_e61_dep_advance(self):
"""A done → B 从 blocked → pending"""
self.bb.create_task(Task(id="dep-a", title="A", status="pending"))
self.bb.create_task(Task(id="dep-b", title="B", status="blocked", depends_on=json.dumps(["dep-a"])))
# 完成 A
for s in ["claimed", "working", "review", "done"]:
self.bb.update_task_status("dep-a", s, agent="test")
# 手动 tick 依赖推进
ticker = Ticker.__new__(Ticker)
advanced = ticker._advance_dependencies(self.db_path)
assert "dep-b" in advanced
t = self.bb.get_task("dep-b")
assert t.status == "pending"
def test_e62_dep_not_done_stays_blocked(self):
"""A 未完成 → B 保持 blocked"""
self.bb.create_task(Task(id="dep-c", title="C", status="pending"))
self.bb.create_task(Task(id="dep-d", title="D", status="blocked", depends_on=json.dumps(["dep-c"])))
ticker = Ticker.__new__(Ticker)
advanced = ticker._advance_dependencies(self.db_path)
assert "dep-d" not in advanced
assert self.bb.get_task("dep-d").status == "blocked"
def test_e63_chain_a_b_c(self):
"""A → B → C 多层依赖"""
self.bb.create_task(Task(id="chain-a", title="A", status="pending"))
self.bb.create_task(Task(id="chain-b", title="B", status="blocked", depends_on=json.dumps(["chain-a"])))
self.bb.create_task(Task(id="chain-c", title="C", status="blocked", depends_on=json.dumps(["chain-b"])))
# 完成 A
for s in ["claimed", "working", "review", "done"]:
self.bb.update_task_status("chain-a", s, agent="test")
ticker = Ticker.__new__(Ticker)
advanced1 = ticker._advance_dependencies(self.db_path)
assert "chain-b" in advanced1
# B 现在 pending,完成 B
for s in ["claimed", "working", "review", "done"]:
self.bb.update_task_status("chain-b", s, agent="test")
advanced2 = ticker._advance_dependencies(self.db_path)
assert "chain-c" in advanced2
# ===================================================================
# E7: 超时回收
# ===================================================================
class TestE7Timeout:
"""E7: claimed/working 超时回收"""
@pytest.fixture(autouse=True)
def setup(self, data_root):
self.pid = _pid()
db_path = data_root / self.pid / "blackboard.db"
db_path.parent.mkdir(parents=True, exist_ok=True)
init_db(db_path)
self.db_path = db_path
self.bb = Blackboard(db_path)
def test_e71_claimed_timeout_to_pending(self):
"""claimed 超过 claim_timeout → pending"""
self.bb.create_task(Task(id="to-001", title="超时测试", status="pending"))
self.bb.update_task_status("to-001", "claimed", agent="test-agent")
# 手动把 claimed_at 设为 10 分钟前
conn = get_connection(self.db_path)
try:
conn.execute(
"UPDATE tasks SET claimed_at=datetime('now','-10 minutes') WHERE id=?",
("to-001",)
)
conn.commit()
finally:
conn.close()
ticker = Ticker.__new__(Ticker)
ticker.claim_timeout_minutes = 5.0
ticker.default_task_timeout_minutes = 30.0
reclaimed = ticker._check_timeouts(self.db_path)
assert "to-001" in reclaimed
assert self.bb.get_task("to-001").status == "pending"
def test_e72_working_timeout_to_failed(self):
"""working 超过 task_timeout → failed"""
self.bb.create_task(Task(id="to-002", title="工作超时", status="pending"))
self.bb.update_task_status("to-002", "claimed", agent="test-agent")
self.bb.update_task_status("to-002", "working", agent="test-agent")
# 手动把 started_at 设为 60 分钟前
conn = get_connection(self.db_path)
try:
conn.execute(
"UPDATE tasks SET started_at=datetime('now','-60 minutes') WHERE id=?",
("to-002",)
)
conn.commit()
finally:
conn.close()
ticker = Ticker.__new__(Ticker)
ticker.claim_timeout_minutes = 5.0
ticker.default_task_timeout_minutes = 30.0
reclaimed = ticker._check_timeouts(self.db_path)
assert "to-002" in reclaimed
assert self.bb.get_task("to-002").status == "failed"
# ===================================================================
# E8: Mail Tab 6 端点
# ===================================================================
class TestE8MailTab:
"""E8: Mail 端到端"""
@pytest.fixture(autouse=True)
def setup(self, client):
self.mail_ids = []
def _send_mail(self, client, **kwargs):
# Fix: 'from' is a Python keyword, callers use 'from_'
if 'from_' in kwargs:
kwargs['from'] = kwargs.pop('from_')
resp = client.post("/api/mail", json=kwargs)
assert resp.status_code == 200
data = resp.json()
assert data["ok"] is True
mid = data["mail_id"]
self.mail_ids.append(mid)
return mid
def test_e81_send_inform_auto_done(self, client):
"""inform 类型自动 done"""
mid = self._send_mail(client,
title="通知测试",
text="这是一条通知",
from_="pangtong-fujunshi",
to="simayi-challenger",
type="inform",
)
resp = client.get(f"/api/mail/{mid}")
data = resp.json()
assert data["status"] == "done"
def test_e82_send_task_assign_pending(self, client):
"""task-assign 类型保持 pending"""
mid = self._send_mail(client,
title="任务分配",
text="请完成此任务",
from_="pangtong-fujunshi",
to="zhangfei-dev",
type="task-assign",
)
resp = client.get(f"/api/mail/{mid}")
data = resp.json()
assert data["status"] == "pending"
def test_e83_list_with_filters(self, client):
"""列表 + 筛选"""
self._send_mail(client,
title="筛选测试1",
text="body",
from_="pangtong-fujunshi",
to="simayi-challenger",
type="text",
)
self._send_mail(client,
title="筛选测试2",
text="body",
from_="zhangfei-dev",
to="simayi-challenger",
type="text",
)
# 按 from 筛选
resp = client.get("/api/mail?from_agent=pangtong-fujunshi")
mails = resp.json()["mails"]
assert any(m["title"] == "筛选测试1" for m in mails)
# 按 to 筛选
resp = client.get("/api/mail?to_agent=simayi-challenger")
mails = resp.json()["mails"]
assert len(mails) >= 2
def test_e84_mail_detail_with_comments(self, client):
"""详情 + 评论"""
mid = self._send_mail(client,
title="详情测试",
text="正文内容",
from_="pangtong-fujunshi",
to="simayi-challenger",
type="text",
)
# 添加评论(通过 blackboard 直接写)
from src.api.mail_routes import _db_path
conn = get_connection(_db_path())
try:
conn.execute(
"INSERT INTO comments (task_id, author, comment_type, body) VALUES (?, ?, ?, ?)",
(mid, "simayi-challenger", "general", "收到,正在处理"),
)
conn.commit()
finally:
conn.close()
resp = client.get(f"/api/mail/{mid}")
data = resp.json()
assert data["title"] == "详情测试"
# 验证评论已写入(通过直接查 DB,绕过 Comment.from_row 的 card_id 兼容问题)
from src.api.mail_routes import _db_path as mail_db
conn = get_connection(mail_db())
try:
row = conn.execute("SELECT COUNT(*) as cnt FROM comments WHERE task_id=?", (mid,)).fetchone()
assert row["cnt"] == 1
finally:
conn.close()
def test_e85_mark_read(self, client):
"""标记已读"""
mid = self._send_mail(client,
title="已读测试",
text="body",
from_="pangtong-fujunshi",
to="simayi-challenger",
type="text",
)
# 确认初始未读
resp = client.get(f"/api/mail/{mid}")
assert resp.json()["is_read"] is False
# 标记已读
resp = client.patch(f"/api/mail/{mid}", json={"is_read": True})
assert resp.status_code == 200
# 验证
resp = client.get(f"/api/mail/{mid}")
assert resp.json()["is_read"] is True
def test_e86_mark_executed(self, client):
"""标记已执行(走完整状态链)"""
mid = self._send_mail(client,
title="执行测试",
text="body",
from_="pangtong-fujunshi",
to="zhangfei-dev",
type="task-assign",
)
# 先走状态链到 review,再标记 executed
from src.api.mail_routes import _db_path as mail_db
bb = Blackboard(mail_db())
for s in ["claimed", "working", "review"]:
bb.update_task_status(mid, s, agent="zhangfei-dev")
resp = client.patch(f"/api/mail/{mid}", json={"mark_executed": True})
assert resp.status_code == 200
resp = client.get(f"/api/mail/{mid}")
data = resp.json()
assert data["is_read"] is True
assert data["status"] == "done"
def test_e87_summary_and_agents(self, client):
"""统计 + Agent 列表"""
self._send_mail(client,
title="统计测试",
text="body",
from_="zhaoyun-data",
to="guanyu-dev",
type="inform",
)
resp = client.get("/api/mail/summary")
data = resp.json()
assert "total" in data
assert "unread" in data
assert data["total"] > 0
resp = client.get("/api/mail/agents/list")
data = resp.json()
assert "agents" in data
assert isinstance(data["agents"], list)
# ===================================================================
# E9: 真实 Agent 调度(生产环境全链路)
# ===================================================================
import requests as http_requests
API_BASE = "http://localhost:8083"
POLL_INTERVAL = 5 # 轮询间隔秒
MAX_WAIT_DISPATCH = 60 # 等待调度超时(2个tick
MAX_WAIT_AGENT = 300 # 等待Agent完成超时
E2E_PREFIX = "e2e-v30-"
def _check_environment():
"""环境前置检查:daemon 运行 + ticker 活跃 + 8083 可达"""
try:
resp = http_requests.get(f"{API_BASE}/api/daemon/status", timeout=5)
data = resp.json()
if data.get("status") != "running" or not data.get("ticker_running"):
pytest.skip(f"Daemon not ready: {data}")
return data
except Exception as e:
pytest.skip(f"Production API not available at {API_BASE}: {e}")
def _cleanup_project(pid: str):
"""清理测试项目"""
try:
http_requests.post(f"{API_BASE}/api/projects/{pid}/archive", timeout=5)
except Exception:
pass
@pytest.mark.integration
@pytest.mark.skipif(not os.environ.get("RUN_INTEGRATION"),
reason="Set RUN_INTEGRATION=1 to run real agent tests")
class TestE9RealAgentDispatch:
"""E9: 真实 Agent 调度测试
通过生产 HTTP API 创建任务,依赖生产 Ticker 自动调度,
真实 Agent spawn 执行,全程不手动推动状态。
需要设置环境变量 RUN_INTEGRATION=1 才会运行。
"""
@pytest.fixture(autouse=True)
def setup_env(self):
_check_environment()
self._projects = []
yield
# teardown: 清理所有测试项目
for pid in self._projects:
_cleanup_project(pid)
def _create_project(self, name_prefix="E9") -> str:
pid = f"{E2E_PREFIX}{uuid.uuid4().hex[:6]}"
resp = http_requests.post(f"{API_BASE}/api/projects", json={
"id": pid,
"name": f"{name_prefix}-{pid}",
"config": {"agents": ["zhangfei-dev"]},
}, timeout=10)
assert resp.status_code == 200, f"Create project failed: {resp.text}"
self._projects.append(pid)
return pid
def _create_task(self, pid, **kwargs) -> str:
tid = kwargs.get("id") or f"e2e-task-{uuid.uuid4().hex[:8]}"
body = {"id": tid, "status": "pending", "priority": 5, **kwargs}
resp = http_requests.post(
f"{API_BASE}/api/projects/{pid}/tasks", json=body, timeout=10
)
assert resp.status_code == 200, f"Create task failed: {resp.text}"
return tid
def _poll_task(self, pid, tid, timeout, terminal_states=None):
"""轮询任务状态直到终态或超时"""
terminal = terminal_states or ("done", "failed", "cancelled")
deadline = time.time() + timeout
last_status = None
while time.time() < deadline:
resp = http_requests.get(
f"{API_BASE}/api/projects/{pid}/tasks/{tid}", timeout=10
)
if resp.status_code == 200:
data = resp.json()
last_status = data.get("status")
if last_status in terminal:
return data
time.sleep(POLL_INTERVAL)
# 超时,返回最后状态
resp = http_requests.get(
f"{API_BASE}/api/projects/{pid}/tasks/{tid}", timeout=10
)
return resp.json() if resp.status_code == 200 else {"status": "unknown"}
def test_e91_simple_task_agent_execute(self):
"""E9-1: 简单任务 → 生产Ticker调度 → 真实Agent执行 → 状态自动流转到终态"""
pid = self._create_project("E9-1")
tid = self._create_task(
pid,
title="E2E简单任务:echo hello",
description=(
"请执行以下操作:\n"
"1. 运行命令 echo hello\n"
"2. 把输出结果写入黑板\n"
"这是E2E自动化测试,完成后请标记done。\n"
"重要:不需要做其他任何事。"
),
assignee="zhangfei-dev",
task_type="coding",
)
print(f"\n🚀 E9-1: 等待调度 + Agent执行 (pid={pid}, tid={tid})")
result = self._poll_task(
pid, tid, timeout=MAX_WAIT_AGENT,
terminal_states=("done", "failed", "cancelled", "blocked"),
)
status = result.get("status")
print(f" 最终状态: {status}")
# 断言1:不能还是 pending(证明被调度了)
assert status != "pending", (
f"Agent未被调度!任务 {tid}{MAX_WAIT_AGENT}s 后仍为 pending。"
f"\n请检查:1) Ticker是否运行 2) Agent是否可spawn 3) pm2 logs sanguo-moziplus-v2"
)
# 断言2:不能是 blockedguardrails 不应拦截普通任务)
assert status != "blocked", f"普通任务被错误拦截: {result}"
# 断言3:成功最好,failed 也记录原因
if status == "failed":
print(f" ⚠️ Agent执行失败,detail: {result}")
else:
print(f" ✅ Agent执行成功")
print(f" 性能: pending → {status}")
def test_e92_review_task_dispatch(self):
"""E9-2: review任务 → 路由到can_review Agent → 真实执行"""
pid = self._create_project("E9-2")
tid = self._create_task(
pid,
title="E2E Review:审查测试",
description=(
"这是一个E2E测试的review任务。\n"
"请简单回复:\"审查通过,E2E测试正常。\"\n"
"然后标记done即可。不需要做其他事。"
),
assignee="simayi-challenger",
task_type="review",
)
print(f"\n🚀 E9-2: 等待review调度 + Agent执行 (pid={pid}, tid={tid})")
result = self._poll_task(
pid, tid, timeout=MAX_WAIT_AGENT,
terminal_states=("done", "failed", "cancelled", "blocked"),
)
status = result.get("status")
print(f" 最终状态: {status}")
assert status != "pending", (
f"Review Agent未被调度!任务 {tid}{MAX_WAIT_AGENT}s 后仍为 pending。"
)
assert status != "blocked", f"Review任务被错误拦截: {result}"
if status == "failed":
print(f" ⚠️ Review Agent执行失败")
else:
print(f" ✅ Review Agent执行成功")
def test_e93_guardrail_block(self):
"""E9-3: 实盘交易任务 → Guardrails拦截 → status=blocked"""
pid = self._create_project("E9-3")
tid = self._create_task(
pid,
title="执行实盘买入SH600000",
description="用真金白银买入浦发银行1000股",
assignee="zhangfei-dev",
task_type="coding",
)
print(f"\n🚀 E9-3: 等待Guardrails拦截 (pid={pid}, tid={tid})")
# Guardrails 在 Ticker dispatch 时检查,需要等一个 tick
result = self._poll_task(
pid, tid, timeout=MAX_WAIT_DISPATCH,
terminal_states=("done", "failed", "cancelled", "blocked", "claimed", "working"),
)
status = result.get("status")
print(f" 最终状态: {status}")
# 实盘任务必须被拦截,不能进入 claimed/working/done
assert status not in ("claimed", "working", "done"), (
f"Guardrails未拦截实盘任务!状态: {status}"
)
print(f" ✅ Guardrails拦截生效,状态: {status}")
# ===================================================================
# E10: 全链路集成(生产环境)
# ===================================================================
@pytest.mark.integration
@pytest.mark.skipif(not os.environ.get("RUN_INTEGRATION"),
reason="Set RUN_INTEGRATION=1 to run real agent tests")
class TestE10FullChain:
"""E10: 项目 → 父子Task → 生产Ticker → 聚合 → 依赖 → Mail → 前端API
全部通过生产 HTTP API,真实 Ticker 推进,真实 Agent 执行。
"""
@pytest.fixture(autouse=True)
def setup_env(self):
_check_environment()
self._projects = []
yield
for pid in self._projects:
_cleanup_project(pid)
def _create_project(self, name_prefix="E10") -> str:
pid = f"{E2E_PREFIX}{uuid.uuid4().hex[:6]}"
resp = http_requests.post(f"{API_BASE}/api/projects", json={
"id": pid,
"name": f"{name_prefix}-{pid}",
"config": {"agents": ["zhangfei-dev", "simayi-challenger"]},
}, timeout=10)
assert resp.status_code == 200
self._projects.append(pid)
return pid
def test_e10a_logic_chain(self):
"""E10a: 父子Task + 依赖推进 + 状态聚合 + Mail(不依赖Agent完成)"""
pid = self._create_project("E10a")
# 1. 创建父任务(带stages
parent_id = f"{pid}-parent"
http_requests.post(f"{API_BASE}/api/projects/{pid}/tasks", json={
"id": parent_id,
"title": "E10a全链路父任务",
"status": "pending",
"stages_json": json.dumps([
{"id": "setup", "label": "Setup"},
{"id": "execute", "label": "Execute"},
{"id": "verify", "label": "Verify"},
]),
}, timeout=10)
# 2. 创建3个子任务
child_ids = []
for i, stage in enumerate(["setup", "execute", "verify"]):
cid = f"{pid}-child-{i}"
child_ids.append(cid)
http_requests.post(f"{API_BASE}/api/projects/{pid}/tasks", json={
"id": cid,
"title": f"子任务-{stage}",
"status": "pending",
"parent_task": parent_id,
"stage": stage,
}, timeout=10)
# 3. 创建依赖任务(blocked
dep_id = f"{pid}-dep"
http_requests.post(f"{API_BASE}/api/projects/{pid}/tasks", json={
"id": dep_id,
"title": "依赖任务",
"depends_on": json.dumps([child_ids[0]]),
}, timeout=10)
# 4. 先推进依赖任务到 blocked(必须在依赖完成之前)
for status in ["claimed", "working", "blocked"]:
http_requests.post(
f"{API_BASE}/api/projects/{pid}/tasks/{dep_id}/status",
json={"status": status, "agent": "test"}, timeout=10,
)
# 5. 再推进 setup 子任务到 done(触发依赖推进条件)
for status in ["claimed", "working", "review", "done"]:
http_requests.post(
f"{API_BASE}/api/projects/{pid}/tasks/{child_ids[0]}/status",
json={"status": status, "agent": "test"}, timeout=10,
)
# 6. 等待 Ticker 依赖推进(1-2个tick
print(f"\n🚀 E10a: 等待依赖推进 (pid={pid})")
dep_result = self._poll_task(
pid, dep_id, timeout=MAX_WAIT_DISPATCH,
terminal_states=("pending", "claimed", "working", "done"),
)
dep_status = dep_result.get("status")
print(f" 依赖任务状态: blocked → {dep_status}")
# blocked 应被推进为 pending
assert dep_status != "blocked", (
f"依赖推进未生效!{dep_id}{MAX_WAIT_DISPATCH}s 后仍为 blocked"
)
# 7. 发送 Mail
http_requests.post(f"{API_BASE}/api/mail", json={
"title": f"E10a全链路通知-{pid}",
"text": f"项目 {pid} setup阶段完成",
"from": "simayi-challenger",
"to": "pangtong-fujunshi",
"type": "inform",
}, timeout=10)
# 8. 验证 Mail
resp = http_requests.get(
f"{API_BASE}/api/mail?from_agent=simayi-challenger", timeout=10
)
mails = resp.json()["mails"]
assert any(m["title"].startswith("E10a全链路") for m in mails), \
f"Mail未找到,当前mails: {[m['title'] for m in mails]}"
# 9. 验证 Stage 进度
resp = http_requests.get(
f"{API_BASE}/api/projects/{pid}/tasks/{parent_id}/progress", timeout=10
)
if resp.status_code == 200:
progress = resp.json()
stages = {s["id"]: s for s in progress.get("stages", [])}
assert stages["setup"]["done"] == 1, f"setup stage should be done"
assert stages["execute"]["done"] == 0
# 10. 验证父状态聚合
parent_resp = http_requests.get(
f"{API_BASE}/api/projects/{pid}/tasks/{parent_id}", timeout=10
)
parent_data = parent_resp.json()
print(f" 父任务状态: {parent_data.get('status')}")
# 1done+1pending+1pending → 应该在 pending/working
assert parent_data.get("status") in ("pending", "working"), \
f"父任务状态异常: {parent_data['status']}"
print(f" ✅ E10a 全链路测试通过")
def test_e10b_agent_full_chain(self):
"""E10b: 真实Agent全链路 — 创建子任务 → Agent执行 → 父状态自动聚合"""
pid = self._create_project("E10b")
# 1. 创建父任务
parent_id = f"{pid}-parent"
http_requests.post(f"{API_BASE}/api/projects/{pid}/tasks", json={
"id": parent_id,
"title": "E10b Agent全链路父任务",
"status": "pending",
"stages_json": json.dumps([
{"id": "step1", "label": "Step 1"},
{"id": "step2", "label": "Step 2"},
]),
}, timeout=10)
# 2. 创建子任务(真实Agent执行)
child_id = f"{pid}-child-0"
http_requests.post(f"{API_BASE}/api/projects/{pid}/tasks", json={
"id": child_id,
"title": "E2E子任务:echo test",
"description": (
"请执行 echo test 并标记done。"
"这是E2E测试,不需要做其他事。"
),
"status": "pending",
"parent_task": parent_id,
"stage": "step1",
"assignee": "zhangfei-dev",
"task_type": "coding",
}, timeout=10)
# 3. 等待Agent执行完成
print(f"\n🚀 E10b: 等待Agent执行子任务 (pid={pid}, tid={child_id})")
result = self._poll_task(
pid, child_id, timeout=MAX_WAIT_AGENT,
terminal_states=("done", "failed", "cancelled", "blocked"),
)
child_status = result.get("status")
print(f" 子任务最终状态: {child_status}")
assert child_status != "pending", (
f"子任务未被调度!{MAX_WAIT_AGENT}s后仍为pending"
)
# 4. 轮询父任务状态变化(等待Ticker聚合)
parent_result = self._poll_task(
pid, parent_id, timeout=MAX_WAIT_DISPATCH,
terminal_states=("working", "review", "done", "failed"),
)
parent_data = parent_result
print(f" 父任务状态: {parent_data.get('status')}")
# 5. 验证 Stage 进度
resp = http_requests.get(
f"{API_BASE}/api/projects/{pid}/tasks/{parent_id}/progress", timeout=10
)
if resp.status_code == 200:
progress = resp.json()
stages = {s["id"]: s for s in progress.get("stages", [])}
print(f" Stage进度: step1.done={stages.get('step1', {}).get('done', '?')}")
print(f" ✅ E10b 真实Agent全链路完成")