feat(experts): add SharedWorkspace state offloading for long-horizon runs

U4: ExpertTeam accepts redis_client, passes to SharedWorkspace. After phase completion, full result is written to workspace and in-memory phase.result is replaced with a 500-char summary + _ref_key. Dependency output reading resolves offloaded content from workspace on demand, with graceful fallback to summary on read failure. Tests: 8 scenarios (offload creation, short content, dependency resolution, workspace failure fallback, non-offloaded passthrough, redis_client wiring, memory dict fallback, pipeline integration) — all pass.
2026-06-24 20:32:10 +08:00 · 2026-06-24 20:32:10 +08:00 · ef84e3fd53
parent 122173ec2c
commit ef84e3fd53
4 changed files with 204 additions and 7 deletions
--- a/src/agentkit/experts/orchestrator.py
+++ b/src/agentkit/experts/orchestrator.py
@ -441,6 +441,40 @@ class TeamOrchestrator:

        return phases

+    # U4: State offloading helpers — keep memory lean for long-horizon runs.
+
+    _OFFLOAD_SUMMARY_LIMIT = 500
+
+    def _offload_result(self, content: str, ref_key: str) -> dict[str, Any]:
+        """Create an offloaded result: summary in memory, full content in workspace."""
+        summary = (
+            content[: self._OFFLOAD_SUMMARY_LIMIT] + "..."
+            if len(content) > self._OFFLOAD_SUMMARY_LIMIT
+            else content
+        )
+        return {
+            "content": summary,
+            "_ref_key": ref_key,
+            "_offloaded": True,
+        }
+
+    async def _read_dependency_output(self, dep_phase: PlanPhase) -> str:
+        """Read a dependency phase's output, resolving offloaded content from workspace."""
+        if not dep_phase.result:
+            return ""
+        content = dep_phase.result.get("content", str(dep_phase.result))
+        # U4: If offloaded, read full content from workspace
+        if dep_phase.result.get("_offloaded"):
+            ref_key = dep_phase.result.get("_ref_key", "")
+            if ref_key:
+                try:
+                    full_data = await self._team.workspace.read(ref_key)
+                    if full_data:
+                        return full_data.get("value", content)
+                except Exception as e:
+                    logger.warning(f"Failed to read offloaded output '{ref_key}': {e}")
+        return content
+
    async def _execute_phase(self, phase: PlanPhase, plan: TeamPlan) -> dict[str, Any]:
        """Execute a single phase, dispatching by phase_type.

@ -504,8 +538,9 @@ class TeamOrchestrator:
                for dep_id in phase.depends_on:
                    dep_phase = plan.get_phase(dep_id)
                    if dep_phase and dep_phase.status == PhaseStatus.COMPLETED and dep_phase.result:
-                        dependency_outputs[dep_phase.name] = dep_phase.result.get(
-                            "content", str(dep_phase.result)
+                        # U4: Resolve offloaded content from workspace if needed
+                        dependency_outputs[dep_phase.name] = await self._read_dependency_output(
+                            dep_phase
                        )

                # 按协作契约读取相关专家的输出（可见性 — 打破上下文隔离，但限定在契约范围内）
@ -519,8 +554,10 @@ class TeamOrchestrator:
                                and prev_phase.status == PhaseStatus.COMPLETED
                                and prev_phase.result
                            ):
-                                content = prev_phase.result.get("content", str(prev_phase.result))
-                                collaboration_outputs[contract.from_expert] = content
+                                # U4: Resolve offloaded content from workspace
+                                collaboration_outputs[contract.from_expert] = (
+                                    await self._read_dependency_output(prev_phase)
+                                )
                                break

                # Emit expert_step event
@ -635,14 +672,17 @@ class TeamOrchestrator:
                if passed:
                    # 验收通过 — 写入 SharedWorkspace + 通知协作方 + 标记完成
                    phase.status = PhaseStatus.COMPLETED
-                    phase.result = result
                    # P2: SharedWorkspace 写入移到验收通过后 — 避免持久化被拒输出
                    output_key = f"{plan.id}/phase/{phase.id}/output"
+                    full_content = result.get("content", str(result))
                    await self._team.workspace.write(
                        output_key,
-                        result.get("content", str(result)),
+                        full_content,
                        expert.config.name,
                    )
+                    # U4: State offloading — keep only summary in memory,
+                    # full content lives in workspace (Redis or local dict).
+                    phase.result = self._offload_result(full_content, output_key)
                    await self._broadcast_event(
                        "review_result",
                        {
--- a/src/agentkit/experts/team.py
+++ b/src/agentkit/experts/team.py
@ -17,6 +17,7 @@ import enum
 import logging
 import time
 import uuid
+from typing import Any

 from .config import ExpertConfig
 from .expert import Expert
@ -62,9 +63,12 @@ class ExpertTeam:
        workspace: SharedWorkspace | None = None,
        pool: AgentPool | None = None,
        template_registry: ExpertTemplateRegistry | None = None,
+        redis_client: Any = None,
    ):
        self.team_id = team_id or str(uuid.uuid4())
-        self._workspace = workspace or SharedWorkspace()
+        # U4: Accept redis_client for SharedWorkspace state offloading.
+        # If workspace is explicitly provided, redis_client is ignored.
+        self._workspace = workspace or SharedWorkspace(redis_client=redis_client)
        self._pool = pool
        self._template_registry = template_registry or ExpertTemplateRegistry()
        self._handoff_transport = InProcessHandoffTransport()
--- a/src/agentkit/server/routes/chat.py
+++ b/src/agentkit/server/routes/chat.py
@ -407,6 +407,7 @@ async def _execute_team_collab(
    team = ExpertTeam(
        pool=app_state.agent_pool,
        template_registry=template_registry,
+        redis_client=getattr(app_state, "working_redis_client", None),
    )

    # Register handoff_transport handler to relay team events to WebSocket
--- a/tests/unit/experts/test_team_orchestrator.py
+++ b/tests/unit/experts/test_team_orchestrator.py
@ -1183,3 +1183,155 @@ class TestConcurrencyLimit:
        # 4 experts, semaphore limit=3 → max 3 concurrent
        assert tracker.max_seen <= 3
        assert tracker.max_seen >= 2  # At least some parallelism
+
+
+# ── U4: SharedWorkspace Redis 化 + 状态卸载测试 ─────────────
+
+
+class TestSharedWorkspaceRedis:
+    """U4: SharedWorkspace 状态卸载 — 阶段输出写入 workspace，内存只保留摘要"""
+
+    def test_offload_result_creates_summary_with_ref(self):
+        """_offload_result 返回摘要 + _ref_key + _offloaded=True"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        long_content = "x" * 1000
+        result = orchestrator._offload_result(long_content, "plan/phase/p1/output")
+
+        assert result["_offloaded"] is True
+        assert result["_ref_key"] == "plan/phase/p1/output"
+        assert len(result["content"]) < len(long_content)
+        assert result["content"].endswith("...")
+
+    def test_offload_result_short_content_no_truncation(self):
+        """短内容不截断，但仍标记为 offloaded"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        short_content = "short result"
+        result = orchestrator._offload_result(short_content, "ref_key")
+
+        assert result["_offloaded"] is True
+        assert result["content"] == short_content
+
+    @pytest.mark.asyncio
+    async def test_read_dependency_output_resolves_offloaded(self):
+        """Happy path: offloaded result → 从 workspace 读取完整内容"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        # Write full content to workspace
+        full_content = "x" * 1000
+        ref_key = "plan/phase/p1/output"
+        await team.workspace.write(ref_key, full_content, "lead")
+
+        # Create a phase with offloaded result
+        dep_phase = PlanPhase(
+            id="p1",
+            name="Phase1",
+            assigned_expert="lead",
+            task_description="test",
+            depends_on=[],
+        )
+        dep_phase.status = PhaseStatus.COMPLETED
+        dep_phase.result = orchestrator._offload_result(full_content, ref_key)
+
+        # Read should return full content from workspace
+        content = await orchestrator._read_dependency_output(dep_phase)
+        assert content == full_content
+
+    @pytest.mark.asyncio
+    async def test_read_dependency_output_falls_back_on_workspace_failure(self):
+        """Edge case: workspace 读取失败 → 降级到内存摘要"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        dep_phase = PlanPhase(
+            id="p1",
+            name="Phase1",
+            assigned_expert="lead",
+            task_description="test",
+            depends_on=[],
+        )
+        dep_phase.status = PhaseStatus.COMPLETED
+        dep_phase.result = {
+            "content": "summary content",
+            "_ref_key": "nonexistent_key",
+            "_offloaded": True,
+        }
+
+        # Workspace read returns None (key doesn't exist) → fallback to summary
+        content = await orchestrator._read_dependency_output(dep_phase)
+        assert content == "summary content"
+
+    @pytest.mark.asyncio
+    async def test_read_dependency_output_non_offloaded_returns_directly(self):
+        """Non-offloaded result → 直接返回 content"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        dep_phase = PlanPhase(
+            id="p1",
+            name="Phase1",
+            assigned_expert="lead",
+            task_description="test",
+            depends_on=[],
+        )
+        dep_phase.status = PhaseStatus.COMPLETED
+        dep_phase.result = {"content": "direct content"}
+
+        content = await orchestrator._read_dependency_output(dep_phase)
+        assert content == "direct content"
+
+    @pytest.mark.asyncio
+    async def test_team_accepts_redis_client(self):
+        """ExpertTeam 创建时接收 redis_client 参数"""
+        mock_redis = AsyncMock()
+        team = ExpertTeam(redis_client=mock_redis)
+
+        assert team._workspace._redis is mock_redis
+
+    @pytest.mark.asyncio
+    async def test_team_without_redis_uses_memory_dict(self):
+        """ExpertTeam 无 redis_client → 使用内存 dict"""
+        team = ExpertTeam()
+
+        assert team._workspace._redis is None
+        assert team._workspace._local_store == {}
+
+    @pytest.mark.asyncio
+    async def test_pipeline_offloads_large_results(self):
+        """Integration: 流水线执行后，大输出被卸载到 workspace"""
+        team = _make_team_with_experts()
+        orchestrator = TeamOrchestrator(team)
+
+        gateway = _make_mock_llm_gateway(phases=[
+            {"name": "A", "assigned_expert": "lead", "task_description": "A", "depends_on": []},
+            {"name": "B", "assigned_expert": "member1", "task_description": "B", "depends_on": ["A"]},
+        ])
+        team._experts["lead"].agent._llm_gateway = gateway
+
+        # Mock _execute_phase to return large content + verify offloading
+        large_content = "x" * 1000
+
+        async def mock_execute_phase(phase, plan):
+            phase.status = PhaseStatus.COMPLETED
+            # Simulate the offloading that happens in _execute_execution_phase
+            output_key = f"{plan.id}/phase/{phase.id}/output"
+            await team.workspace.write(output_key, large_content, phase.assigned_expert)
+            phase.result = orchestrator._offload_result(large_content, output_key)
+            return phase.result
+
+        orchestrator._execute_phase = mock_execute_phase
+        orchestrator._check_divergence_and_insert_debates = AsyncMock(return_value=None)
+
+        result = await orchestrator.execute("test")
+
+        assert result["status"] == "completed"
+        # Verify phases have offloaded results
+        plan = result["plan"]
+        for ph in plan.phases:
+            if ph.status == PhaseStatus.COMPLETED:
+                assert ph.result.get("_offloaded") is True
+                assert len(ph.result["content"]) < len(large_content)