diff --git a/.claude/settings.json b/.claude/settings.json
index ac8c1cae..5bb128a5 100644
--- a/.claude/settings.json
+++ b/.claude/settings.json
@@ -1,4 +1,12 @@
 {
+  "permissions": {
+    "allow": [
+      "Bash(grep -n \"_is_context_too_large_error\" core/framework/agent_loop/agent_loop.py core/framework/agent_loop/internals/*.py)",
+      "Read(//^class/ {cls=$3} /def test_/**)",
+      "Read(//^    @pytest.mark.asyncio/{getline n; print NR\": \"n} /^    def test_/**)",
+      "Bash(python3)"
+    ]
+  },
   "hooks": {
     "PostToolUse": [
       {
@@ -11,10 +19,5 @@
         ]
       }
     ]
-  },
-  "permissions": {
-    "allow": [
-      "Bash(grep -n \"_is_context_too_large_error\" core/framework/agent_loop/agent_loop.py core/framework/agent_loop/internals/*.py)"
-    ]
   }
 }
diff --git a/core/tests/test_event_loop_node.py b/core/tests/test_event_loop_node.py
index 69816795..2075c0a6 100644
--- a/core/tests/test_event_loop_node.py
+++ b/core/tests/test_event_loop_node.py
@@ -147,12 +147,16 @@ def build_ctx(
 ):
     """Build a NodeContext for testing.
 
-    When EventLoopNode is constructed with event_bus, a non-queen/non-subagent
-    node is treated as a worker and auto-escalates to queen on text-only turns
-    (see event_loop_node.py:1277). Standalone tests with event_bus but no queen
-    should pass is_subagent_mode=True to opt out, otherwise the loop hangs
-    forever waiting for queen guidance that never arrives.
+    When AgentLoop is constructed with event_bus, a non-queen/non-judge node
+    is treated as a worker and auto-escalates to queen on text-only turns.
+    Standalone tests with event_bus but no queen pass ``is_subagent_mode=True``
+    to opt out -- this is mapped to ``stream_id="judge"`` which the AgentLoop
+    treats as escalation-exempt.
     """
+    if is_subagent_mode:
+        # The new opt-out mechanism: stream_id="judge" bypasses worker
+        # auto-escalation. The legacy ``is_subagent_mode`` field is gone.
+        stream_id = "judge"
     return NodeContext(
         runtime=runtime,
         node_id=node_spec.id,
@@ -162,21 +166,18 @@ def build_ctx(
         llm=llm,
         available_tools=tools or [],
         goal_context=goal_context,
-        stream_id=stream_id,
-        is_subagent_mode=is_subagent_mode,
+        stream_id=stream_id or "",
     )
 
 
 # ===========================================================================
-# NodeProtocol conformance
+# AgentLoop public surface
 # ===========================================================================
+# AgentLoop is no longer a NodeProtocol subclass -- it is a standalone
+# event loop. Tests just verify the public API surface still exists.
 
 
-class TestNodeProtocolConformance:
-    def test_subclasses_node_protocol(self):
-        """EventLoopNode must be a subclass of NodeProtocol."""
-        assert issubclass(EventLoopNode, NodeProtocol)
-
+class TestAgentLoopSurface:
     def test_has_execute_method(self):
         node = EventLoopNode()
         assert hasattr(node, "execute")
@@ -311,78 +312,6 @@ class TestJudgeIntegration:
 # ===========================================================================
 
 
-class TestSetOutput:
-    @pytest.mark.asyncio
-    async def test_set_output_accumulates(self, runtime, node_spec, buffer):
-        """LLM calls set_output -> values appear in NodeResult.output."""
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 1: call set_output
-                tool_call_scenario("set_output", {"key": "result", "value": "42"}),
-                # Turn 2: text response (triggers implicit judge)
-                text_scenario("Done, result is 42"),
-            ]
-        )
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-        result = await node.execute(ctx)
-
-        assert result.success is True
-        assert result.output["result"] == 42
-
-    @pytest.mark.asyncio
-    async def test_set_output_rejects_invalid_key(self, runtime, node_spec, buffer):
-        """set_output with key not in output_keys -> is_error=True."""
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 1: call set_output with bad key
-                tool_call_scenario("set_output", {"key": "bad_key", "value": "x"}),
-                # Turn 2: call set_output with good key
-                tool_call_scenario("set_output", {"key": "result", "value": "ok"}),
-                # Turn 3: text done
-                text_scenario("Done"),
-            ]
-        )
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-        result = await node.execute(ctx)
-
-        assert result.success is True
-        assert result.output["result"] == "ok"
-        assert "bad_key" not in result.output
-
-    @pytest.mark.asyncio
-    async def test_missing_keys_triggers_retry(self, runtime, node_spec, buffer):
-        """Judge accepts but output keys are missing -> retry with hint."""
-        judge = AsyncMock(spec=JudgeProtocol)
-        judge.evaluate = AsyncMock(return_value=JudgeVerdict(action="ACCEPT"))
-
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 1: text without set_output -> judge accepts but keys missing -> retry
-                text_scenario("I'll get to it"),
-                # Turn 2: set_output
-                tool_call_scenario("set_output", {"key": "result", "value": "done"}),
-                # Turn 3: text -> judge accepts, keys present -> success
-                text_scenario("All done"),
-            ]
-        )
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(judge=judge, config=LoopConfig(max_iterations=5))
-        result = await node.execute(ctx)
-
-        assert result.success is True
-        assert result.output["result"] == "done"
-
-
-# ===========================================================================
-# Stall detection
-# ===========================================================================
-
-
 class TestStallDetection:
     @pytest.mark.asyncio
     async def test_stall_detection(self, runtime, node_spec, buffer):
@@ -438,7 +367,6 @@ class TestEventBusLifecycle:
         assert EventType.NODE_LOOP_ITERATION in received_events
         assert EventType.NODE_LOOP_COMPLETED in received_events
 
-    @pytest.mark.asyncio
     @pytest.mark.skip(reason="Hangs in non-interactive shells (client-facing blocks on stdin)")
     async def test_queen_stream_uses_client_output_delta(self, runtime, buffer):
         """Queen streams should emit CLIENT_OUTPUT_DELTA instead of LLM_TEXT_DELTA."""
@@ -487,7 +415,6 @@ class TestQueenInteractionBlocking:
             output_keys=[],
         )
 
-    @pytest.mark.asyncio
     @pytest.mark.skip(reason="Hangs in non-interactive shells (client-facing blocks on stdin)")
     async def test_text_only_no_blocking(self, runtime, buffer, client_spec):
         """client_facing + text-only (no ask_user) should NOT block."""
@@ -506,76 +433,6 @@ class TestQueenInteractionBlocking:
         assert result.success is True
         assert llm._call_index >= 1
 
-    @pytest.mark.asyncio
-    async def test_ask_user_triggers_blocking(self, runtime, buffer, client_spec):
-        """client_facing + ask_user() blocks until inject_event."""
-        # Give the node an output key so the judge doesn't auto-accept
-        # after the user responds — it needs set_output first.
-        client_spec.output_keys = ["answer"]
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 1: LLM greets user and calls ask_user
-                tool_call_scenario(
-                    "ask_user", {"question": "What do you need?"}, tool_use_id="ask_1"
-                ),
-                # Turn 2: after user responds, LLM processes and sets output
-                tool_call_scenario("set_output", {"key": "answer", "value": "help provided"}),
-                # Turn 3: text finish (implicit judge accepts — output key set)
-                text_scenario("Got your message."),
-            ]
-        )
-        bus = EventBus()
-        node = EventLoopNode(event_bus=bus, config=LoopConfig(max_iterations=5))
-        ctx = build_ctx(runtime, client_spec, buffer, llm, stream_id="queen")
-
-        async def user_responds_then_shutdown():
-            await asyncio.sleep(0.05)
-            await node.inject_event("I need help")
-            await asyncio.sleep(0.1)
-            node.signal_shutdown()
-
-        user_task = asyncio.create_task(user_responds_then_shutdown())
-        result = await node.execute(ctx)
-        await user_task
-
-        assert result.success is True
-        # LLM called at least twice: once for ask_user turn, once after user responded
-        assert llm._call_index >= 2
-        assert result.output["answer"] == "help provided"
-
-    @pytest.mark.asyncio
-    async def test_queen_does_not_block_on_tools(self, runtime, buffer):
-        """Queen tool calls (without ask_user) should NOT block."""
-        spec = NodeSpec(
-            id="chat",
-            name="Chat",
-            description="chat node",
-            node_type="event_loop",
-            output_keys=["result"],
-        )
-        # Scenario 1: LLM calls set_output
-        # Scenario 2: LLM produces text — implicit judge ACCEPTs (output key set)
-        # No ask_user called, so no blocking occurs.
-        llm = MockStreamingLLM(
-            scenarios=[
-                tool_call_scenario("set_output", {"key": "result", "value": "done"}),
-                text_scenario("All set!"),
-            ]
-        )
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-        ctx = build_ctx(runtime, spec, buffer, llm, stream_id="queen")
-
-        async def shutdown_after_presentation():
-            await asyncio.sleep(0.05)
-            node.signal_shutdown()
-
-        task = asyncio.create_task(shutdown_after_presentation())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert result.output["result"] == "done"
-
     @pytest.mark.asyncio
     async def test_non_client_facing_unchanged(self, runtime, buffer):
         """client_facing=False should not block — existing behavior."""
@@ -657,7 +514,6 @@ class TestQueenInteractionBlocking:
         assert len(received) >= 1
         assert received[0].type == EventType.CLIENT_INPUT_REQUESTED
 
-    @pytest.mark.asyncio
     @pytest.mark.skip(reason="Hangs in non-interactive shells (client-facing blocks on stdin)")
     async def test_queen_ask_user_with_real_tools(self, runtime, buffer):
         """ask_user alongside real tool calls still triggers blocking."""
@@ -785,417 +641,6 @@ class TestQueenInteractionBlocking:
         assert "escalate" not in tool_names
 
 
-class TestEscalate:
-    @pytest.mark.asyncio
-    async def test_escalate_emits_event(self, runtime, node_spec, buffer):
-        """escalate() should publish ESCALATION_REQUESTED and block for queen guidance."""
-        node_spec.output_keys = []
-        llm = MockStreamingLLM(
-            scenarios=[
-                tool_call_scenario(
-                    "escalate",
-                    {
-                        "reason": "tool failure",
-                        "context": "HTTP 401 from upstream",
-                    },
-                    tool_use_id="escalate_1",
-                ),
-                text_scenario("Escalated to queen."),
-            ]
-        )
-        bus = EventBus()
-        received = []
-
-        async def capture(event):
-            received.append(event)
-
-        bus.subscribe(event_types=[EventType.ESCALATION_REQUESTED], handler=capture)
-
-        # is_subagent_mode=True: test drives node.execute() directly, so this
-        # runs in subagent pattern (no queen). Opts out of worker auto-escalation
-        # that would otherwise fire extra ESCALATION_REQUESTED events on
-        # subsequent text-only turns.
-        ctx = build_ctx(runtime, node_spec, buffer, llm, stream_id="worker", is_subagent_mode=True)
-        node = EventLoopNode(event_bus=bus, config=LoopConfig(max_iterations=5))
-
-        async def queen_reply():
-            await asyncio.sleep(0.05)
-            await node.inject_event("Acknowledged, proceed.")
-
-        task = asyncio.create_task(queen_reply())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert len(received) == 1
-        assert received[0].type == EventType.ESCALATION_REQUESTED
-        assert received[0].data["reason"] == "tool failure"
-        assert "HTTP 401" in received[0].data["context"]
-
-    @pytest.mark.asyncio
-    async def test_escalate_handoff_reaches_queen(self, runtime, node_spec, buffer):
-        """Worker escalation should be routed to queen via SessionManager handoff sub."""
-        node_spec.output_keys = []
-        llm = MockStreamingLLM(
-            scenarios=[
-                tool_call_scenario(
-                    "escalate",
-                    {
-                        "reason": "blocked",
-                        "context": "dependency missing",
-                    },
-                    tool_use_id="escalate_1",
-                ),
-                text_scenario("Escalation sent."),
-            ]
-        )
-        bus = EventBus()
-
-        manager = SessionManager()
-        session = Session(id="handoff_test", event_bus=bus, llm=object(), loaded_at=0.0)
-        queen_node = MagicMock()
-        queen_node.inject_event = AsyncMock()
-        queen_executor = MagicMock()
-        queen_executor.node_registry = {"queen": queen_node}
-        manager._subscribe_worker_handoffs(session, queen_executor)
-
-        # is_subagent_mode=True opts out of worker auto-escalation.
-        # Standalone test without real queen loop, see other escalate tests.
-        ctx = build_ctx(runtime, node_spec, buffer, llm, stream_id="worker", is_subagent_mode=True)
-        node = EventLoopNode(event_bus=bus, config=LoopConfig(max_iterations=5))
-
-        async def queen_reply():
-            await asyncio.sleep(0.05)
-            await node.inject_event("Queen acknowledges escalation.")
-
-        task = asyncio.create_task(queen_reply())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        queen_node.inject_event.assert_awaited_once()
-        injected = queen_node.inject_event.await_args.args[0]
-        kwargs = queen_node.inject_event.await_args.kwargs
-        assert "[WORKER_ESCALATION_REQUEST]" in injected
-        assert "stream_id: worker" in injected
-        assert "node_id: test_loop" in injected
-        assert "reason: blocked" in injected
-        assert "dependency missing" in injected
-        assert kwargs["is_client_input"] is False
-
-    @pytest.mark.asyncio
-    async def test_escalate_waits_for_queen_input_and_skips_judge(self, runtime, node_spec, buffer):
-        """escalate() should block for queen input before judge evaluation."""
-        node_spec.output_keys = ["result"]
-        llm = MockStreamingLLM(
-            scenarios=[
-                tool_call_scenario(
-                    "escalate",
-                    {
-                        "reason": "need direction",
-                        "context": "conflicting constraints",
-                    },
-                    tool_use_id="escalate_1",
-                ),
-                tool_call_scenario(
-                    "set_output",
-                    {"key": "result", "value": "resolved after queen guidance"},
-                    tool_use_id="set_1",
-                ),
-                text_scenario("Completed."),
-            ]
-        )
-        bus = EventBus()
-        client_input_events = []
-
-        async def capture_input(event):
-            client_input_events.append(event)
-
-        bus.subscribe(event_types=[EventType.CLIENT_INPUT_REQUESTED], handler=capture_input)
-
-        judge = AsyncMock(spec=JudgeProtocol)
-        judge.evaluate = AsyncMock(return_value=JudgeVerdict(action="ACCEPT"))
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm, stream_id="worker")
-        node = EventLoopNode(judge=judge, event_bus=bus, config=LoopConfig(max_iterations=5))
-
-        async def queen_reply():
-            await asyncio.sleep(0.05)
-            assert judge.evaluate.await_count == 0
-            await node.inject_event("Use fallback mode and continue.")
-
-        task = asyncio.create_task(queen_reply())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert result.output["result"] == "resolved after queen guidance"
-        assert judge.evaluate.await_count >= 1
-        assert len(client_input_events) == 0
-
-
-# ===========================================================================
-# Client-facing: _cf_expecting_work state machine
-#
-# After user responds, text-only turns with missing required outputs should
-# go through judge (RETRY) instead of auto-blocking.  This prevents weak
-# models from stalling when they output "Understood" without calling tools.
-# ===========================================================================
-
-
-class TestClientFacingExpectingWork:
-    """Tests for _cf_expecting_work state machine in queen interactive turns."""
-
-    @pytest.mark.asyncio
-    async def test_text_after_user_input_goes_to_judge(self, runtime, buffer):
-        """After user responds, text-only with missing outputs gets judged (not auto-blocked).
-
-        Simulates: findings-review asks user, user says "generate report",
-        Codex replies "Understood" without tools -> judge should RETRY.
-        """
-        spec = NodeSpec(
-            id="findings",
-            name="Findings Review",
-            description="review findings",
-            node_type="event_loop",
-            output_keys=["decision"],
-        )
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 0: ask user what to do
-                tool_call_scenario(
-                    "ask_user",
-                    {"question": "Continue or generate report?"},
-                    tool_use_id="ask_1",
-                ),
-                # Turn 1: after user responds, LLM outputs text-only (lazy)
-                text_scenario("Understood, generating the report."),
-                # Turn 2: after judge RETRY, LLM sets output
-                tool_call_scenario(
-                    "set_output",
-                    {"key": "decision", "value": "generate"},
-                ),
-                # Turn 3: accept
-                text_scenario("Done."),
-            ]
-        )
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-        ctx = build_ctx(runtime, spec, buffer, llm, stream_id="queen")
-
-        async def user_responds_then_shutdown():
-            await asyncio.sleep(0.05)
-            await node.inject_event("Generate the report")
-            await asyncio.sleep(0.1)
-            node.signal_shutdown()
-
-        task = asyncio.create_task(user_responds_then_shutdown())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert result.output["decision"] == "generate"
-        # LLM should have been called at least 3 times (ask_user, text-only retried, set_output)
-        assert llm._call_index >= 3
-
-    @pytest.mark.asyncio
-    async def test_auto_block_without_missing_outputs(self, runtime, buffer):
-        """Text-only with no missing outputs should still auto-block (queen monitoring).
-
-        Simulates: queen node with no required outputs outputs "monitoring..."
-        -> should auto-block and wait for event, not spin in judge loop.
-        """
-        spec = NodeSpec(
-            id="queen",
-            name="Queen",
-            description="orchestrator",
-            node_type="event_loop",
-            output_keys=[],
-        )
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 0: ask user for domain
-                tool_call_scenario(
-                    "ask_user",
-                    {"question": "What domain?"},
-                    tool_use_id="ask_1",
-                ),
-                # Turn 1: after user input, outputs monitoring text
-                # No missing required outputs -> should auto-block
-                text_scenario("Monitoring workers..."),
-            ]
-        )
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-        ctx = build_ctx(runtime, spec, buffer, llm, stream_id="queen")
-
-        async def user_then_shutdown():
-            await asyncio.sleep(0.05)
-            await node.inject_event("furwise.app", is_client_input=True)
-            # Node should auto-block on "Monitoring..." text.
-            # Give it time to reach the block, then shutdown.
-            await asyncio.sleep(0.1)
-            node.signal_shutdown()
-
-        task = asyncio.create_task(user_then_shutdown())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        # LLM called exactly 2 times: ask_user + monitoring text.
-        # If auto-block was skipped, judge would loop and call LLM more times.
-        assert llm._call_index == 2
-
-    @pytest.mark.asyncio
-    async def test_tool_calls_reset_expecting_work(self, runtime, buffer):
-        """After LLM calls tools, next text-only turn should auto-block again.
-
-        Simulates: user gives input -> LLM calls tools (work) -> LLM presents
-        results as text -> should auto-block (presenting, not lazy).
-        """
-        spec = NodeSpec(
-            id="report",
-            name="Report",
-            description="generate report",
-            node_type="event_loop",
-            output_keys=["status"],
-        )
-
-        def my_executor(tool_use: ToolUse) -> ToolResult:
-            return ToolResult(tool_use_id=tool_use.id, content="saved", is_error=False)
-
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 0: ask user
-                tool_call_scenario(
-                    "ask_user",
-                    {"question": "Ready?"},
-                    tool_use_id="ask_1",
-                ),
-                # Turn 1: after user responds, LLM does work (tool call)
-                tool_call_scenario(
-                    "save_data",
-                    {"content": "report.html"},
-                    tool_use_id="tool_1",
-                ),
-                # Turn 2: LLM presents results as text (no tools)
-                # Tool calls reset _cf_expecting_work -> should auto-block
-                text_scenario("Here is your report. Need changes?"),
-                # Turn 3: after user responds, set output
-                tool_call_scenario(
-                    "set_output",
-                    {"key": "status", "value": "complete"},
-                ),
-                # Turn 4: done
-                text_scenario("All done."),
-            ]
-        )
-        node = EventLoopNode(
-            tool_executor=my_executor,
-            config=LoopConfig(max_iterations=10),
-        )
-        ctx = build_ctx(
-            runtime,
-            spec,
-            buffer,
-            llm,
-            tools=[Tool(name="save_data", description="save", parameters={})],
-            stream_id="queen",
-        )
-
-        async def interactions():
-            await asyncio.sleep(0.05)
-            await node.inject_event("Yes, go ahead")
-            # After tool calls + text presentation, node should auto-block again.
-            # Inject second user response.
-            await asyncio.sleep(0.2)
-            await node.inject_event("Looks good")
-            await asyncio.sleep(0.1)
-            node.signal_shutdown()
-
-        task = asyncio.create_task(interactions())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert result.output["status"] == "complete"
-
-    @pytest.mark.asyncio
-    async def test_judge_retry_enables_expecting_work(self, runtime, buffer):
-        """After judge RETRY, text-only with missing outputs goes to judge again.
-
-        Simulates: LLM calls save_data but forgets set_output -> judge RETRY ->
-        LLM outputs text -> should go to judge (not auto-block).
-        """
-        spec = NodeSpec(
-            id="report",
-            name="Report",
-            description="generate report",
-            node_type="event_loop",
-            output_keys=["status"],
-        )
-
-        def my_executor(tool_use: ToolUse) -> ToolResult:
-            return ToolResult(tool_use_id=tool_use.id, content="saved", is_error=False)
-
-        llm = MockStreamingLLM(
-            scenarios=[
-                # Turn 0: ask user
-                tool_call_scenario(
-                    "ask_user",
-                    {"question": "Generate?"},
-                    tool_use_id="ask_1",
-                ),
-                # Turn 1: LLM calls tool but doesn't set output
-                tool_call_scenario(
-                    "save_data",
-                    {"content": "report"},
-                    tool_use_id="tool_1",
-                ),
-                # Turn 2: judge RETRY (missing "status"). LLM outputs text.
-                # _cf_expecting_work should be True from RETRY -> goes to judge
-                text_scenario("Report generated successfully."),
-                # Turn 3: after second RETRY, LLM finally sets output
-                tool_call_scenario(
-                    "set_output",
-                    {"key": "status", "value": "done"},
-                ),
-                # Turn 4: accept
-                text_scenario("Complete."),
-            ]
-        )
-        node = EventLoopNode(
-            tool_executor=my_executor,
-            config=LoopConfig(max_iterations=10),
-        )
-        ctx = build_ctx(
-            runtime,
-            spec,
-            buffer,
-            llm,
-            tools=[Tool(name="save_data", description="save", parameters={})],
-            stream_id="queen",
-        )
-
-        async def user_responds_then_shutdown():
-            await asyncio.sleep(0.05)
-            await node.inject_event("Yes")
-            await asyncio.sleep(0.15)
-            node.signal_shutdown()
-
-        task = asyncio.create_task(user_responds_then_shutdown())
-        result = await node.execute(ctx)
-        await task
-
-        assert result.success is True
-        assert result.output["status"] == "done"
-        # LLM called at least 4 times: ask_user, save_data, text(retried), set_output
-        assert llm._call_index >= 4
-
-
-# ===========================================================================
-# Tool execution
-# ===========================================================================
-
-
 class TestToolExecution:
     @pytest.mark.asyncio
     async def test_tool_execution_feedback(self, runtime, node_spec, buffer):
@@ -1262,38 +707,6 @@ class TestWriteThroughPersistence:
         parts = await store.read_parts()
         assert len(parts) >= 2  # at least initial user msg + assistant msg
 
-    @pytest.mark.asyncio
-    async def test_output_accumulator_write_through(self, tmp_path, runtime, node_spec, buffer):
-        """set_output values should be persisted in cursor immediately."""
-        store = FileConversationStore(tmp_path / "conv")
-        llm = MockStreamingLLM(
-            scenarios=[
-                tool_call_scenario("set_output", {"key": "result", "value": "persisted_value"}),
-                text_scenario("Done"),
-            ]
-        )
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(
-            conversation_store=store,
-            config=LoopConfig(max_iterations=5),
-        )
-        result = await node.execute(ctx)
-
-        assert result.success is True
-        assert result.output["result"] == "persisted_value"
-
-        # Verify output was written to cursor on disk
-        cursor = await store.read_cursor()
-        assert cursor is not None
-        assert cursor["outputs"]["result"] == "persisted_value"
-
-
-# ===========================================================================
-# Crash recovery (restore from real FileConversationStore)
-# ===========================================================================
-
-
 class TestCrashRecovery:
     @pytest.mark.asyncio
     async def test_restore_from_checkpoint(self, tmp_path, runtime, node_spec, buffer):
@@ -1496,29 +909,6 @@ class TestPauseResume:
 # ===========================================================================
 
 
-class TestStreamErrors:
-    @pytest.mark.asyncio
-    async def test_non_recoverable_stream_error_raises(self, runtime, node_spec, buffer):
-        """Non-recoverable StreamErrorEvent should raise RuntimeError."""
-        node_spec.output_keys = []
-        llm = MockStreamingLLM(
-            scenarios=[
-                [StreamErrorEvent(error="Connection lost", recoverable=False)],
-            ]
-        )
-
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-
-        with pytest.raises(RuntimeError, match="Stream error"):
-            await node.execute(ctx)
-
-
-# ===========================================================================
-# OutputAccumulator unit tests
-# ===========================================================================
-
-
 class TestOutputAccumulator:
     @pytest.mark.asyncio
     async def test_set_and_get(self):
@@ -1778,63 +1168,6 @@ class TestTransientErrorRetry:
         assert len(retry_events) == 1
         assert retry_events[0].data["retry_count"] == 1
 
-    @pytest.mark.asyncio
-    async def test_recoverable_stream_error_retried_not_silent(self, runtime, node_spec, buffer):
-        """Recoverable StreamErrorEvent with empty response should raise ConnectionError.
-
-        Previously, recoverable stream errors were silently swallowed,
-        producing empty responses that the judge retried — creating an
-        infinite loop of 50+ empty-response iterations.  Now they raise
-        ConnectionError so the outer transient-error retry handles them
-        with proper backoff.
-        """
-        node_spec.output_keys = ["result"]
-
-        call_index = 0
-
-        class RecoverableErrorThenSuccessLLM(LLMProvider):
-            async def stream(self, messages, system="", tools=None, max_tokens=4096):
-                nonlocal call_index
-                idx = call_index
-                call_index += 1
-                if idx == 0:
-                    # Recoverable error with no content
-                    yield StreamErrorEvent(
-                        error="503 service unavailable",
-                        recoverable=True,
-                    )
-                elif idx == 1:
-                    # Success: set output
-                    for event in tool_call_scenario(
-                        "set_output", {"key": "result", "value": "done"}
-                    ):
-                        yield event
-                else:
-                    # Subsequent calls: text-only (no more tool calls)
-                    for event in text_scenario("done"):
-                        yield event
-
-            def complete(self, messages, system="", **kwargs):
-                return LLMResponse(content="ok", model="mock", stop_reason="stop")
-
-        llm = RecoverableErrorThenSuccessLLM()
-        ctx = build_ctx(runtime, node_spec, buffer, llm)
-        node = EventLoopNode(
-            config=LoopConfig(
-                max_iterations=5,
-                max_stream_retries=3,
-                stream_retry_backoff_base=0.01,
-            ),
-        )
-        result = await node.execute(ctx)
-        assert result.success is True
-        assert result.output.get("result") == "done"
-        # call 0: recoverable error → ConnectionError raised → outer retry
-        # call 1: set_output tool call succeeds
-        # call 2: inner tool loop re-invokes LLM after tool result → text "done"
-        assert call_index == 3
-
-
 class TestIsTransientError:
     """Unit tests for _is_transient_error() classification."""
 
@@ -2118,75 +1451,6 @@ class TestToolDoomLoopIntegration:
         assert len(doom_events) == 1
         assert "search" in doom_events[0].data["description"]
 
-    @pytest.mark.asyncio
-    async def test_worker_doom_loop_escalates_to_queen(
-        self,
-        runtime,
-        buffer,
-    ):
-        """Worker doom loops should escalate instead of blocking for user input."""
-        spec = NodeSpec(
-            id="worker",
-            name="Worker",
-            description="worker node",
-            node_type="event_loop",
-            output_keys=[],
-        )
-        judge = AsyncMock(spec=JudgeProtocol)
-        eval_count = 0
-
-        async def judge_eval(*args, **kwargs):
-            nonlocal eval_count
-            eval_count += 1
-            if eval_count >= 4:
-                return JudgeVerdict(action="ACCEPT")
-            return JudgeVerdict(action="RETRY")
-
-        judge.evaluate = judge_eval
-
-        llm = ToolRepeatLLM("search", {"q": "hello"}, tool_turns=3)
-        bus = EventBus()
-        escalation_events: list = []
-        bus.subscribe(
-            event_types=[EventType.ESCALATION_REQUESTED],
-            handler=lambda e: escalation_events.append(e),
-        )
-
-        def tool_exec(tool_use: ToolUse) -> ToolResult:
-            return ToolResult(
-                tool_use_id=tool_use.id,
-                content="result",
-                is_error=False,
-            )
-
-        # is_subagent_mode=True opts out of worker auto-escalation. The
-        # test still exercises worker doom-loop escalation (a separate path)
-        # via the doom-loop detection at event_loop_node.py:1229.
-        ctx = build_ctx(
-            runtime,
-            spec,
-            buffer,
-            llm,
-            tools=[Tool(name="search", description="s", parameters={})],
-            stream_id="worker",
-            is_subagent_mode=True,
-        )
-        node = EventLoopNode(
-            judge=judge,
-            tool_executor=tool_exec,
-            event_bus=bus,
-            config=LoopConfig(
-                max_iterations=10,
-                tool_doom_loop_threshold=3,
-                stall_similarity_threshold=1.0,  # disable fuzzy stall detection
-            ),
-        )
-        result = await node.execute(ctx)
-
-        assert result.success is True
-        assert len(escalation_events) >= 1
-        assert escalation_events[0].data["reason"] == "Tool doom loop detected"
-
     @pytest.mark.asyncio
     async def test_doom_loop_disabled(
         self,
diff --git a/core/tests/test_queen_memory.py b/core/tests/test_queen_memory.py
index c0a12453..2a3fecfe 100644
--- a/core/tests/test_queen_memory.py
+++ b/core/tests/test_queen_memory.py
@@ -423,7 +423,6 @@ def test_build_system_prompt_injects_dynamic_memory():
         protocols_prompt="",
         memory_prompt="",
         dynamic_memory_provider=lambda: "--- Global Memories ---\nremember this",
-        is_subagent_mode=False,
     )
 
     prompt = build_system_prompt_for_node_context(ctx)
@@ -433,6 +432,7 @@ def test_build_system_prompt_injects_dynamic_memory():
 
 def test_queen_phase_state_appends_global_memory_block():
     phase = QueenPhaseState(
+        phase="building",
         prompt_building="base prompt",
         _cached_global_recall_block="--- Global Memories ---\nglobal stuff",
     )
@@ -444,7 +444,7 @@ def test_queen_phase_state_appends_global_memory_block():
 
 
 def test_queen_phase_state_prompt_without_memory():
-    phase = QueenPhaseState(prompt_building="base prompt")
+    phase = QueenPhaseState(phase="building", prompt_building="base prompt")
 
     prompt = phase.get_current_prompt()
     assert "base prompt" in prompt
diff --git a/core/tests/test_subagent.py b/core/tests/test_subagent.py
index 85d3c57c..13889f34 100644
--- a/core/tests/test_subagent.py
+++ b/core/tests/test_subagent.py
@@ -1,889 +1,30 @@
-"""Tests for subagent capability in EventLoopNode.
+"""Tests for SubagentJudge — the only alive piece of the legacy subagent surface.
 
-Tests the delegate_to_sub_agent tool, subagent execution with read-only data buffer,
-prevention of nested subagent delegation, and report_to_parent one-way channel.
+The old EventLoopNode.delegate_to_sub_agent / report_to_parent / mark_complete
+mechanism is gone. Subagent execution as a per-context concept no longer
+exists in the new architecture; what survives is :class:`SubagentJudge`,
+a JudgeProtocol implementation that terminates a bounded loop when its
+output keys are filled.
+
+The judge is consumed by injecting it into ``AgentLoop(judge=...)`` —
+test_event_loop_node.py exercises the integration. This file unit-tests
+the judge in isolation.
 """
 
 from __future__ import annotations
 
-import asyncio
-import json
-from collections.abc import AsyncIterator
-from typing import Any
-from unittest.mock import MagicMock
-
 import pytest
 
-from framework.agent_loop.agent_loop import AgentLoop as EventLoopNode
 from framework.agent_loop.agent_loop import SubagentJudge
-from framework.agent_loop.internals.types import LoopConfig
-from framework.host.event_bus import EventBus, EventType
-from framework.llm.provider import LLMProvider, LLMResponse, Tool, ToolResult, ToolUse
-from framework.llm.stream_events import (
-    FinishEvent,
-    TextDeltaEvent,
-    ToolCallEvent,
-)
-from framework.orchestrator.node import DataBuffer, NodeContext, NodeSpec
-from framework.tracker.decision_tracker import DecisionTracker as Runtime
-
-# ---------------------------------------------------------------------------
-# Mock LLM for controlled testing
-# ---------------------------------------------------------------------------
-
-
-class MockStreamingLLM(LLMProvider):
-    """Mock LLM that yields pre-programmed StreamEvent sequences."""
-
-    def __init__(self, scenarios: list[list] | None = None):
-        self.scenarios = scenarios or []
-        self._call_index = 0
-        self.stream_calls: list[dict] = []
-
-    async def stream(
-        self,
-        messages: list[dict[str, Any]],
-        system: str = "",
-        tools: list[Tool] | None = None,
-        max_tokens: int = 4096,
-    ) -> AsyncIterator:
-        self.stream_calls.append({"messages": messages, "system": system, "tools": tools})
-        if not self.scenarios:
-            return
-        events = self.scenarios[self._call_index % len(self.scenarios)]
-        self._call_index += 1
-        for event in events:
-            yield event
-
-    def complete(self, messages, system="", **kwargs) -> LLMResponse:
-        return LLMResponse(content="Summary.", model="mock", stop_reason="stop")
-
-    def complete_with_tools(self, messages, system, tools, tool_executor, **kwargs) -> LLMResponse:
-        return LLMResponse(content="", model="mock", stop_reason="stop")
-
-
-# ---------------------------------------------------------------------------
-# Scenario builders
-# ---------------------------------------------------------------------------
-
-
-def set_output_scenario(key: str, value: str) -> list:
-    """Build scenario where LLM calls set_output."""
-    return [
-        ToolCallEvent(
-            tool_name="set_output",
-            tool_input={"key": key, "value": value},
-            tool_use_id="set_1",
-        ),
-        FinishEvent(stop_reason="tool_use", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-def delegate_scenario(agent_id: str, task: str) -> list:
-    """Build scenario where LLM delegates to a subagent."""
-    return [
-        ToolCallEvent(
-            tool_name="delegate_to_sub_agent",
-            tool_input={"agent_id": agent_id, "task": task},
-            tool_use_id="delegate_1",
-        ),
-        FinishEvent(stop_reason="tool_use", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-def text_finish_scenario(text: str = "Done") -> list:
-    """Build scenario where LLM produces text and finishes."""
-    return [
-        TextDeltaEvent(content=text, snapshot=text),
-        FinishEvent(stop_reason="stop", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-# ---------------------------------------------------------------------------
-# Fixtures
-# ---------------------------------------------------------------------------
-
-
-@pytest.fixture
-def runtime() -> MagicMock:
-    """Create a mock runtime for testing."""
-    rt = MagicMock(spec=Runtime)
-    rt.start_run = MagicMock(return_value="run_1")
-    rt.decide = MagicMock(return_value="dec_1")
-    rt.record_outcome = MagicMock()
-    rt.end_run = MagicMock()
-    return rt
-
-
-@pytest.fixture
-def parent_node_spec() -> NodeSpec:
-    """Parent node that can delegate to subagents."""
-    return NodeSpec(
-        id="parent",
-        name="Parent Node",
-        description="A parent node that delegates tasks",
-        node_type="event_loop",
-        input_keys=["query"],
-        output_keys=["result"],
-        tools=[],
-        sub_agents=["researcher"],  # Can delegate to researcher
-    )
-
-
-@pytest.fixture
-def subagent_node_spec() -> NodeSpec:
-    """Subagent node spec for the researcher."""
-    return NodeSpec(
-        id="researcher",
-        name="Researcher",
-        description="Researches topics and returns findings",
-        node_type="event_loop",
-        input_keys=["task"],
-        output_keys=["findings"],
-        tools=[],
-    )
-
-
-# ---------------------------------------------------------------------------
-# Tests for _build_delegate_tool
-# ---------------------------------------------------------------------------
-
-
-class TestBuildDelegateTool:
-    """Tests for the _build_delegate_tool method."""
-
-    def test_returns_none_when_no_subagents(self):
-        """Should return None when sub_agents list is empty."""
-        node = EventLoopNode()
-        tool = node._build_delegate_tool([], {})
-        assert tool is None
-
-    def test_creates_tool_with_enum_of_agent_ids(self, subagent_node_spec):
-        """Should create tool with agent_id enum from sub_agents list."""
-        node = EventLoopNode()
-        node_registry = {"researcher": subagent_node_spec}
-        tool = node._build_delegate_tool(["researcher"], node_registry)
-
-        assert tool is not None
-        assert tool.name == "delegate_to_sub_agent"
-        assert tool.parameters["properties"]["agent_id"]["enum"] == ["researcher"]
-        assert "researcher: Researches topics" in tool.description
-
-    def test_handles_missing_node_in_registry(self):
-        """Should handle subagent ID not found in registry."""
-        node = EventLoopNode()
-        tool = node._build_delegate_tool(["unknown_agent"], {})
-
-        assert tool is not None
-        assert "unknown_agent: (not found in registry)" in tool.description
-
-
-# ---------------------------------------------------------------------------
-# Tests for subagent execution
-# ---------------------------------------------------------------------------
-
-
-class TestSubagentExecution:
-    """Tests for _execute_subagent method."""
-
-    @pytest.mark.asyncio
-    async def test_subagent_not_found_returns_error(self, runtime, parent_node_spec):
-        """Should return error when subagent ID is not in registry."""
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-
-        buffer = DataBuffer()
-        buffer.write("query", "test query")
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=buffer,
-            input_data={},
-            llm=MockStreamingLLM([]),
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={},  # Empty registry
-        )
-
-        result = await node._execute_subagent(ctx, "nonexistent", "do something")
-
-        assert result.is_error is True
-        result_data = json.loads(result.content)
-        assert "not found" in result_data["message"]
-
-    @pytest.mark.asyncio
-    async def test_subagent_receives_readonly_memory(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Subagent should have read-only access to data buffer."""
-        # Create LLM that will set output for the subagent
-        subagent_llm = MockStreamingLLM(
-            [
-                set_output_scenario("findings", "Found important data"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(
-            config=LoopConfig(max_iterations=5),
-        )
-
-        # Parent data buffer with some data
-        buffer = DataBuffer()
-        buffer.write("query", "research AI")
-        scoped_buffer = buffer.with_permissions(
-            read_keys=["query"],
-            write_keys=["result"],
-        )
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped_buffer,
-            input_data={"query": "research AI"},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Find info about AI")
-
-        # Should succeed
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-        assert result_data["metadata"]["success"] is True
-        assert "findings" in result_data["data"]
-
-    @pytest.mark.asyncio
-    async def test_subagent_returns_structured_output(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Subagent should return structured JSON output."""
-        subagent_llm = MockStreamingLLM(
-            [
-                set_output_scenario("findings", "AI research results"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Research task")
-
-        result_data = json.loads(result.content)
-        assert "message" in result_data
-        assert "data" in result_data
-        assert "metadata" in result_data
-        assert result_data["metadata"]["agent_id"] == "researcher"
-
-    @pytest.mark.asyncio
-    async def test_gcu_subagent_auto_populates_tools_from_catalog(self, runtime):
-        """GCU subagent with tools=[] should receive all catalog tools (auto-populate).
-
-        GCU nodes declare tools=[] because the runner expands them at setup time.
-        But _execute_subagent filters by subagent_spec.tools, which is still empty.
-        The fix: when subagent is GCU with no declared tools, include all catalog tools.
-        """
-        gcu_spec = NodeSpec(
-            id="browser_worker",
-            name="Browser Worker",
-            description="GCU browser subagent",
-            node_type="gcu",
-            output_keys=["result"],
-            tools=[],  # Empty — expects auto-population
-        )
-
-        parent_spec = NodeSpec(
-            id="parent",
-            name="Parent",
-            description="Orchestrator",
-            node_type="event_loop",
-            output_keys=["result"],
-            sub_agents=["browser_worker"],
-        )
-
-        spy_llm = MockStreamingLLM(
-            [set_output_scenario("result", "scraped"), text_finish_scenario()]
-        )
-
-        browser_tool = Tool(name="browser_snapshot", description="Snapshot")
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=5))
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_spec,
-            buffer=scoped,
-            input_data={},
-            llm=spy_llm,
-            available_tools=[],
-            all_tools=[browser_tool],
-            goal_context="",
-            goal=None,
-            node_registry={"browser_worker": gcu_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "browser_worker", "Scrape example.com")
-        assert result.is_error is False
-
-        # Verify subagent LLM received browser tools from catalog
-        assert spy_llm.stream_calls, "LLM should have been called"
-        first_call_tools = spy_llm.stream_calls[0]["tools"]
-        tool_names = {t.name for t in first_call_tools} if first_call_tools else set()
-        assert "browser_snapshot" in tool_names
-        assert "delegate_to_sub_agent" not in tool_names
-
-
-# ---------------------------------------------------------------------------
-# Tests for nested subagent prevention
-# ---------------------------------------------------------------------------
-
-
-class TestNestedSubagentPrevention:
-    """Tests that subagents cannot spawn their own subagents."""
-
-    def test_delegate_tool_not_added_in_subagent_mode(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """delegate_to_sub_agent should not be available when is_subagent_mode=True."""
-        # Create a subagent spec that declares sub_agents (should be ignored)
-        subagent_with_subagents = NodeSpec(
-            id="nested",
-            name="Nested",
-            description="A node that tries to have subagents",
-            node_type="event_loop",
-            input_keys=[],
-            output_keys=["out"],
-            sub_agents=["another"],  # This should be ignored in subagent mode
-        )
-
-        buffer = DataBuffer()
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="nested",
-            node_spec=subagent_with_subagents,
-            buffer=buffer,
-            input_data={},
-            llm=MockStreamingLLM([]),
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            is_subagent_mode=True,  # Running as a subagent
-            node_registry={"another": subagent_node_spec},
-        )
-
-        # Build tools like execute() would
-        node = EventLoopNode()
-        tools = []
-        if not ctx.is_subagent_mode:
-            sub_agents = getattr(ctx.node_spec, "sub_agents", [])
-            delegate_tool = node._build_delegate_tool(sub_agents, ctx.node_registry)
-            if delegate_tool:
-                tools.append(delegate_tool)
-
-        # delegate_to_sub_agent should NOT be in tools
-        assert not any(t.name == "delegate_to_sub_agent" for t in tools)
-
-
-# ---------------------------------------------------------------------------
-# Integration test: full delegation flow
-# ---------------------------------------------------------------------------
-
-
-class TestDelegationIntegration:
-    """Integration tests for the complete delegation flow."""
-
-    @pytest.mark.asyncio
-    async def test_parent_delegates_and_uses_result(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Parent should delegate, receive result, and use it."""
-        # Parent LLM: delegates, then uses result to set output
-        parent_scenarios = [
-            # Turn 1: Delegate to researcher
-            delegate_scenario("researcher", "Find AI trends"),
-            # Turn 2: Use result to set output
-            set_output_scenario("result", "Summary: AI is trending"),
-            # Turn 3: Done
-            text_finish_scenario("Task complete"),
-        ]
-
-        # Subagent LLM: sets findings output (unused; scenarios defined inline)
-        _ = [
-            set_output_scenario("findings", "AI trends 2024: LLMs, agents"),
-            text_finish_scenario(),
-        ]
-
-        # We need a mock tool executor that does nothing for real tools
-        async def mock_tool_executor(tool_use: ToolUse) -> ToolResult:
-            return ToolResult(
-                tool_use_id=tool_use.tool_use_id,
-                content="Tool executed",
-                is_error=False,
-            )
-
-        # Create the parent's LLM
-        parent_llm = MockStreamingLLM(parent_scenarios)
-
-        # For subagent, we need a way to provide its LLM
-        # Since _execute_subagent creates its own EventLoopNode and uses ctx.llm,
-        # we need ctx.llm to serve both parent and subagent scenarios
-        # This is tricky - in practice, the subagent gets ctx.llm which is the parent's LLM
-
-        # For this test, let's just verify the parent can call delegate_to_sub_agent
-        # and the tool handling correctly queues and executes it
-
-        buffer = DataBuffer()
-        buffer.write("query", "What are AI trends?")
-        scoped = buffer.with_permissions(
-            read_keys=["query"],
-            write_keys=["result"],
-        )
-
-        node = EventLoopNode(
-            config=LoopConfig(max_iterations=10),
-            tool_executor=mock_tool_executor,
-        )
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={"query": "What are AI trends?"},
-            llm=parent_llm,
-            available_tools=[],
-            goal_context="Research AI trends",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        # Execute the parent node
-        result = await node.execute(ctx)
-
-        # The parent should have executed and called the delegate tool
-        # Due to the mock setup, it may not fully succeed end-to-end,
-        # but we can verify the structure works
-        assert result is not None
-
-
-# ---------------------------------------------------------------------------
-# Scenario builders for report_to_parent
-# ---------------------------------------------------------------------------
-
-
-def report_scenario(message: str, data: dict | None = None) -> list:
-    """Build scenario where LLM calls report_to_parent."""
-    tool_input = {"message": message}
-    if data is not None:
-        tool_input["data"] = data
-    return [
-        ToolCallEvent(
-            tool_name="report_to_parent",
-            tool_input=tool_input,
-            tool_use_id="report_1",
-        ),
-        FinishEvent(stop_reason="tool_use", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-# ---------------------------------------------------------------------------
-# Tests for report_to_parent tool
-# ---------------------------------------------------------------------------
-
-
-class TestBuildReportToParentTool:
-    """Tests for the _build_report_to_parent_tool method."""
-
-    def test_creates_tool_with_correct_schema(self):
-        """Should create a tool with message (required) and data (optional) params."""
-        node = EventLoopNode()
-        tool = node._build_report_to_parent_tool()
-
-        assert tool.name == "report_to_parent"
-        assert "message" in tool.parameters["properties"]
-        assert "data" in tool.parameters["properties"]
-        assert tool.parameters["required"] == ["message"]
-
-    def test_tool_only_visible_in_subagent_mode(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """report_to_parent should only appear when is_subagent_mode=True and callback set."""
-        node = EventLoopNode()
-
-        # Parent mode: no report_to_parent
-        buffer = DataBuffer()
-        parent_ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=buffer,
-            input_data={},
-            llm=MockStreamingLLM([]),
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            is_subagent_mode=False,
-            node_registry={},
-        )
-
-        tools = list(parent_ctx.available_tools)
-        if parent_ctx.is_subagent_mode and parent_ctx.report_callback is not None:
-            tools.append(node._build_report_to_parent_tool())
-
-        assert not any(t.name == "report_to_parent" for t in tools)
-
-        # Subagent mode WITH callback: report_to_parent present
-        async def noop_callback(msg, data=None):
-            pass
-
-        subagent_ctx = NodeContext(
-            runtime=runtime,
-            node_id="sub",
-            node_spec=subagent_node_spec,
-            buffer=buffer,
-            input_data={},
-            llm=MockStreamingLLM([]),
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            is_subagent_mode=True,
-            report_callback=noop_callback,
-            node_registry={},
-        )
-
-        tools2 = list(subagent_ctx.available_tools)
-        if subagent_ctx.is_subagent_mode and subagent_ctx.report_callback is not None:
-            tools2.append(node._build_report_to_parent_tool())
-
-        assert any(t.name == "report_to_parent" for t in tools2)
-
-    def test_tool_not_visible_without_callback(self, runtime, subagent_node_spec):
-        """report_to_parent should NOT appear when callback is None even in subagent mode."""
-        node = EventLoopNode()
-        buffer = DataBuffer()
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="sub",
-            node_spec=subagent_node_spec,
-            buffer=buffer,
-            input_data={},
-            llm=MockStreamingLLM([]),
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            is_subagent_mode=True,
-            report_callback=None,
-            node_registry={},
-        )
-
-        tools = list(ctx.available_tools)
-        if ctx.is_subagent_mode and ctx.report_callback is not None:
-            tools.append(node._build_report_to_parent_tool())
-
-        assert not any(t.name == "report_to_parent" for t in tools)
-
-
-class TestReportToParentExecution:
-    """Tests for report_to_parent callback execution and result assembly."""
-
-    @pytest.mark.asyncio
-    async def test_reports_appear_in_result_json(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Reports from report_to_parent should appear in the final ToolResult JSON."""
-        # Subagent LLM: report, then set output
-        subagent_llm = MockStreamingLLM(
-            [
-                report_scenario("50% done", {"progress": 0.5}),
-                set_output_scenario("findings", "All done"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Do research")
-
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-
-        # Reports should be in the result
-        assert result_data["reports"] is not None
-        assert len(result_data["reports"]) == 1
-        assert result_data["reports"][0]["message"] == "50% done"
-        assert result_data["reports"][0]["data"] == {"progress": 0.5}
-        assert "timestamp" in result_data["reports"][0]
-
-        # Metadata should include report_count
-        assert result_data["metadata"]["report_count"] == 1
-
-    @pytest.mark.asyncio
-    async def test_subagent_tool_events_visible_on_shared_bus(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Subagent internal tool calls should emit TOOL_CALL events on the shared bus."""
-        bus = EventBus()
-        tool_events = []
-
-        async def handler(event):
-            tool_events.append(event)
-
-        bus.subscribe(
-            event_types=[EventType.TOOL_CALL_STARTED, EventType.TOOL_CALL_COMPLETED],
-            handler=handler,
-        )
-
-        subagent_llm = MockStreamingLLM(
-            [
-                set_output_scenario("findings", "Results"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(
-            event_bus=bus,
-            config=LoopConfig(max_iterations=10),
-        )
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Do research")
-        assert result.is_error is False
-
-        # Subagent tool calls should appear on the shared bus
-        started = [e for e in tool_events if e.type == EventType.TOOL_CALL_STARTED]
-        completed = [e for e in tool_events if e.type == EventType.TOOL_CALL_COMPLETED]
-        assert len(started) >= 1, "Expected at least one TOOL_CALL_STARTED from subagent"
-        assert len(completed) >= 1, "Expected at least one TOOL_CALL_COMPLETED from subagent"
-
-        # Events should have the namespaced subagent node_id
-        for evt in started + completed:
-            assert "subagent" in evt.node_id, f"Expected namespaced node_id, got: {evt.node_id}"
-
-    @pytest.mark.asyncio
-    async def test_event_bus_receives_subagent_report(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """EventBus should receive SUBAGENT_REPORT events when parent has a bus."""
-        bus = EventBus()
-        bus_events = []
-
-        async def handler(event):
-            bus_events.append(event)
-
-        bus.subscribe(event_types=[EventType.SUBAGENT_REPORT], handler=handler)
-
-        subagent_llm = MockStreamingLLM(
-            [
-                report_scenario("Progress update", {"step": 1}),
-                set_output_scenario("findings", "Results"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(
-            event_bus=bus,
-            config=LoopConfig(max_iterations=10),
-        )
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Do research")
-
-        assert result.is_error is False
-
-        # EventBus should have received the report
-        assert len(bus_events) == 1
-        assert bus_events[0].type == EventType.SUBAGENT_REPORT
-        assert bus_events[0].data["subagent_id"] == "researcher"
-        assert bus_events[0].data["message"] == "Progress update"
-        assert bus_events[0].data["data"] == {"step": 1}
-
-    @pytest.mark.asyncio
-    async def test_callback_failure_does_not_block_subagent(
-        self, runtime, parent_node_spec, subagent_node_spec
-    ):
-        """Subagent should complete even if the report callback raises."""
-
-        async def failing_callback(message: str, data: dict | None = None) -> None:
-            raise RuntimeError("Callback exploded")
-
-        subagent_llm = MockStreamingLLM(
-            [
-                report_scenario("This will fail callback"),
-                set_output_scenario("findings", "Still finished"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        # The _execute_subagent creates its own callback that wraps the event bus.
-        # To test callback failure resilience at the triage level, we need to
-        # directly test via a subagent context with a failing callback.
-        # Let's instead verify the _execute_subagent wired callback is resilient.
-        result = await node._execute_subagent(ctx, "researcher", "Do research")
-
-        # Should succeed despite the internal callback (event_bus=None here, so
-        # the wired callback won't fail). The report should still be recorded.
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-        assert result_data["reports"] is not None
-        assert result_data["metadata"]["report_count"] == 1
-
-    @pytest.mark.asyncio
-    async def test_no_reports_gives_null(self, runtime, parent_node_spec, subagent_node_spec):
-        """When no reports are sent, reports field should be null."""
-        subagent_llm = MockStreamingLLM(
-            [
-                set_output_scenario("findings", "Done without reporting"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Simple task")
-
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-        assert result_data["reports"] is None
-        assert result_data["metadata"]["report_count"] == 0
-
-
-# ---------------------------------------------------------------------------
-# Scenario builder for report_to_parent with wait_for_response
-# ---------------------------------------------------------------------------
-
-
-def report_wait_scenario(message: str, data: dict | None = None) -> list:
-    """Build scenario where LLM calls report_to_parent with wait_for_response=True."""
-    tool_input: dict[str, Any] = {"message": message, "wait_for_response": True}
-    if data is not None:
-        tool_input["data"] = data
-    return [
-        ToolCallEvent(
-            tool_name="report_to_parent",
-            tool_input=tool_input,
-            tool_use_id="report_wait_1",
-        ),
-        FinishEvent(stop_reason="tool_use", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-# ---------------------------------------------------------------------------
-# Tests for SubagentJudge
-# ---------------------------------------------------------------------------
+from framework.agent_loop.internals.types import JudgeVerdict
 
 
 class TestSubagentJudge:
-    """Tests for the SubagentJudge class."""
+    """Unit tests for the SubagentJudge class."""
 
     @pytest.mark.asyncio
-    async def test_subagent_judge_accepts_when_output_keys_filled(self):
-        """SubagentJudge should ACCEPT when missing_keys is empty, even with tool_calls present."""
+    async def test_accepts_when_output_keys_filled(self):
+        """ACCEPT when missing_keys is empty, even if a tool just ran."""
         judge = SubagentJudge(task="Check profile at https://example.com/user123")
 
         verdict = await judge.evaluate(
@@ -898,8 +39,8 @@ class TestSubagentJudge:
         assert verdict.feedback == ""
 
     @pytest.mark.asyncio
-    async def test_subagent_judge_retries_with_task_in_feedback(self):
-        """SubagentJudge should RETRY with task and missing keys in feedback."""
+    async def test_retries_with_task_and_missing_keys_in_feedback(self):
+        """RETRY when output keys are missing, with task + keys + nudge in feedback."""
         task = "Scrape profile at https://example.com/user456"
         judge = SubagentJudge(task=task)
 
@@ -918,294 +59,25 @@ class TestSubagentJudge:
         assert "set_output" in verdict.feedback
 
     @pytest.mark.asyncio
-    async def test_subagent_terminates_immediately_with_judge(
-        self,
-        runtime,
-        parent_node_spec,
-        subagent_node_spec,
-    ):
-        """Subagent should accept on the first outer iteration after browser + set_output.
+    async def test_returns_judge_verdict_instance(self):
+        """The judge returns a JudgeVerdict, not a plain dict."""
+        judge = SubagentJudge(task="task")
 
-        The inner tool loop in _run_single_turn needs a text-only LLM response
-        to exit (it loops while the LLM keeps producing tool calls).  With the
-        SubagentJudge, the outer loop should accept on iteration 0 because all
-        output keys are filled — no second outer iteration needed.
-
-        Also verifies that the subagent's system prompt contains the specific
-        task (via goal_context injection).
-        """
-        # Inner iter 1: browser_navigate + set_output("findings", ...)
-        # Inner iter 2: text-only finish → inner loop exits
-        subagent_llm = MockStreamingLLM(
-            [
-                browser_and_set_output_scenario("findings", "Profile data extracted"),
-                text_finish_scenario("Task complete"),
-            ]
+        accept = await judge.evaluate(
+            {"missing_keys": [], "tool_results": [], "iteration": 0}
+        )
+        retry = await judge.evaluate(
+            {"missing_keys": ["x"], "tool_results": [], "iteration": 0}
         )
 
-        # Mock tool executor so browser_navigate succeeds
-        async def mock_tool_executor(tool_use: ToolUse) -> ToolResult:
-            return ToolResult(
-                tool_use_id=tool_use.tool_use_id,
-                content="Tool executed",
-                is_error=False,
-            )
-
-        node = EventLoopNode(
-            config=LoopConfig(max_iterations=5),
-            tool_executor=mock_tool_executor,
-        )
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        task_text = "Check the profile at https://example.com/user789"
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", task_text)
-
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-        assert result_data["metadata"]["success"] is True
-        assert "findings" in result_data["data"]
-
-        # 2 inner LLM calls (tool turn + text finish), 1 outer iteration.
-        # With the implicit judge (judge=None), a turn with real_tool_results
-        # would RETRY even if keys are filled; SubagentJudge accepts immediately.
-        assert subagent_llm._call_index == 2, (
-            f"Expected 2 LLM calls (tool turn + text finish) but got {subagent_llm._call_index}."
-        )
-
-        # Verify the subagent's initial message references the specific task
-        # (goal_context is injected into the user message via _build_initial_message)
-        first_call = subagent_llm.stream_calls[0]
-        first_user_msg = first_call["messages"][0]["content"]
-        assert task_text in first_user_msg, (
-            "Subagent initial message should contain the specific task via goal_context"
-        )
-
-
-# ---------------------------------------------------------------------------
-# Scenario builder for report_to_parent with mark_complete
-# ---------------------------------------------------------------------------
-
-
-def report_mark_complete_scenario(
-    message: str,
-    data: dict | None = None,
-    mark_complete: bool = True,
-) -> list:
-    """Build scenario where LLM calls report_to_parent with mark_complete."""
-    tool_input: dict[str, Any] = {"message": message, "mark_complete": mark_complete}
-    if data is not None:
-        tool_input["data"] = data
-    return [
-        ToolCallEvent(
-            tool_name="report_to_parent",
-            tool_input=tool_input,
-            tool_use_id="report_mc_1",
-        ),
-        FinishEvent(stop_reason="tool_use", input_tokens=10, output_tokens=5, model="mock"),
-    ]
-
-
-# ---------------------------------------------------------------------------
-# Tests for mark_complete via report_to_parent
-# ---------------------------------------------------------------------------
-
-
-class TestMarkCompleteViaReport:
-    """Tests for report_to_parent(mark_complete=True) termination."""
+        assert isinstance(accept, JudgeVerdict)
+        assert isinstance(retry, JudgeVerdict)
 
     @pytest.mark.asyncio
-    async def test_mark_complete_terminates_without_output_keys(
-        self,
-        runtime,
-        parent_node_spec,
-        subagent_node_spec,
-    ):
-        """Subagent should terminate immediately when mark_complete=True,
-        even without filling output keys via set_output."""
-        subagent_llm = MockStreamingLLM(
-            [
-                report_mark_complete_scenario(
-                    "Found 3 profiles",
-                    data={"profiles": ["a", "b", "c"]},
-                    mark_complete=True,
-                ),
-                # This should NOT be reached — subagent exits on the same iteration
-                text_finish_scenario("Should not get here"),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Find profiles")
-
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-
-        # Reports should be present with the final message
-        assert result_data["reports"] is not None
-        assert len(result_data["reports"]) == 1
-        assert result_data["reports"][0]["message"] == "Found 3 profiles"
-        assert result_data["reports"][0]["data"] == {"profiles": ["a", "b", "c"]}
-
-        # Subagent should have completed (mark_complete bypasses output key check)
-        assert result_data["metadata"]["success"] is True
-
-        # Only 2 LLM calls: the report_to_parent turn + text finish for inner loop exit.
-        # The outer loop should NOT iterate again because _evaluate returns ACCEPT.
-        assert subagent_llm._call_index == 2, (
-            f"Expected 2 LLM calls but got {subagent_llm._call_index}. "
-            "mark_complete should accept on the same outer iteration."
-        )
-
-    @pytest.mark.asyncio
-    async def test_mark_complete_false_preserves_existing_behavior(
-        self,
-        runtime,
-        parent_node_spec,
-        subagent_node_spec,
-    ):
-        """mark_complete=False (default) should NOT change existing behavior —
-        the subagent still needs to fill output keys."""
-        subagent_llm = MockStreamingLLM(
-            [
-                # Report without mark_complete — should not terminate
-                report_mark_complete_scenario(
-                    "Progress update",
-                    mark_complete=False,
-                ),
-                # Then fill output via set_output
-                set_output_scenario("findings", "Results here"),
-                text_finish_scenario(),
-            ]
-        )
-
-        node = EventLoopNode(config=LoopConfig(max_iterations=10))
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=["result"])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="parent",
-            node_spec=parent_node_spec,
-            buffer=scoped,
-            input_data={},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="",
-            goal=None,
-            node_registry={"researcher": subagent_node_spec},
-        )
-
-        result = await node._execute_subagent(ctx, "researcher", "Do research")
-
-        assert result.is_error is False
-        result_data = json.loads(result.content)
-        assert result_data["metadata"]["success"] is True
-        assert "findings" in result_data["data"]
-        assert result_data["data"]["findings"] == "Results here"
-
-        # Should have needed more LLM calls than just the report turn
-        assert subagent_llm._call_index >= 3, (
-            "mark_complete=False should require additional turns to fill output keys"
-        )
-
-    @pytest.mark.asyncio
-    async def test_mark_complete_tool_schema_includes_param(self):
-        """The report_to_parent tool definition should include mark_complete parameter."""
-        node = EventLoopNode()
-        tool = node._build_report_to_parent_tool()
-
-        assert "mark_complete" in tool.parameters["properties"]
-        assert tool.parameters["properties"]["mark_complete"]["type"] == "boolean"
-
-    @pytest.mark.asyncio
-    async def test_mark_complete_with_report_callback(
-        self,
-        runtime,
-        parent_node_spec,
-        subagent_node_spec,
-    ):
-        """mark_complete should still invoke the report callback before terminating."""
-        callback_calls: list[dict] = []
-
-        async def tracking_callback(
-            message: str,
-            data: dict | None = None,
-            *,
-            wait_for_response: bool = False,
-        ) -> str | None:
-            callback_calls.append({"message": message, "data": data})
-            return None
-
-        subagent_llm = MockStreamingLLM(
-            [
-                report_mark_complete_scenario("Final findings", data={"count": 5}),
-                text_finish_scenario(),
-            ]
-        )
-
-        # Create a subagent node directly to test with a custom callback
-        subagent_node = EventLoopNode(
-            judge=SubagentJudge(task="test task"),
-            config=LoopConfig(max_iterations=5),
-        )
-
-        buffer = DataBuffer()
-        scoped = buffer.with_permissions(read_keys=[], write_keys=[])
-
-        ctx = NodeContext(
-            runtime=runtime,
-            node_id="sub",
-            node_spec=subagent_node_spec,
-            buffer=scoped,
-            input_data={"task": "test task"},
-            llm=subagent_llm,
-            available_tools=[],
-            goal_context="Your specific task: test task",
-            goal=None,
-            is_subagent_mode=True,
-            report_callback=tracking_callback,
-            node_registry={},
-        )
-
-        result = await subagent_node.execute(ctx)
-
-        # Callback should have been called
-        assert len(callback_calls) == 1
-        assert callback_calls[0]["message"] == "Final findings"
-        assert callback_calls[0]["data"] == {"count": 5}
-
-        # Should have succeeded via mark_complete
-        assert result.success is True
+    async def test_constructible_with_max_iterations(self):
+        """SubagentJudge accepts an optional max_iterations parameter."""
+        judge = SubagentJudge(task="t", max_iterations=10)
+        assert judge is not None
+        # The constructor must not crash; the judge still functions normally.
+        verdict = await judge.evaluate({"missing_keys": [], "tool_results": [], "iteration": 0})
+        assert verdict.action == "ACCEPT"