377 lines
12 KiB
Python
377 lines
12 KiB
Python
"""Agent graph construction for Email Inbox Management Agent."""
|
|
|
|
from pathlib import Path
|
|
|
|
from framework.graph import EdgeCondition, EdgeSpec, Goal, SuccessCriterion, Constraint
|
|
from framework.graph.checkpoint_config import CheckpointConfig
|
|
from framework.graph.edge import GraphSpec
|
|
from framework.graph.executor import ExecutionResult, GraphExecutor
|
|
from framework.llm import LiteLLMProvider
|
|
from framework.runner.tool_registry import ToolRegistry
|
|
from framework.runtime.agent_runtime import create_agent_runtime
|
|
from framework.runtime.event_bus import EventBus
|
|
from framework.runtime.execution_stream import EntryPointSpec
|
|
|
|
from .config import default_config, metadata
|
|
from .nodes import (
|
|
intake_node,
|
|
fetch_emails_node,
|
|
classify_and_act_node,
|
|
report_node,
|
|
)
|
|
|
|
# Goal definition
|
|
goal = Goal(
|
|
id="email-inbox-management",
|
|
name="Email Inbox Management",
|
|
description=(
|
|
"Manage Gmail inbox emails autonomously using user-defined free-text rules. "
|
|
"For every five minutes, fetch inbox emails (configurable batch size, default 100), "
|
|
"apply the user's rules to each email, and execute the appropriate Gmail actions — trash, "
|
|
"mark as spam, mark important, mark read/unread, star, draft replies, "
|
|
"create/apply custom labels, and more."
|
|
),
|
|
success_criteria=[
|
|
SuccessCriterion(
|
|
id="correct-action-execution",
|
|
description=(
|
|
"Gmail actions are applied correctly to the right emails "
|
|
"based on the user's rules"
|
|
),
|
|
metric="action_correctness",
|
|
target=">=95%",
|
|
weight=0.30,
|
|
),
|
|
SuccessCriterion(
|
|
id="action-report",
|
|
description=(
|
|
"Produces a summary report showing what was done: how many emails "
|
|
"were affected by each action type, with email subjects listed"
|
|
),
|
|
metric="report_completeness",
|
|
target="100%",
|
|
weight=0.25,
|
|
),
|
|
SuccessCriterion(
|
|
id="batch-completeness",
|
|
description=(
|
|
"All fetched emails up to the configured max are processed and acted upon; "
|
|
"none are silently skipped"
|
|
),
|
|
metric="emails_processed_ratio",
|
|
target="100%",
|
|
weight=0.30,
|
|
),
|
|
SuccessCriterion(
|
|
id="label-management",
|
|
description="Custom labels are created and applied correctly when rules require them",
|
|
metric="label_coverage",
|
|
target="100%",
|
|
weight=0.15,
|
|
),
|
|
],
|
|
constraints=[
|
|
Constraint(
|
|
id="process-all-emails",
|
|
description=(
|
|
"Must loop through all inbox emails by paginating with max_emails as page size; "
|
|
"no emails should be silently skipped"
|
|
),
|
|
constraint_type="hard",
|
|
category="operational",
|
|
),
|
|
Constraint(
|
|
id="non-destructive-default",
|
|
description=(
|
|
"Archiving removes from inbox but preserves the email; only explicit "
|
|
"trash rules move emails to trash"
|
|
),
|
|
constraint_type="hard",
|
|
category="safety",
|
|
),
|
|
Constraint(
|
|
id="draft-not-send",
|
|
description="Agent creates draft replies but NEVER sends them automatically",
|
|
constraint_type="hard",
|
|
category="safety",
|
|
),
|
|
],
|
|
)
|
|
|
|
# Node list
|
|
nodes = [
|
|
intake_node,
|
|
fetch_emails_node,
|
|
classify_and_act_node,
|
|
report_node,
|
|
]
|
|
|
|
# Edge definitions
|
|
edges = [
|
|
EdgeSpec(
|
|
id="intake-to-fetch-emails",
|
|
source="intake",
|
|
target="fetch-emails",
|
|
condition=EdgeCondition.ON_SUCCESS,
|
|
priority=1,
|
|
),
|
|
EdgeSpec(
|
|
id="fetch-emails-to-classify",
|
|
source="fetch-emails",
|
|
target="classify-and-act",
|
|
condition=EdgeCondition.ON_SUCCESS,
|
|
priority=1,
|
|
),
|
|
# Pagination loop: if next_page_token is non-empty, loop back to fetch
|
|
EdgeSpec(
|
|
id="classify-to-fetch-loop",
|
|
source="classify-and-act",
|
|
target="fetch-emails",
|
|
condition=EdgeCondition.CONDITIONAL,
|
|
condition_expr="str(next_page_token).strip() not in ('', 'None', 'null')",
|
|
priority=2,
|
|
),
|
|
# Exit to report when no more pages
|
|
EdgeSpec(
|
|
id="classify-to-report",
|
|
source="classify-and-act",
|
|
target="report",
|
|
condition=EdgeCondition.CONDITIONAL,
|
|
condition_expr="str(next_page_token).strip() in ('', 'None', 'null')",
|
|
priority=1,
|
|
),
|
|
EdgeSpec(
|
|
id="report-to-intake",
|
|
source="report",
|
|
target="intake",
|
|
condition=EdgeCondition.ON_SUCCESS,
|
|
priority=1,
|
|
),
|
|
]
|
|
|
|
# Graph configuration
|
|
entry_node = "intake"
|
|
entry_points = {"start": "intake"}
|
|
pause_nodes = []
|
|
terminal_nodes = []
|
|
loop_config = {
|
|
"max_iterations": 100,
|
|
"max_tool_calls_per_turn": 30,
|
|
"max_tool_result_chars": 8000,
|
|
"max_history_tokens": 32000,
|
|
}
|
|
conversation_mode = "continuous"
|
|
identity_prompt = (
|
|
"You are an email inbox management assistant. You help users manage "
|
|
"their Gmail inbox by applying free-text rules to emails — trash, "
|
|
"mark as spam, mark important, mark read/unread, star, draft replies, "
|
|
"create/apply custom labels, and more."
|
|
)
|
|
|
|
|
|
class EmailInboxManagementAgent:
|
|
"""
|
|
Email Inbox Management Agent — continuous 4-node pipeline for email triage.
|
|
|
|
Flow: intake -> fetch-emails -> classify-and-act -> report -> intake (loop)
|
|
|
|
Uses AgentRuntime for:
|
|
- Multi-entry-point execution (primary + timer-driven)
|
|
- Session-scoped storage
|
|
- Shared state for rules persistence across entry points
|
|
- Checkpointing for resume capability
|
|
"""
|
|
|
|
def __init__(self, config=None):
|
|
self.config = config or default_config
|
|
self.goal = goal
|
|
self.nodes = nodes
|
|
self.edges = edges
|
|
self.entry_node = entry_node
|
|
self.entry_points = entry_points
|
|
self.pause_nodes = pause_nodes
|
|
self.terminal_nodes = terminal_nodes
|
|
self._executor: GraphExecutor | None = None
|
|
self._graph: GraphSpec | None = None
|
|
self._event_bus: EventBus | None = None
|
|
self._tool_registry: ToolRegistry | None = None
|
|
|
|
def _build_graph(self) -> GraphSpec:
|
|
"""Build the GraphSpec."""
|
|
return GraphSpec(
|
|
id="email-inbox-management-graph",
|
|
goal_id=self.goal.id,
|
|
version="1.0.0",
|
|
entry_node=self.entry_node,
|
|
entry_points=self.entry_points,
|
|
terminal_nodes=self.terminal_nodes,
|
|
pause_nodes=self.pause_nodes,
|
|
nodes=self.nodes,
|
|
edges=self.edges,
|
|
default_model=self.config.model,
|
|
max_tokens=self.config.max_tokens,
|
|
loop_config=loop_config,
|
|
conversation_mode=conversation_mode,
|
|
identity_prompt=identity_prompt,
|
|
)
|
|
|
|
def _setup(self, mock_mode=False) -> None:
|
|
"""Set up the agent runtime with sessions, checkpoints, and logging."""
|
|
self._storage_path = Path.home() / ".hive" / "agents" / "email_inbox_management"
|
|
self._storage_path.mkdir(parents=True, exist_ok=True)
|
|
|
|
self._event_bus = EventBus()
|
|
self._tool_registry = ToolRegistry()
|
|
|
|
mcp_config_path = Path(__file__).parent / "mcp_servers.json"
|
|
if mcp_config_path.exists():
|
|
self._tool_registry.load_mcp_config(mcp_config_path)
|
|
|
|
# Discover custom script tools (e.g. bulk_fetch_emails)
|
|
tools_path = Path(__file__).parent / "tools.py"
|
|
if tools_path.exists():
|
|
self._tool_registry.discover_from_module(tools_path)
|
|
|
|
llm = None
|
|
if not mock_mode:
|
|
llm = LiteLLMProvider(
|
|
model=self.config.model,
|
|
api_key=self.config.api_key,
|
|
api_base=self.config.api_base,
|
|
)
|
|
|
|
tool_executor = self._tool_registry.get_executor()
|
|
tools = list(self._tool_registry.get_tools().values())
|
|
|
|
self._graph = self._build_graph()
|
|
|
|
checkpoint_config = CheckpointConfig(
|
|
enabled=True,
|
|
checkpoint_on_node_start=False,
|
|
checkpoint_on_node_complete=True,
|
|
checkpoint_max_age_days=7,
|
|
async_checkpoint=True,
|
|
)
|
|
|
|
# Build entry point specs for AgentRuntime
|
|
entry_point_specs = [
|
|
# Primary entry point (user-facing)
|
|
EntryPointSpec(
|
|
id="default",
|
|
name="Default",
|
|
entry_node=self.entry_node,
|
|
trigger_type="manual",
|
|
isolation_level="shared",
|
|
),
|
|
]
|
|
|
|
self._agent_runtime = create_agent_runtime(
|
|
graph=self._graph,
|
|
goal=self.goal,
|
|
storage_path=self._storage_path,
|
|
entry_points=entry_point_specs,
|
|
llm=llm,
|
|
tools=tools,
|
|
tool_executor=tool_executor,
|
|
checkpoint_config=checkpoint_config,
|
|
)
|
|
|
|
return self._executor
|
|
|
|
async def start(self, mock_mode=False) -> None:
|
|
"""Set up the agent (initialize executor and tools)."""
|
|
if self._executor is None:
|
|
self._setup(mock_mode=mock_mode)
|
|
|
|
async def stop(self) -> None:
|
|
"""Stop and clean up the agent runtime."""
|
|
if self._agent_runtime is not None and self._agent_runtime.is_running:
|
|
await self._agent_runtime.stop()
|
|
|
|
async def trigger_and_wait(
|
|
self,
|
|
entry_point: str,
|
|
input_data: dict,
|
|
timeout: float | None = None,
|
|
session_state: dict | None = None,
|
|
) -> ExecutionResult | None:
|
|
"""Execute the graph and wait for completion."""
|
|
if self._executor is None:
|
|
raise RuntimeError("Agent not started. Call start() first.")
|
|
if self._graph is None:
|
|
raise RuntimeError("Graph not built. Call start() first.")
|
|
|
|
return await self._agent_runtime.trigger_and_wait(
|
|
entry_point_id=entry_point,
|
|
input_data=input_data,
|
|
timeout=timeout,
|
|
session_state=session_state,
|
|
)
|
|
|
|
async def run(
|
|
self, context: dict, mock_mode=False, session_state=None
|
|
) -> ExecutionResult:
|
|
"""Run the agent (convenience method for single execution)."""
|
|
await self.start(mock_mode=mock_mode)
|
|
try:
|
|
result = await self.trigger_and_wait(
|
|
"default", context, session_state=session_state
|
|
)
|
|
return result or ExecutionResult(success=False, error="Execution timeout")
|
|
finally:
|
|
await self.stop()
|
|
|
|
def info(self):
|
|
"""Get agent information."""
|
|
return {
|
|
"name": metadata.name,
|
|
"version": metadata.version,
|
|
"description": metadata.description,
|
|
"goal": {
|
|
"name": self.goal.name,
|
|
"description": self.goal.description,
|
|
},
|
|
"nodes": [n.id for n in self.nodes],
|
|
"edges": [e.id for e in self.edges],
|
|
"entry_node": self.entry_node,
|
|
"entry_points": self.entry_points,
|
|
"pause_nodes": self.pause_nodes,
|
|
"terminal_nodes": self.terminal_nodes,
|
|
"client_facing_nodes": [n.id for n in self.nodes if n.client_facing],
|
|
}
|
|
|
|
def validate(self):
|
|
"""Validate agent structure."""
|
|
errors = []
|
|
warnings = []
|
|
|
|
node_ids = {node.id for node in self.nodes}
|
|
for edge in self.edges:
|
|
if edge.source not in node_ids:
|
|
errors.append(f"Edge {edge.id}: source '{edge.source}' not found")
|
|
if edge.target not in node_ids:
|
|
errors.append(f"Edge {edge.id}: target '{edge.target}' not found")
|
|
|
|
if self.entry_node not in node_ids:
|
|
errors.append(f"Entry node '{self.entry_node}' not found")
|
|
|
|
for terminal in self.terminal_nodes:
|
|
if terminal not in node_ids:
|
|
errors.append(f"Terminal node '{terminal}' not found")
|
|
|
|
for ep_id, node_id in self.entry_points.items():
|
|
if node_id not in node_ids:
|
|
errors.append(
|
|
f"Entry point '{ep_id}' references unknown node '{node_id}'"
|
|
)
|
|
|
|
return {
|
|
"valid": len(errors) == 0,
|
|
"errors": errors,
|
|
"warnings": warnings,
|
|
}
|
|
|
|
|
|
# Create default instance
|
|
default_agent = EmailInboxManagementAgent()
|