From 7ad521efebc3fb183e310ff67fb7d1ddc1920893 Mon Sep 17 00:00:00 2001
From: Timothy <timothy@adenhq.com>
Date: Mon, 19 Jan 2026 20:06:51 -0800
Subject: [PATCH] chore: update core framework readme

---
 core/README.md | 181 +++++++++++++++++++++++++++++++++++++++----------
 1 file changed, 146 insertions(+), 35 deletions(-)

diff --git a/core/README.md b/core/README.md
index c4b6e986..958fb802 100644
--- a/core/README.md
+++ b/core/README.md
@@ -64,7 +64,7 @@ To use the agent builder with Claude Desktop or other MCP clients, add this to y
     "agent-builder": {
       "command": "python",
       "args": ["-m", "framework.mcp.agent_builder_server"],
-      "cwd": "/path/to/goal-agent"
+      "cwd": "/path/to/hive/core"
     }
   }
 }
@@ -78,45 +78,81 @@ The MCP server provides tools for:
 - Validating and exporting agent graphs
 - Testing nodes and full agent graphs
 
+See [MCP_SERVER_GUIDE.md](MCP_SERVER_GUIDE.md) for detailed instructions.
+
 ## Quick Start
 
-### Calculator Agent
+### Running Agents
 
-Run an LLM-powered calculator:
+The framework comes with pre-built example agents in the `exports/` directory:
 
 ```bash
-# Single calculation
-python -m framework calculate "2 + 3 * 4"
+# List available agents
+python -m framework list exports/
 
-# Interactive mode
-python -m framework interactive
+# Show agent information
+python -m framework info exports/task-planner
 
-# Analyze runs with Builder
-python -m framework analyze calculator
+# Run an agent
+python -m framework run exports/task-planner --input '{"objective": "Build a web scraper"}'
+
+# Interactive shell mode (with human-in-the-loop approval)
+python -m framework shell exports/task-planner
 ```
 
-### Using the Runtime
+### Available Commands
+
+- `run` - Execute an exported agent with given input
+- `info` - Display agent details (goal, nodes, edges, success criteria)
+- `validate` - Check that an agent is valid and runnable
+- `list` - List all exported agents in a directory
+- `dispatch` - Route requests to multiple agents using the orchestrator
+- `shell` - Start an interactive session with an agent
+
+### Building Agents Programmatically
+
+You can build agents using the MCP server (recommended) or programmatically:
 
 ```python
 from framework import Runtime
 
-runtime = Runtime("/path/to/storage")
+# Initialize runtime with storage path
+runtime = Runtime("./storage")
 
-# Start a run
-run_id = runtime.start_run("my_goal", "Description of what we're doing")
+# Start a run for a goal
+run_id = runtime.start_run(
+    goal_id="data-processor",
+    goal_description="Process data with quality checks",
+    input_data={"dataset": "customers.csv"}
+)
+
+# Set the current node context
+runtime.set_node("processor-node")
 
 # Record a decision
 decision_id = runtime.decide(
     intent="Choose how to process the data",
     options=[
-        {"id": "fast", "description": "Quick processing", "pros": ["Fast"], "cons": ["Less accurate"]},
-        {"id": "thorough", "description": "Detailed processing", "pros": ["Accurate"], "cons": ["Slower"]},
+        {
+            "id": "fast",
+            "description": "Quick processing",
+            "action_type": "tool_call",
+            "pros": ["Fast"],
+            "cons": ["Less accurate"]
+        },
+        {
+            "id": "thorough",
+            "description": "Detailed processing",
+            "action_type": "tool_call",
+            "pros": ["Accurate"],
+            "cons": ["Slower"]
+        },
     ],
     chosen="thorough",
     reasoning="Accuracy is more important for this task"
 )
 
-# Record the outcome
+# Record the outcome of the decision
 runtime.record_outcome(
     decision_id=decision_id,
     success=True,
@@ -125,58 +161,133 @@ runtime.record_outcome(
 )
 
 # End the run
-runtime.end_run(success=True, narrative="Successfully processed all data")
+runtime.end_run(
+    success=True,
+    narrative="Successfully processed all data",
+    output_data={"total_processed": 100}
+)
 ```
 
-### Analyzing with Builder
+### Analyzing Agent Behavior with Builder
+
+The BuilderQuery interface allows you to analyze agent runs and identify improvements:
 
 ```python
 from framework import BuilderQuery
 
-query = BuilderQuery("/path/to/storage")
+# Initialize Builder query interface
+query = BuilderQuery("./storage")
 
-# Find patterns across runs
-patterns = query.find_patterns("my_goal")
-print(f"Success rate: {patterns.success_rate:.1%}")
+# Find patterns across runs for a goal
+patterns = query.find_patterns("data-processor")
+if patterns:
+    print(f"Success rate: {patterns.success_rate:.1%}")
+    print(f"Runs analyzed: {patterns.run_count}")
 
-# Analyze a failure
-analysis = query.analyze_failure("run_123")
-print(f"Root cause: {analysis.root_cause}")
-print(f"Suggestions: {analysis.suggestions}")
+    # Show problematic nodes
+    for node_id, failure_rate in patterns.problematic_nodes:
+        print(f"Node '{node_id}' has {failure_rate:.1%} failure rate")
 
-# Get improvement recommendations
-suggestions = query.suggest_improvements("my_goal")
+# Analyze a specific failure
+analysis = query.analyze_failure("run_20260119_143022_abc123")
+if analysis:
+    print(f"Failure point: {analysis.failure_point}")
+    print(f"Root cause: {analysis.root_cause}")
+    print(f"\nSuggestions:")
+    for suggestion in analysis.suggestions:
+        print(f"  - {suggestion}")
+
+# Get improvement recommendations for a goal
+suggestions = query.suggest_improvements("data-processor")
 for s in suggestions:
     print(f"[{s['priority']}] {s['recommendation']}")
+    print(f"  Reason: {s['reason']}")
+
+# Get performance metrics for a specific node
+perf = query.get_node_performance("processor-node")
+print(f"Node: {perf['node_id']}")
+print(f"Success rate: {perf['success_rate']:.1%}")
+print(f"Avg latency: {perf['avg_latency_ms']:.0f}ms")
 ```
 
 ## Architecture
 
+The framework consists of several layers:
+
 ```
 ┌─────────────────┐
-│  Human Engineer │  ← Supervision, approval
+│  Human Engineer │  ← Supervision, approval via HITL
 └────────┬────────┘
          │
 ┌────────▼────────┐
-│   Builder LLM   │  ← Analyzes runs, suggests improvements
+│   Builder LLM   │  ← Analyzes runs, suggests improvements (via MCP)
 │  (BuilderQuery) │
 └────────┬────────┘
          │
 ┌────────▼────────┐
-│   Agent LLM     │  ← Executes tasks, records decisions
-│    (Runtime)    │
+│   Agent Graph   │  ← Node-based execution flow
+│   (AgentRunner) │     (llm_generate, llm_tool_use, router, function)
+└────────┬────────┘
+         │
+┌────────▼────────┐
+│    Runtime      │  ← Records decisions, outcomes, problems
+│   (Decision DB) │
 └─────────────────┘
 ```
 
 ## Key Concepts
 
+### Graph-Based Agents
+
+Agents are defined as directed graphs with:
+- **Nodes**: Execution steps (llm_generate, llm_tool_use, router, function)
+- **Edges**: Control flow between nodes, including conditional routing
+- **Goal**: What the agent is designed to accomplish with success criteria
+- **Constraints**: Hard and soft limits on agent behavior
+
+### Decision Recording
+
 - **Decision**: The atomic unit of agent behavior. Captures intent, options, choice, and reasoning.
-- **Run**: A complete execution with all decisions and outcomes.
-- **Runtime**: Interface agents use to record their behavior.
-- **BuilderQuery**: Interface Builder uses to analyze agent behavior.
+- **Outcome**: Result of executing a decision (success/failure, latency, tokens, state changes)
+- **Run**: A complete execution trace with all decisions and outcomes
+- **Problem**: Issues reported during execution with severity and suggested fixes
+
+### Analysis & Improvement
+
+- **Runtime**: Interface agents use to record their behavior during execution
+- **BuilderQuery**: Interface for analyzing agent runs and identifying patterns
+- **PatternAnalysis**: Cross-run analysis showing success rates, common failures, problematic nodes
+- **FailureAnalysis**: Deep dive into why a specific run failed with suggestions
+
+### Human-in-the-Loop (HITL)
+
+- **Approval Callbacks**: Nodes can require human approval before execution
+- **Interactive Shell**: Chat-like interface for running agents with approval prompts
+- **Session State**: Agents can pause and resume based on user input
+
+### Multi-Agent Orchestration
+
+- **AgentOrchestrator**: Dispatch requests to multiple agents
+- **Agent Discovery**: Automatically discover and register agents from a directory
+- **Dispatch Strategy**: Route requests to the most appropriate agent(s)
+
+## Example Agents
+
+The `exports/` directory contains example agents you can run or use as templates:
+
+- **task-planner**: Breaks down complex objectives into actionable tasks with dependencies
+- **research-summary-agent**: Conducts research and generates summaries
+- **outbound-sales-agent**: Handles outbound sales workflows
+- **youtube-comments-research**: Analyzes YouTube comments for insights
+
+Each agent includes:
+- `agent.json`: Graph definition with nodes, edges, goal, and constraints
+- `README.md`: Agent documentation
+- `tools.py` (optional): Custom tool implementations
 
 ## Requirements
 
 - Python 3.11+
 - pydantic >= 2.0
 - anthropic >= 0.40.0 (for LLM-powered agents)
+- mcp, fastmcp (optional, for MCP server)