autonomy build, phase 1

2025-12-14 01:44:05 -05:00
parent fa4dd46cfc
commit 49f792f20c
10 changed files with 735 additions and 14 deletions
--- a/cortex/tests/test_autonomy_phase1.py
+++ b/cortex/tests/test_autonomy_phase1.py
@@ -0,0 +1,197 @@
+"""
+Integration tests for Phase 1 autonomy features.
+Tests monologue integration, executive planning, and self-state persistence.
+"""
+
+import asyncio
+import json
+import sys
+import os
+
+# Add parent directory to path for imports
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+
+from autonomy.monologue.monologue import InnerMonologue
+from autonomy.self.state import load_self_state, update_self_state, get_self_state_instance
+from autonomy.executive.planner import plan_execution
+
+
+async def test_monologue_integration():
+    """Test monologue generates valid output."""
+    print("\n" + "="*60)
+    print("TEST 1: Monologue Integration")
+    print("="*60)
+
+    mono = InnerMonologue()
+
+    context = {
+        "user_message": "Explain quantum computing to me like I'm 5",
+        "session_id": "test_001",
+        "self_state": load_self_state(),
+        "context_summary": {"message_count": 5}
+    }
+
+    result = await mono.process(context)
+
+    assert "intent" in result, "Missing intent field"
+    assert "tone" in result, "Missing tone field"
+    assert "depth" in result, "Missing depth field"
+    assert "consult_executive" in result, "Missing consult_executive field"
+
+    print("✓ Monologue integration test passed")
+    print(f"  Result: {json.dumps(result, indent=2)}")
+
+    return result
+
+
+async def test_executive_planning():
+    """Test executive planner generates valid plans."""
+    print("\n" + "="*60)
+    print("TEST 2: Executive Planning")
+    print("="*60)
+
+    plan = await plan_execution(
+        user_prompt="Help me build a distributed system with microservices architecture",
+        intent="technical_implementation",
+        context_state={
+            "tools_available": ["RAG", "WEB", "CODEBRAIN"],
+            "message_count": 3,
+            "minutes_since_last_msg": 2.5,
+            "active_project": None
+        },
+        identity_block={}
+    )
+
+    assert "summary" in plan, "Missing summary field"
+    assert "plan_text" in plan, "Missing plan_text field"
+    assert "steps" in plan, "Missing steps field"
+    assert len(plan["steps"]) > 0, "No steps generated"
+
+    print("✓ Executive planning test passed")
+    print(f"  Plan summary: {plan['summary']}")
+    print(f"  Steps: {len(plan['steps'])}")
+    print(f"  Complexity: {plan.get('estimated_complexity', 'unknown')}")
+
+    return plan
+
+
+def test_self_state_persistence():
+    """Test self-state loads and updates."""
+    print("\n" + "="*60)
+    print("TEST 3: Self-State Persistence")
+    print("="*60)
+
+    state1 = load_self_state()
+    assert "mood" in state1, "Missing mood field"
+    assert "energy" in state1, "Missing energy field"
+    assert "interaction_count" in state1, "Missing interaction_count"
+
+    initial_count = state1.get("interaction_count", 0)
+    print(f"  Initial interaction count: {initial_count}")
+
+    update_self_state(
+        mood_delta=0.1,
+        energy_delta=-0.05,
+        new_focus="testing"
+    )
+
+    state2 = load_self_state()
+    assert state2["interaction_count"] == initial_count + 1, "Interaction count not incremented"
+    assert state2["focus"] == "testing", "Focus not updated"
+
+    print("✓ Self-state persistence test passed")
+    print(f"  New interaction count: {state2['interaction_count']}")
+    print(f"  New focus: {state2['focus']}")
+    print(f"  New energy: {state2['energy']:.2f}")
+
+    return state2
+
+
+async def test_end_to_end_flow():
+    """Test complete flow from monologue through planning."""
+    print("\n" + "="*60)
+    print("TEST 4: End-to-End Flow")
+    print("="*60)
+
+    # Step 1: Monologue detects complex query
+    mono = InnerMonologue()
+    mono_result = await mono.process({
+        "user_message": "Design a scalable ML pipeline with CI/CD integration",
+        "session_id": "test_e2e",
+        "self_state": load_self_state(),
+        "context_summary": {}
+    })
+
+    print(f"  Monologue intent: {mono_result.get('intent')}")
+    print(f"  Consult executive: {mono_result.get('consult_executive')}")
+
+    # Step 2: If executive requested, generate plan
+    if mono_result.get("consult_executive"):
+        plan = await plan_execution(
+            user_prompt="Design a scalable ML pipeline with CI/CD integration",
+            intent=mono_result.get("intent", "unknown"),
+            context_state={"tools_available": ["CODEBRAIN", "WEB"]},
+            identity_block={}
+        )
+
+        assert plan is not None, "Plan should be generated"
+        print(f"  Executive plan generated: {len(plan.get('steps', []))} steps")
+
+    # Step 3: Update self-state
+    update_self_state(
+        energy_delta=-0.1,  # Complex task is tiring
+        new_focus="ml_pipeline_design",
+        confidence_delta=0.05
+    )
+
+    state = load_self_state()
+    assert state["focus"] == "ml_pipeline_design", "Focus should be updated"
+
+    print("✓ End-to-end flow test passed")
+    print(f"  Final state: {state['mood']}, energy={state['energy']:.2f}")
+
+    return True
+
+
+async def run_all_tests():
+    """Run all Phase 1 tests."""
+    print("\n" + "="*60)
+    print("PHASE 1 AUTONOMY TESTS")
+    print("="*60)
+
+    try:
+        # Test 1: Monologue
+        mono_result = await test_monologue_integration()
+
+        # Test 2: Executive Planning
+        plan_result = await test_executive_planning()
+
+        # Test 3: Self-State
+        state_result = test_self_state_persistence()
+
+        # Test 4: End-to-End
+        await test_end_to_end_flow()
+
+        print("\n" + "="*60)
+        print("ALL TESTS PASSED ✓")
+        print("="*60)
+
+        print("\nSummary:")
+        print(f"  - Monologue: {mono_result.get('intent')} ({mono_result.get('tone')})")
+        print(f"  - Executive: {plan_result.get('estimated_complexity')} complexity")
+        print(f"  - Self-state: {state_result.get('interaction_count')} interactions")
+
+        return True
+
+    except Exception as e:
+        print("\n" + "="*60)
+        print(f"TEST FAILED: {e}")
+        print("="*60)
+        import traceback
+        traceback.print_exc()
+        return False
+
+
+if __name__ == "__main__":
+    success = asyncio.run(run_all_tests())
+    sys.exit(0 if success else 1)