228 lines
7.4 KiB
Python
228 lines
7.4 KiB
Python
# router.py
|
|
|
|
import os
|
|
import logging
|
|
from fastapi import APIRouter, HTTPException
|
|
from pydantic import BaseModel
|
|
|
|
from reasoning.reasoning import reason_check
|
|
from reasoning.reflection import reflect_notes
|
|
from reasoning.refine import refine_answer
|
|
from persona.speak import speak
|
|
from persona.identity import load_identity
|
|
from ingest.intake_client import IntakeClient
|
|
from context import collect_context, update_last_assistant_message
|
|
from intake.intake import add_exchange_internal
|
|
|
|
|
|
# -----------------------------
|
|
# Debug configuration
|
|
# -----------------------------
|
|
VERBOSE_DEBUG = os.getenv("VERBOSE_DEBUG", "false").lower() == "true"
|
|
logger = logging.getLogger(__name__)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.setLevel(logging.DEBUG)
|
|
|
|
# Console handler
|
|
console_handler = logging.StreamHandler()
|
|
console_handler.setFormatter(logging.Formatter(
|
|
'%(asctime)s [ROUTER] %(levelname)s: %(message)s',
|
|
datefmt='%H:%M:%S'
|
|
))
|
|
logger.addHandler(console_handler)
|
|
|
|
# File handler
|
|
try:
|
|
os.makedirs('/app/logs', exist_ok=True)
|
|
file_handler = logging.FileHandler('/app/logs/cortex_verbose_debug.log', mode='a')
|
|
file_handler.setFormatter(logging.Formatter(
|
|
'%(asctime)s [ROUTER] %(levelname)s: %(message)s',
|
|
datefmt='%Y-%m-%d %H:%M:%S'
|
|
))
|
|
logger.addHandler(file_handler)
|
|
logger.debug("VERBOSE_DEBUG mode enabled for router.py - logging to file")
|
|
except Exception as e:
|
|
logger.debug(f"VERBOSE_DEBUG mode enabled for router.py - file logging failed: {e}")
|
|
|
|
# -----------------------------
|
|
# Router (NOT FastAPI app)
|
|
# -----------------------------
|
|
cortex_router = APIRouter()
|
|
|
|
# Initialize Intake client once
|
|
intake_client = IntakeClient()
|
|
|
|
|
|
# -----------------------------
|
|
# Pydantic models
|
|
# -----------------------------
|
|
class ReasonRequest(BaseModel):
|
|
session_id: str
|
|
user_prompt: str
|
|
temperature: float | None = None
|
|
|
|
|
|
# -----------------------------
|
|
# /reason endpoint
|
|
# -----------------------------
|
|
@cortex_router.post("/reason")
|
|
async def run_reason(req: ReasonRequest):
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"\n{'='*80}")
|
|
logger.debug(f"[PIPELINE START] Session: {req.session_id}")
|
|
logger.debug(f"[PIPELINE START] User prompt: {req.user_prompt[:200]}...")
|
|
logger.debug(f"{'='*80}\n")
|
|
|
|
# 0. Collect unified context from all sources
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 0] Collecting unified context...")
|
|
|
|
context_state = await collect_context(req.session_id, req.user_prompt)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 0] Context collected - {len(context_state.get('rag', []))} RAG results")
|
|
|
|
# 0.5. Load identity block
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 0.5] Loading identity block...")
|
|
|
|
identity_block = load_identity(req.session_id)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 0.5] Identity loaded: {identity_block.get('name', 'Unknown')}")
|
|
|
|
# 1. Extract Intake summary for reflection
|
|
# Use L20 (Session Overview) as primary summary for reflection
|
|
intake_summary = "(no context available)"
|
|
if context_state.get("intake"):
|
|
l20_summary = context_state["intake"].get("L20")
|
|
if l20_summary and isinstance(l20_summary, dict):
|
|
intake_summary = l20_summary.get("summary", "(no context available)")
|
|
elif isinstance(l20_summary, str):
|
|
intake_summary = l20_summary
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 1] Intake summary extracted (L20): {intake_summary[:150]}...")
|
|
|
|
# 2. Reflection
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 2] Running reflection...")
|
|
|
|
try:
|
|
reflection = await reflect_notes(intake_summary, identity_block=identity_block)
|
|
reflection_notes = reflection.get("notes", [])
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 2] Reflection complete - {len(reflection_notes)} notes generated")
|
|
for idx, note in enumerate(reflection_notes, 1):
|
|
logger.debug(f" Note {idx}: {note}")
|
|
except Exception as e:
|
|
reflection_notes = []
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 2] Reflection failed: {e}")
|
|
|
|
# 3. First-pass reasoning draft
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 3] Running reasoning (draft)...")
|
|
|
|
draft = await reason_check(
|
|
req.user_prompt,
|
|
identity_block=identity_block,
|
|
rag_block=context_state.get("rag", []),
|
|
reflection_notes=reflection_notes,
|
|
context=context_state
|
|
)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 3] Draft answer ({len(draft)} chars):")
|
|
logger.debug(f"--- DRAFT START ---\n{draft}\n--- DRAFT END ---")
|
|
|
|
# 4. Refinement
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 4] Running refinement...")
|
|
|
|
result = await refine_answer(
|
|
draft_output=draft,
|
|
reflection_notes=reflection_notes,
|
|
identity_block=identity_block,
|
|
rag_block=context_state.get("rag", []),
|
|
)
|
|
final_neutral = result["final_output"]
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 4] Refined answer ({len(final_neutral)} chars):")
|
|
logger.debug(f"--- REFINED START ---\n{final_neutral}\n--- REFINED END ---")
|
|
|
|
# 5. Persona layer
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 5] Applying persona layer...")
|
|
|
|
persona_answer = await speak(final_neutral)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"[STAGE 5] Persona answer ({len(persona_answer)} chars):")
|
|
logger.debug(f"--- PERSONA START ---\n{persona_answer}\n--- PERSONA END ---")
|
|
|
|
# 6. Update session state with assistant's response
|
|
if VERBOSE_DEBUG:
|
|
logger.debug("[STAGE 6] Updating session state...")
|
|
|
|
update_last_assistant_message(req.session_id, persona_answer)
|
|
|
|
if VERBOSE_DEBUG:
|
|
logger.debug(f"\n{'='*80}")
|
|
logger.debug(f"[PIPELINE COMPLETE] Session: {req.session_id}")
|
|
logger.debug(f"[PIPELINE COMPLETE] Final answer length: {len(persona_answer)} chars")
|
|
logger.debug(f"{'='*80}\n")
|
|
|
|
# 7. Return full bundle
|
|
return {
|
|
"draft": draft,
|
|
"neutral": final_neutral,
|
|
"persona": persona_answer,
|
|
"reflection": reflection_notes,
|
|
"session_id": req.session_id,
|
|
"context_summary": {
|
|
"rag_results": len(context_state.get("rag", [])),
|
|
"minutes_since_last": context_state.get("minutes_since_last_msg"),
|
|
"message_count": context_state.get("message_count"),
|
|
"mode": context_state.get("mode"),
|
|
}
|
|
}
|
|
|
|
|
|
# -----------------------------
|
|
# Intake ingest (internal feed)
|
|
# -----------------------------
|
|
class IngestPayload(BaseModel):
|
|
session_id: str
|
|
user_msg: str
|
|
assistant_msg: str
|
|
|
|
@cortex_router.post("/ingest")
|
|
async def ingest(payload: IngestPayload):
|
|
"""
|
|
Relay calls this after /reason.
|
|
We update Cortex state AND feed Intake's internal buffer.
|
|
"""
|
|
|
|
# 1. Update Cortex session state
|
|
update_last_assistant_message(payload.session_id, payload.assistant_msg)
|
|
|
|
# 2. Feed Intake internally (no HTTP)
|
|
try:
|
|
add_exchange_internal({
|
|
"session_id": payload.session_id,
|
|
"user_msg": payload.user_msg,
|
|
"assistant_msg": payload.assistant_msg,
|
|
})
|
|
|
|
logger.debug(f"[INGEST] Added exchange to Intake for {payload.session_id}")
|
|
except Exception as e:
|
|
logger.warning(f"[INGEST] Failed to add exchange to Intake: {e}")
|
|
|
|
return {"ok": True, "session_id": payload.session_id}
|
|
|