v0.8.0: refactor agent.py into modular package

Split 1161-line monolith into agent/ package:
auth, llm, types, process, runtime, api, and
nodes/ (base, sensor, input, output, thinker, memorizer).
No logic changes — pure structural split.
uvicorn agent:app entrypoint unchanged.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
Nico 2026-03-28 01:36:41 +01:00
parent 20363a1f2f
commit 7458b2ea35
15 changed files with 1172 additions and 1160 deletions

1160
agent.py

File diff suppressed because it is too large Load Diff

37
agent/__init__.py Normal file
View File

@ -0,0 +1,37 @@
"""Cognitive Agent Runtime — modular package.
uvicorn entrypoint: agent:app
"""
import logging
from pathlib import Path
from dotenv import load_dotenv
load_dotenv(Path(__file__).parent.parent / ".env")
logging.basicConfig(level=logging.INFO, format="%(asctime)s [%(name)s] %(message)s", datefmt="%H:%M:%S")
from fastapi import FastAPI
from fastapi.responses import FileResponse
from fastapi.staticfiles import StaticFiles
from .api import register_routes
STATIC_DIR = Path(__file__).parent.parent / "static"
app = FastAPI(title="cog")
# Register all API + WS routes
register_routes(app)
# Serve index.html explicitly, then static assets
@app.get("/")
async def index():
return FileResponse(STATIC_DIR / "index.html")
@app.get("/callback")
async def callback():
"""OIDC callback — serves the same SPA, JS handles the code exchange."""
return FileResponse(STATIC_DIR / "index.html")
app.mount("/static", StaticFiles(directory=STATIC_DIR), name="static")

188
agent/api.py Normal file
View File

@ -0,0 +1,188 @@
"""API endpoints, SSE, polling."""
import asyncio
import hashlib
import json
import logging
from asyncio import Queue
from pathlib import Path
from fastapi import Depends, HTTPException, Query, WebSocket, WebSocketDisconnect
from starlette.responses import StreamingResponse
import httpx
from .auth import AUTH_ENABLED, ZITADEL_ISSUER, _validate_token, require_auth
from .runtime import Runtime, TRACE_FILE
log = logging.getLogger("runtime")
# Active runtime reference (set by WS endpoint)
_active_runtime: Runtime | None = None
# SSE subscribers
_sse_subscribers: list[Queue] = []
def _broadcast_sse(event: dict):
"""Push an event to all SSE subscribers."""
for q in _sse_subscribers:
try:
q.put_nowait(event)
except asyncio.QueueFull:
pass
def _state_hash() -> str:
if not _active_runtime:
return "no_session"
raw = json.dumps({
"mem": _active_runtime.memorizer.state,
"hlen": len(_active_runtime.history),
}, sort_keys=True)
return hashlib.md5(raw.encode()).hexdigest()[:12]
def register_routes(app):
    """Register all API routes on the FastAPI app.

    Routes close over module-level state (_active_runtime, _sse_subscribers)
    rather than app.state — exactly one chat session exists per process.
    """
    @app.get("/health")
    async def health():
        # Liveness probe — intentionally unauthenticated.
        return {"status": "ok"}

    @app.get("/auth/config")
    async def auth_config():
        # Local re-import so the endpoint reads the current module values.
        from .auth import ZITADEL_ISSUER, ZITADEL_CLIENT_ID, ZITADEL_PROJECT_ID, AUTH_ENABLED
        return {
            "enabled": AUTH_ENABLED,
            "issuer": ZITADEL_ISSUER,
            "clientId": ZITADEL_CLIENT_ID,
            "projectId": ZITADEL_PROJECT_ID,
        }

    @app.websocket("/ws")
    async def ws_endpoint(ws: WebSocket, token: str | None = Query(None),
                          access_token: str | None = Query(None)):
        """Main chat WebSocket: one Runtime per connection.

        NOTE(review): when AUTH_ENABLED is true but no `token` query param
        is supplied, the connection proceeds as anonymous — confirm this
        fall-through is intentional and not an auth bypass.
        """
        global _active_runtime
        user_claims = {"sub": "anonymous"}
        if AUTH_ENABLED and token:
            try:
                user_claims = await _validate_token(token)
                # ID-token claims may lack profile fields; enrich from the
                # userinfo endpoint using the separate access token.
                if not user_claims.get("name") and access_token:
                    async with httpx.AsyncClient() as client:
                        resp = await client.get(f"{ZITADEL_ISSUER}/oidc/v1/userinfo",
                                                headers={"Authorization": f"Bearer {access_token}"})
                        if resp.status_code == 200:
                            info = resp.json()
                            log.info(f"[auth] userinfo enrichment: {info}")
                            user_claims["name"] = info.get("name")
                            user_claims["preferred_username"] = info.get("preferred_username")
                            user_claims["email"] = info.get("email")
            except HTTPException:
                await ws.close(code=4001, reason="Invalid token")
                return
        origin = ws.headers.get("origin", ws.headers.get("host", ""))
        await ws.accept()
        runtime = Runtime(ws, user_claims=user_claims, origin=origin, broadcast=_broadcast_sse)
        # Last-connected client wins the shared module-level session slot.
        _active_runtime = runtime
        try:
            while True:
                data = await ws.receive_text()
                msg = json.loads(data)
                if msg.get("type") == "action":
                    # UI control click: forwarded to the runtime as a
                    # bracketed pseudo-message.
                    action_text = f"[user clicked: {msg.get('action', 'unknown')}]"
                    if msg.get("data"):
                        action_text += f" data: {json.dumps(msg['data'])}"
                    await runtime.handle_message(action_text)
                elif msg.get("type") == "cancel_process":
                    runtime.process_manager.cancel(msg.get("pid", 0))
                else:
                    await runtime.handle_message(msg.get("text", ""))
        except WebSocketDisconnect:
            runtime.sensor.stop()
            # Only clear the slot if no newer connection replaced us.
            if _active_runtime is runtime:
                _active_runtime = None

    @app.get("/api/events")
    async def sse_events(user=Depends(require_auth)):
        """Server-sent-events stream mirroring runtime events."""
        q: Queue = Queue(maxsize=100)
        _sse_subscribers.append(q)

        async def generate():
            try:
                while True:
                    event = await q.get()
                    yield f"data: {json.dumps(event)}\n\n"
            except asyncio.CancelledError:
                pass
            finally:
                # Drop our queue once the client disconnects.
                _sse_subscribers.remove(q)
        return StreamingResponse(generate(), media_type="text/event-stream",
                                 headers={"Cache-Control": "no-cache", "X-Accel-Buffering": "no"})

    @app.get("/api/poll")
    async def poll(since: str = "", user=Depends(require_auth)):
        """Cheap polling endpoint: clients pass back the last hash they saw."""
        h = _state_hash()
        if since and since == h:
            return {"changed": False, "hash": h}
        return {
            "changed": True,
            "hash": h,
            "state": _active_runtime.memorizer.state if _active_runtime else None,
            "history_len": len(_active_runtime.history) if _active_runtime else 0,
            "last_messages": _active_runtime.history[-3:] if _active_runtime else [],
        }

    @app.post("/api/send")
    async def api_send(body: dict, user=Depends(require_auth)):
        """Inject a message into the active WS session (REST side-channel)."""
        if not _active_runtime:
            raise HTTPException(status_code=409, detail="No active session -- someone must be connected via WS first")
        text = body.get("text", "").strip()
        if not text:
            raise HTTPException(status_code=400, detail="Missing 'text' field")
        await _active_runtime.handle_message(text)
        return {
            "status": "ok",
            "response": _active_runtime.history[-1]["content"] if _active_runtime.history else "",
            "memorizer": _active_runtime.memorizer.state,
        }

    @app.post("/api/clear")
    async def api_clear(user=Depends(require_auth)):
        # Clears conversation history only; memorizer state is kept.
        if not _active_runtime:
            raise HTTPException(status_code=409, detail="No active session")
        _active_runtime.history.clear()
        return {"status": "cleared"}

    @app.get("/api/state")
    async def get_state(user=Depends(require_auth)):
        """Snapshot of the memorizer state and history length."""
        if not _active_runtime:
            return {"status": "no_session"}
        return {
            "status": "active",
            "memorizer": _active_runtime.memorizer.state,
            "history_len": len(_active_runtime.history),
        }

    @app.get("/api/history")
    async def get_history(last: int = 10, user=Depends(require_auth)):
        """Return the last `last` chat messages."""
        if not _active_runtime:
            return {"status": "no_session", "messages": []}
        return {
            "status": "active",
            "messages": _active_runtime.history[-last:],
        }

    @app.get("/api/trace")
    async def get_trace(last: int = 30, user=Depends(require_auth)):
        """Return the last `last` parsed entries of the JSONL trace file."""
        if not TRACE_FILE.exists():
            return {"lines": []}
        lines = TRACE_FILE.read_text(encoding="utf-8").strip().split("\n")
        parsed = []
        for line in lines[-last:]:
            try:
                parsed.append(json.loads(line))
            except json.JSONDecodeError:
                # Skip partially-written / corrupt trace lines.
                pass
        return {"lines": parsed}

92
agent/auth.py Normal file
View File

@ -0,0 +1,92 @@
"""OIDC auth: Zitadel token validation, FastAPI dependencies."""
import json
import logging
import os
import time
import httpx
from fastapi import Depends, HTTPException, Query
from fastapi.security import HTTPAuthorizationCredentials, HTTPBearer
log = logging.getLogger("runtime")

# Zitadel OIDC configuration. Defaults point at the dev instance; override via env.
ZITADEL_ISSUER = os.environ.get("ZITADEL_ISSUER", "https://auth.loop42.de")
ZITADEL_CLIENT_ID = os.environ.get("ZITADEL_CLIENT_ID", "365996029172056091")
ZITADEL_PROJECT_ID = os.environ.get("ZITADEL_PROJECT_ID", "365995955654230043")
# Auth is opt-in: set AUTH_ENABLED=true to enforce token validation.
AUTH_ENABLED = os.environ.get("AUTH_ENABLED", "false").lower() == "true"
# Comma-separated static machine-to-machine tokens (empty entries dropped).
SERVICE_TOKENS = set(filter(None, os.environ.get("SERVICE_TOKENS", "").split(",")))
_jwks_cache: dict = {"keys": [], "fetched_at": 0}
async def _get_jwks():
if time.time() - _jwks_cache["fetched_at"] < 3600:
return _jwks_cache["keys"]
async with httpx.AsyncClient() as client:
resp = await client.get(f"{ZITADEL_ISSUER}/oauth/v2/keys")
_jwks_cache["keys"] = resp.json()["keys"]
_jwks_cache["fetched_at"] = time.time()
return _jwks_cache["keys"]
async def _validate_token(token: str) -> dict:
    """Validate token: check service tokens, then JWT, then userinfo.

    Resolution order:
      1. static service tokens from SERVICE_TOKENS (machine-to-machine),
      2. local RS256 signature verification against the cached JWKS,
      3. fallback: send the (possibly opaque) token to the userinfo endpoint.

    Raises HTTPException(401) when all three fail.
    """
    import base64
    if token in SERVICE_TOKENS:
        return {"sub": "titan", "username": "titan", "source": "service_token"}
    try:
        parts = token.split(".")
        if len(parts) == 3:
            # Looks like a JWT — verify the signature locally.
            keys = await _get_jwks()
            # Re-pad the base64url header segment before decoding.
            header_b64 = parts[0] + "=" * (4 - len(parts[0]) % 4)
            header = json.loads(base64.urlsafe_b64decode(header_b64))
            kid = header.get("kid")
            key = next((k for k in keys if k["kid"] == kid), None)
            if key:
                # PyJWT imported lazily so the module loads without it when
                # auth is disabled.
                import jwt as pyjwt
                from jwt import PyJWK
                jwk_obj = PyJWK(key)
                claims = pyjwt.decode(
                    token, jwk_obj.key, algorithms=["RS256"],
                    issuer=ZITADEL_ISSUER, options={"verify_aud": False},
                )
                return claims
    except Exception:
        # NOTE(review): this swallows ALL JWT errors (including invalid
        # signatures) and falls through to the userinfo check below —
        # confirm that trust model is intentional.
        pass
    async with httpx.AsyncClient() as client:
        resp = await client.get(
            f"{ZITADEL_ISSUER}/oidc/v1/userinfo",
            headers={"Authorization": f"Bearer {token}"},
        )
        if resp.status_code == 200:
            info = resp.json()
            # NOTE(review): logs the full userinfo payload (PII) at INFO level.
            log.info(f"[auth] userinfo response: {info}")
            return {"sub": info.get("sub"), "preferred_username": info.get("preferred_username"),
                    "email": info.get("email"), "name": info.get("name"), "source": "userinfo"}
    raise HTTPException(status_code=401, detail="Invalid token")
# Shared bearer-token extractor; auto_error=False so a missing header yields
# None instead of an immediate 403, letting us decide below.
_bearer = HTTPBearer(auto_error=False)


async def require_auth(credentials: HTTPAuthorizationCredentials | None = Depends(_bearer)):
    """FastAPI dependency: resolve the caller's identity claims.

    With auth disabled every caller is anonymous; otherwise a bearer token
    is mandatory and must validate.
    """
    if AUTH_ENABLED:
        if not credentials:
            raise HTTPException(status_code=401, detail="Missing token")
        return await _validate_token(credentials.credentials)
    return {"sub": "anonymous"}
async def ws_auth(token: str | None = Query(None)) -> dict | None:
    """Validate a WebSocket token passed as a query parameter.

    Returns anonymous claims when auth is disabled, ``None`` when no token
    was supplied (the caller decides whether to reject the socket), or the
    validated claims. Propagates HTTPException from _validate_token on a
    bad token.

    Fix: return annotation was `dict`, but the no-token path returns None —
    now declared `dict | None`.
    """
    if not AUTH_ENABLED:
        return {"sub": "anonymous"}
    if not token:
        # No token at all: signal "unauthenticated" instead of raising, so
        # the WS handler can pick its own close code.
        return None
    return await _validate_token(token)

76
agent/llm.py Normal file
View File

@ -0,0 +1,76 @@
"""LLM helper: OpenRouter calls, token estimation, context fitting."""
import json
import logging
import os
from typing import Any
import httpx
log = logging.getLogger("runtime")

# OpenRouter credentials + endpoint; key comes from the environment/.env.
API_KEY = os.environ.get("OPENROUTER_API_KEY", "")
OPENROUTER_URL = "https://openrouter.ai/api/v1/chat/completions"
async def llm_call(model: str, messages: list[dict], stream: bool = False) -> Any:
    """Single LLM call via OpenRouter. Returns full text or (client, response) for streaming.

    Non-streaming: returns the response text, or an "[LLM error: ...]"
    string when the API reports an error. Streaming: returns the open
    (client, response) pair — the caller must close both.

    Fix over the previous version: the AsyncClient is now closed on every
    error path (it leaked whenever the request raised).
    """
    headers = {"Authorization": f"Bearer {API_KEY}", "Content-Type": "application/json"}
    body = {"model": model, "messages": messages, "stream": stream}
    client = httpx.AsyncClient(timeout=60)
    if stream:
        try:
            request = client.build_request("POST", OPENROUTER_URL, headers=headers, json=body)
            resp = await client.send(request, stream=True)
        except Exception:
            # Don't leak the client if the connection itself fails.
            await client.aclose()
            raise
        return client, resp
    try:
        resp = await client.post(OPENROUTER_URL, headers=headers, json=body)
    finally:
        await client.aclose()
    data = resp.json()
    if "choices" not in data:
        log.error(f"LLM error: {data}")
        return f"[LLM error: {data.get('error', {}).get('message', 'unknown')}]"
    return data["choices"][0]["message"]["content"]
def estimate_tokens(text: str) -> int:
    """Cheap token-count heuristic: roughly 4 characters per token."""
    quarter, _ = divmod(len(text), 4)
    return quarter


def fit_context(messages: list[dict], max_tokens: int, protect_last: int = 4) -> list[dict]:
    """Trim oldest messages (after system prompt) to fit token budget.

    Always keeps the leading run of system prompts plus the final
    `protect_last` messages; middle messages are dropped oldest-first.
    If even the protected set overflows, messages after the first are
    shed oldest-first down to a floor of two.
    """
    if not messages:
        return messages
    # Split off the leading run of system prompts.
    split = 0
    while split < len(messages) and messages[split]["role"] == "system":
        split += 1
    system_msgs = messages[:split]
    rest = messages[split:]
    if len(rest) > protect_last:
        middle, protected = rest[:-protect_last], rest[-protect_last:]
    else:
        middle, protected = [], rest
    budget_used = sum(estimate_tokens(m["content"]) for m in system_msgs)
    budget_used += sum(estimate_tokens(m["content"]) for m in protected)
    if budget_used >= max_tokens:
        # Even the always-keep set is too big: shed from position 1 until
        # it fits or only two messages remain.
        survivors = system_msgs + protected
        total = sum(estimate_tokens(m["content"]) for m in survivors)
        while total > max_tokens and len(survivors) > 2:
            total -= estimate_tokens(survivors.pop(1)["content"])
        return survivors
    budget_left = max_tokens - budget_used
    kept: list[dict] = []
    # Walk the middle newest-first, keeping whatever still fits.
    for msg in reversed(middle):
        cost = estimate_tokens(msg["content"])
        if cost > budget_left:
            break
        kept.append(msg)
        budget_left -= cost
    kept.reverse()
    return system_msgs + kept + protected

9
agent/nodes/__init__.py Normal file
View File

@ -0,0 +1,9 @@
"""Node modules."""
from .sensor import SensorNode
from .input import InputNode
from .output import OutputNode
from .thinker import ThinkerNode
from .memorizer import MemorizerNode
__all__ = ["SensorNode", "InputNode", "OutputNode", "ThinkerNode", "MemorizerNode"]

31
agent/nodes/base.py Normal file
View File

@ -0,0 +1,31 @@
"""Base Node class with context management."""
import logging
from ..llm import estimate_tokens, fit_context
log = logging.getLogger("runtime")
class Node:
    """Common base for pipeline nodes: HUD event emission + context budgeting."""

    name: str = "node"
    model: str | None = None
    max_context_tokens: int = 4000

    def __init__(self, send_hud):
        # Async callback used to push HUD events to the frontend.
        self.send_hud = send_hud
        # Stats recorded by the most recent trim_context() call.
        self.last_context_tokens = 0
        self.context_fill_pct = 0

    async def hud(self, event: str, **data):
        """Emit a HUD event tagged with this node's name."""
        payload = {"node": self.name, "event": event}
        payload.update(data)
        await self.send_hud(payload)

    def trim_context(self, messages: list[dict]) -> list[dict]:
        """Fit messages within this node's token budget and record fill stats."""
        original_count = len(messages)
        trimmed = fit_context(messages, self.max_context_tokens)
        used = sum(estimate_tokens(m["content"]) for m in trimmed)
        self.last_context_tokens = used
        self.context_fill_pct = int(100 * used / self.max_context_tokens)
        if original_count != len(trimmed):
            log.info(
                f"[{self.name}] context trimmed: {original_count} -> "
                f"{len(trimmed)} msgs, {self.context_fill_pct}% fill"
            )
        return trimmed

48
agent/nodes/input.py Normal file
View File

@ -0,0 +1,48 @@
"""Input Node: perceives what the user said."""
import logging
from .base import Node
from ..llm import llm_call
from ..types import Envelope, Command
log = logging.getLogger("runtime")
class InputNode(Node):
    """Perception stage: turns the raw user utterance into an instruction."""

    name = "input"
    model = "google/gemini-2.0-flash-001"
    max_context_tokens = 2000

    SYSTEM = """You are the Input node — the ear of this cognitive runtime.
Listener context:
- Authenticated user: {identity}
- Channel: {channel} (Chrome browser on Nico's Windows PC, in his room at home)
- Physical: private space, Nico lives with Tina she may use this session too
- Security: single-user account, shared physical space other voices are trusted household
Your job: describe what you heard. Who spoke, what they want, what tone, what context matters.
ONE sentence. No content, no response just your perception of what came through.
{memory_context}"""

    async def process(self, envelope: Envelope, history: list[dict], memory_context: str = "",
                      identity: str = "unknown", channel: str = "unknown") -> Command:
        """Perceive the incoming envelope; emit a Command for the next stages."""
        await self.hud("thinking", detail="deciding how to respond")
        log.info(f"[input] user said: {envelope.text}")
        system_prompt = self.SYSTEM.format(
            memory_context=memory_context, identity=identity, channel=channel)
        convo = [{"role": "system", "content": system_prompt}, *history[-8:]]
        convo = self.trim_context(convo)
        await self.hud("context", messages=convo, tokens=self.last_context_tokens,
                       max_tokens=self.max_context_tokens, fill_pct=self.context_fill_pct)
        instruction = await llm_call(self.model, convo)
        log.info(f"[input] -> command: {instruction}")
        await self.hud("perceived", instruction=instruction)
        return Command(instruction=instruction, source_text=envelope.text)

99
agent/nodes/memorizer.py Normal file
View File

@ -0,0 +1,99 @@
"""Memorizer Node: S2 — shared state / coordination."""
import json
import logging
from .base import Node
from ..llm import llm_call
log = logging.getLogger("runtime")
class MemorizerNode(Node):
    """S2 — shared state / coordination.

    Maintains a small JSON state dict (user, mood, topic, facts, ...) that
    the other nodes embed into their prompts, and refreshes it after each
    exchange by asking the LLM to re-distill the conversation.
    """

    name = "memorizer"
    model = "google/gemini-2.0-flash-001"
    max_context_tokens = 3000

    DISTILL_SYSTEM = """You are the Memorizer node of a cognitive agent runtime.
After each exchange you update the shared state that Input and Output nodes read.
Given the conversation so far, output a JSON object with these fields:
- user_name: string how the user identifies themselves (null if unknown)
- user_mood: string current emotional tone (neutral, happy, frustrated, playful, etc.)
- topic: string what the conversation is about right now
- topic_history: list of strings previous topics in this session
- situation: string social/physical context if mentioned (e.g. "at a pub with tina", "private dev session")
- language: string primary language being used (en, de, mixed)
- style_hint: string how Output should talk (casual, formal, technical, poetic, etc.)
- facts: list of strings important facts learned about the user
Output ONLY valid JSON. No explanation, no markdown fences."""

    def __init__(self, send_hud):
        super().__init__(send_hud)
        # Shared state read by the other nodes; seeded with sane defaults.
        self.state: dict = {
            "user_name": None,
            "user_mood": "neutral",
            "topic": None,
            "topic_history": [],
            "situation": "localhost test runtime, private dev session",
            "language": "en",
            "style_hint": "casual, technical",
            "facts": [],
        }

    def get_context_block(self, sensor_lines: list[str] | None = None) -> str:
        """Render sensor lines plus the current shared state as a prompt block.

        Fix: operates on a copy — the previous version appended to the
        caller's `sensor_lines` list in place.
        """
        lines = list(sensor_lines) if sensor_lines else ["Sensors: (none)"]
        lines.append("")
        lines.append("Shared memory (from Memorizer):")
        for k, v in self.state.items():
            if v:
                lines.append(f"- {k}: {v}")
        return "\n".join(lines)

    @staticmethod
    def _strip_fences(raw: str) -> str:
        """Remove a leading/trailing markdown code fence from an LLM reply."""
        text = raw.strip()
        if text.startswith("```"):
            text = text.split("\n", 1)[1] if "\n" in text else text[3:]
        if text.endswith("```"):
            text = text[:-3]
        return text.strip()

    async def update(self, history: list[dict]):
        """Distill the recent conversation into a fresh shared state.

        On any failure (bad JSON, LLM error) the previous state is kept.
        """
        if len(history) < 2:
            # Not enough signal yet; just re-announce the current state.
            await self.hud("updated", state=self.state)
            return
        await self.hud("thinking", detail="updating shared state")
        messages = [
            {"role": "system", "content": self.DISTILL_SYSTEM},
            {"role": "system", "content": f"Current state: {json.dumps(self.state)}"},
            *history[-10:],
            {"role": "user", "content": "Update the shared state based on this conversation. Output JSON only."},
        ]
        messages = self.trim_context(messages)
        await self.hud("context", messages=messages, tokens=self.last_context_tokens,
                       max_tokens=self.max_context_tokens, fill_pct=self.context_fill_pct)
        raw = await llm_call(self.model, messages)
        log.info(f"[memorizer] raw: {raw[:200]}")
        text = self._strip_fences(raw)
        try:
            new_state = json.loads(text)
            # Merge facts deduped in insertion order (old first), capped at 20.
            # Fix: the old set-union merge had nondeterministic ordering, so
            # the [-20:] cap dropped arbitrary facts.
            merged = dict.fromkeys(self.state.get("facts", []))
            merged.update(dict.fromkeys(new_state.get("facts", [])))
            new_state["facts"] = list(merged)[-20:]
            if self.state.get("topic") and self.state["topic"] != new_state.get("topic"):
                hist = new_state.get("topic_history", [])
                if self.state["topic"] not in hist:
                    hist.append(self.state["topic"])
                new_state["topic_history"] = hist[-5:]
            self.state = new_state
            log.info(f"[memorizer] updated state: {self.state}")
            await self.hud("updated", state=self.state)
        except Exception as e:
            # Fix: `except (json.JSONDecodeError, Exception)` was redundant —
            # Exception already covers JSONDecodeError.
            log.error(f"[memorizer] update error: {e}, raw: {text[:200]}")
            await self.hud("error", detail=f"Update failed: {e}")
            await self.hud("updated", state=self.state)

63
agent/nodes/output.py Normal file
View File

@ -0,0 +1,63 @@
"""Output Node: streams natural response to the user."""
import json
import logging
from fastapi import WebSocket
from .base import Node
from ..llm import llm_call
from ..types import Command
log = logging.getLogger("runtime")
class OutputNode(Node):
    """Streams the final natural-language reply to the user over the WebSocket."""

    name = "output"
    model = "google/gemini-2.0-flash-001"
    max_context_tokens = 4000

    SYSTEM = """You are the Output node — the voice of this cognitive runtime.
The Input node sends you its perception of what the user said. This is internal context for you never repeat or echo it.
You respond to the USER, not to the Input node. Use the perception to understand intent, then act on it.
Be natural. Be concise. If the user asks you to do something, do it don't describe what you're about to do.
{memory_context}"""

    async def process(self, command: Command, history: list[dict], ws: WebSocket, memory_context: str = "") -> str:
        """Stream a reply token-by-token to `ws`; returns the full text."""
        await self.hud("streaming")
        messages = [
            {"role": "system", "content": self.SYSTEM.format(memory_context=memory_context)},
        ]
        for msg in history[-20:]:
            messages.append(msg)
        messages.append({"role": "system", "content": f"Input perception: {command.instruction}"})
        messages = self.trim_context(messages)
        await self.hud("context", messages=messages, tokens=self.last_context_tokens,
                       max_tokens=self.max_context_tokens, fill_pct=self.context_fill_pct)
        # Streaming call returns the open httpx client + response; we are
        # responsible for closing both (done in the finally below).
        client, resp = await llm_call(self.model, messages, stream=True)
        full_response = ""
        try:
            # OpenRouter streams OpenAI-style SSE: lines of "data: {json}".
            async for line in resp.aiter_lines():
                if not line.startswith("data: "):
                    continue
                payload = line[6:]
                if payload == "[DONE]":
                    break
                chunk = json.loads(payload)
                delta = chunk["choices"][0].get("delta", {})
                token = delta.get("content", "")
                if token:
                    full_response += token
                    await ws.send_text(json.dumps({"type": "delta", "content": token}))
        finally:
            await resp.aclose()
            await client.aclose()
        log.info(f"[output] response: {full_response[:100]}...")
        # Tell the frontend the stream is complete.
        await ws.send_text(json.dumps({"type": "done"}))
        await self.hud("done")
        return full_response

132
agent/nodes/sensor.py Normal file
View File

@ -0,0 +1,132 @@
"""Sensor Node: ticks independently, produces context for other nodes."""
import asyncio
import logging
import time
from datetime import datetime, timezone, timedelta
from .base import Node
log = logging.getLogger("runtime")
BERLIN = timezone(timedelta(hours=2))  # CEST — NOTE(review): fixed UTC+2, ignores DST transitions; confirm zoneinfo isn't wanted

class SensorNode(Node):
    """Ticks on a background task and produces context lines (clock,
    user-idle time, memorizer-state deltas) for the other nodes."""

    name = "sensor"

    def __init__(self, send_hud):
        super().__init__(send_hud)
        self.tick_count = 0
        self.running = False
        self._task: asyncio.Task | None = None
        # Seconds between ticks.
        self.interval = 5
        # Latest reading per sensor name: {"value": ..., "detail": ..., "changed_at": ...}.
        self.readings: dict[str, dict] = {}
        # Wall-clock time of the last user message (drives the idle sensor).
        self._last_user_activity: float = time.time()
        # Snapshot of memorizer state from the previous tick, for diffing.
        self._prev_memo_state: dict = {}

    def _now(self) -> datetime:
        return datetime.now(BERLIN)

    def _read_clock(self) -> dict:
        """Emit a reading only when the HH:MM display value changes."""
        now = self._now()
        current = now.strftime("%H:%M")
        prev = self.readings.get("clock", {}).get("value")
        if current != prev:
            return {"value": current, "detail": now.strftime("%Y-%m-%d %H:%M:%S %A"), "changed_at": time.time()}
        return {}

    def _read_idle(self) -> dict:
        """Emit a reading when idle time crosses one of the thresholds."""
        idle_s = time.time() - self._last_user_activity
        thresholds = [30, 60, 300, 600, 1800]
        prev_idle = self.readings.get("idle", {}).get("_raw", 0)
        for t in thresholds:
            # Fire exactly once per threshold crossed since the last tick.
            if prev_idle < t <= idle_s:
                if idle_s < 60:
                    label = f"{int(idle_s)}s"
                else:
                    label = f"{int(idle_s // 60)}m{int(idle_s % 60)}s"
                return {"value": label, "_raw": idle_s, "changed_at": time.time()}
        if "idle" in self.readings:
            # Keep the raw counter fresh even when no threshold fired.
            self.readings["idle"]["_raw"] = idle_s
        return {}

    def _read_memo_changes(self, memo_state: dict) -> dict:
        """Diff the memorizer state against the previous tick's snapshot."""
        changes = []
        for k, v in memo_state.items():
            prev = self._prev_memo_state.get(k)
            # prev is None both for "new key" and "was null" — only report
            # changes to keys that previously held a value.
            if v != prev and prev is not None:
                changes.append(f"{k}: {prev} -> {v}")
        self._prev_memo_state = dict(memo_state)
        if changes:
            return {"value": "; ".join(changes), "changed_at": time.time()}
        return {}

    def note_user_activity(self):
        """Reset the idle timer (called whenever the user sends something)."""
        self._last_user_activity = time.time()
        self.readings["idle"] = {"value": "active", "_raw": 0, "changed_at": time.time()}

    async def tick(self, memo_state: dict):
        """Run all readers once; HUD-report only the deltas."""
        self.tick_count += 1
        deltas = {}
        for name, reader in [("clock", self._read_clock),
                             ("idle", self._read_idle)]:
            update = reader()
            if update:
                self.readings[name] = {**self.readings.get(name, {}), **update}
                deltas[name] = update.get("value") or update.get("detail")
        memo_update = self._read_memo_changes(memo_state)
        if memo_update:
            self.readings["memo_delta"] = memo_update
            deltas["memo_delta"] = memo_update["value"]
        if deltas:
            await self.hud("tick", tick=self.tick_count, deltas=deltas)

    async def _loop(self, get_memo_state):
        """Background task body: tick every `interval` seconds until stopped."""
        self.running = True
        await self.hud("started", interval=self.interval)
        try:
            while self.running:
                await asyncio.sleep(self.interval)
                try:
                    await self.tick(get_memo_state())
                except Exception as e:
                    # A failing reader must not kill the loop.
                    log.error(f"[sensor] tick error: {e}")
        except asyncio.CancelledError:
            pass
        finally:
            self.running = False
            await self.hud("stopped")

    def start(self, get_memo_state):
        """Start the background loop (no-op if already running)."""
        if self._task and not self._task.done():
            return
        self._task = asyncio.create_task(self._loop(get_memo_state))

    def stop(self):
        """Stop the loop and cancel the background task."""
        self.running = False
        if self._task:
            self._task.cancel()

    def get_context_lines(self) -> list[str]:
        """Format current readings as prompt lines with human-readable ages."""
        if not self.readings:
            return ["Sensors: (no sensor node running)"]
        lines = [f"Sensors (tick #{self.tick_count}, {self.interval}s interval):"]
        for name, r in self.readings.items():
            if name.startswith("_"):
                continue
            val = r.get("value", "?")
            detail = r.get("detail")
            age = time.time() - r.get("changed_at", time.time())
            if age < 10:
                age_str = "just now"
            elif age < 60:
                age_str = f"{int(age)}s ago"
            else:
                age_str = f"{int(age // 60)}m ago"
            line = f"- {name}: {detail or val} [{age_str}]"
            lines.append(line)
        return lines

166
agent/nodes/thinker.py Normal file
View File

@ -0,0 +1,166 @@
"""Thinker Node: S3 — control, reasoning, tool use."""
import json
import logging
import re
from .base import Node
from ..llm import llm_call
from ..process import ProcessManager
from ..types import Command, ThoughtResult
log = logging.getLogger("runtime")
class ThinkerNode(Node):
    """S3 — control layer: decides between a direct reply, tool execution
    (python via ProcessManager) and UI control blocks."""

    name = "thinker"
    model = "google/gemini-2.5-flash-preview"
    max_context_tokens = 4000

    SYSTEM = """You are the Thinker node — the brain of this cognitive runtime.
You receive a perception of what the user said. Decide: answer directly, use a tool, or show UI controls.
TOOLS write a ```python code block and it WILL be executed. Use print() for output.
- For math, databases, file ops, any computation: write python. NEVER describe code write it.
- For simple conversation: respond directly as text.
UI CONTROLS to show interactive elements, include a JSON block:
```controls
[
  {{"type": "table", "data": [...], "columns": ["id", "name", "email"]}},
  {{"type": "button", "label": "Add Customer", "action": "add_customer"}},
  {{"type": "button", "label": "Refresh", "action": "refresh_customers"}}
]
```
Controls render in the chat. User clicks flow back as actions you can handle.
You can combine text + code + controls in one response.
{memory_context}"""

    def __init__(self, send_hud, process_manager: ProcessManager = None):
        super().__init__(send_hud)
        # ProcessManager for running generated python; None disables tools.
        self.pm = process_manager

    def _parse_tool_call(self, response: str) -> tuple[str, str] | None:
        """Parse tool calls. Supports TOOL: format and auto-detects python code blocks.

        Returns (tool_name, code) or None when the response contains no
        executable block.
        """
        text = response.strip()
        if text.startswith("TOOL:"):
            # Explicit "TOOL: name" header followed by a fenced code block.
            lines = text.split("\n")
            tool_name = lines[0].replace("TOOL:", "").strip()
            code_lines = []
            in_code = False
            for line in lines[1:]:
                if line.strip().startswith("```") and not in_code:
                    in_code = True
                    continue
                elif line.strip().startswith("```") and in_code:
                    break
                elif in_code:
                    code_lines.append(line)
                elif line.strip().startswith("CODE:"):
                    continue
            return (tool_name, "\n".join(code_lines)) if code_lines else None
        # Fallback: treat the first fenced code block as executable python.
        block_match = re.search(r'```(?:python|py|sql|sqlite|sh|bash|tool_code)?\s*\n(.*?)```', text, re.DOTALL)
        if block_match:
            code = block_match.group(1).strip()
            if code and len(code.split("\n")) > 0:
                # SQL-looking blocks get wrapped in a sqlite3 runner script
                # that executes the statements then dumps every table.
                # ({{...}} are f-string escapes: the generated script keeps
                # single-brace f-strings of its own.)
                if "```sql" in text or "```sqlite" in text or ("SELECT" in code.upper() and "CREATE" in code.upper()):
                    wrapped = f'''import sqlite3
conn = sqlite3.connect("/tmp/cog_db.sqlite")
cursor = conn.cursor()
for stmt in """{code}""".split(";"):
    stmt = stmt.strip()
    if stmt:
        cursor.execute(stmt)
conn.commit()
cursor.execute("SELECT name FROM sqlite_master WHERE type='table'")
tables = cursor.fetchall()
for t in tables:
    cursor.execute(f"SELECT * FROM {{t[0]}}")
    rows = cursor.fetchall()
    cols = [d[0] for d in cursor.description]
    print(f"Table: {{t[0]}}")
    print(" | ".join(cols))
    for row in rows:
        print(" | ".join(str(c) for c in row))
conn.close()'''
                    return ("python", wrapped)
                return ("python", code)
        return None

    def _parse_controls(self, response: str) -> list[dict]:
        """Extract ```controls JSON blocks from response."""
        controls = []
        if "```controls" not in response:
            return controls
        parts = response.split("```controls")
        for part in parts[1:]:
            end = part.find("```")
            if end != -1:
                try:
                    controls.extend(json.loads(part[:end].strip()))
                except json.JSONDecodeError:
                    # Malformed controls JSON is dropped silently.
                    pass
        return controls

    def _strip_blocks(self, response: str) -> str:
        """Remove code and control blocks, return plain text."""
        text = re.sub(r'```(?:python|py|controls).*?```', '', response, flags=re.DOTALL)
        return text.strip()

    async def process(self, command: Command, history: list[dict], memory_context: str = "") -> ThoughtResult:
        """One reasoning step: LLM call, optional tool round-trip, controls."""
        await self.hud("thinking", detail="reasoning about response")
        messages = [
            {"role": "system", "content": self.SYSTEM.format(memory_context=memory_context)},
        ]
        for msg in history[-12:]:
            messages.append(msg)
        messages.append({"role": "system", "content": f"Input perception: {command.instruction}"})
        messages = self.trim_context(messages)
        await self.hud("context", messages=messages, tokens=self.last_context_tokens,
                       max_tokens=self.max_context_tokens, fill_pct=self.context_fill_pct)
        response = await llm_call(self.model, messages)
        log.info(f"[thinker] response: {response[:200]}")
        controls = self._parse_controls(response)
        if controls:
            await self.hud("controls", controls=controls)
        tool_call = self._parse_tool_call(response)
        if tool_call:
            tool_name, code = tool_call
            if self.pm and tool_name == "python":
                proc = await self.pm.execute(tool_name, code)
                tool_output = "\n".join(proc.output_lines)
            else:
                tool_output = f"[unknown tool: {tool_name}]"
            log.info(f"[thinker] tool output: {tool_output[:200]}")
            # Second LLM pass: let the model phrase a reply around the output.
            messages.append({"role": "assistant", "content": response})
            messages.append({"role": "system", "content": f"Tool output:\n{tool_output}"})
            messages.append({"role": "user", "content": "Respond to the user based on the tool output. If showing data, include a ```controls block with a table. Be natural and concise."})
            messages = self.trim_context(messages)
            final = await llm_call(self.model, messages)
            more_controls = self._parse_controls(final)
            if more_controls:
                controls.extend(more_controls)
                await self.hud("controls", controls=more_controls)
            clean_text = self._strip_blocks(final)
            await self.hud("decided", instruction=clean_text[:200])
            return ThoughtResult(response=clean_text, tool_used=tool_name,
                                 tool_output=tool_output, controls=controls)
        clean_text = self._strip_blocks(response) or response
        await self.hud("decided", instruction="direct response (no tools)")
        return ThoughtResult(response=clean_text, controls=controls)

104
agent/process.py Normal file
View File

@ -0,0 +1,104 @@
"""Process Manager: observable tool execution via subprocess."""
import asyncio
import os
import subprocess
import sys
import tempfile
import time
class Process:
    """A single observable tool execution."""

    # Monotonically increasing id shared across all Process instances.
    _next_id = 0

    def __init__(self, tool: str, code: str, send_hud):
        Process._next_id += 1
        self.pid = Process._next_id
        self.tool = tool
        self.code = code
        self.send_hud = send_hud
        self.status = "pending"  # pending -> running -> done/failed/cancelled
        self.output_lines: list[str] = []
        self.exit_code: int | None = None
        self.started_at: float = 0
        self.ended_at: float = 0
        self._subprocess: subprocess.Popen | None = None

    async def hud(self, event: str, **data):
        """Emit a HUD event describing this process."""
        await self.send_hud({"node": "process", "event": event, "pid": self.pid,
                             "tool": self.tool, "status": self.status, **data})

    def run_sync(self) -> str:
        """Execute the tool synchronously. Returns output.

        Writes the code to a temp file and runs it with the current
        interpreter, capturing stdout/stderr with a 10s timeout.

        Fixes over the previous version: the temp script is always removed
        (it leaked before), the file is closed before spawning, a killed
        child is reaped, and `sys.executable` replaces the hardcoded
        'python3' so venvs/Windows work.
        """
        self.status = "running"
        self.started_at = time.time()
        script_path = None
        try:
            with tempfile.NamedTemporaryFile(mode='w', suffix='.py', delete=False, encoding='utf-8') as f:
                f.write(self.code)
                script_path = f.name
            self._subprocess = subprocess.Popen(
                [sys.executable, script_path],
                stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                text=True, cwd=tempfile.gettempdir()
            )
            stdout, stderr = self._subprocess.communicate(timeout=10)
            self.exit_code = self._subprocess.returncode
            if stdout:
                self.output_lines.extend(stdout.strip().split("\n"))
            if self.exit_code != 0 and stderr:
                self.output_lines.append(f"[stderr: {stderr.strip()}]")
            self.status = "done" if self.exit_code == 0 else "failed"
        except subprocess.TimeoutExpired:
            if self._subprocess:
                self._subprocess.kill()
                # Reap the killed child so it doesn't linger as a zombie.
                self._subprocess.communicate()
            self.output_lines.append("[error: timed out after 10s]")
            self.status = "failed"
            self.exit_code = -1
        except Exception as e:
            self.output_lines.append(f"[error: {e}]")
            self.status = "failed"
            self.exit_code = -1
        finally:
            self.ended_at = time.time()
            # Best-effort cleanup of the temp script.
            if script_path is not None:
                try:
                    os.unlink(script_path)
                except OSError:
                    pass
        return "\n".join(self.output_lines) or "[no output]"

    def cancel(self):
        """Kill a running subprocess and mark this process cancelled."""
        if self._subprocess and self.status == "running":
            self._subprocess.kill()
            self.status = "cancelled"
            self.ended_at = time.time()
            self.output_lines.append("[cancelled by user]")
class ProcessManager:
    """Manages all tool executions as observable processes.

    Keeps every Process (live or finished) in `self.processes`, keyed by
    pid, so the HUD can list and cancel them.
    """

    def __init__(self, send_hud):
        self.send_hud = send_hud  # async HUD event sink, handed to each Process
        self.processes: dict[int, Process] = {}

    async def execute(self, tool: str, code: str) -> Process:
        """Create and run a process. Returns the completed Process.

        The blocking run_sync() is offloaded to the default executor so the
        event loop stays responsive while the tool runs.
        """
        proc = Process(tool, code, self.send_hud)
        self.processes[proc.pid] = proc
        await proc.hud("process_start", code=code[:200])
        # Fix: get_event_loop() inside a coroutine is deprecated since 3.10;
        # get_running_loop() is the correct call here.
        loop = asyncio.get_running_loop()
        output = await loop.run_in_executor(None, proc.run_sync)
        elapsed = round(proc.ended_at - proc.started_at, 2)
        await proc.hud("process_done", exit_code=proc.exit_code,
                       output=output[:500], elapsed=elapsed)
        return proc

    def cancel(self, pid: int) -> bool:
        """Cancel the process with `pid`. Returns True if it was known."""
        proc = self.processes.get(pid)
        if proc:
            proc.cancel()
            return True
        return False

    def get_status(self) -> list[dict]:
        """Snapshot of all processes: pid, tool, status, elapsed seconds."""
        return [{"pid": p.pid, "tool": p.tool, "status": p.status,
                 "elapsed": round((p.ended_at or time.time()) - p.started_at, 2) if p.started_at else 0}
                for p in self.processes.values()]

98
agent/runtime.py Normal file
View File

@ -0,0 +1,98 @@
"""Runtime: wires all nodes together into a processing pipeline."""
import json
import logging
import time
from pathlib import Path
from typing import Callable
from fastapi import WebSocket
from .types import Envelope, Command
from .process import ProcessManager
from .nodes import SensorNode, InputNode, OutputNode, ThinkerNode, MemorizerNode
log = logging.getLogger("runtime")
TRACE_FILE = Path(__file__).parent.parent / "trace.jsonl"
class Runtime:
    """Per-connection pipeline: wires all nodes together.

    Owns one WebSocket plus the node instances (sensor, input, thinker,
    output, memorizer), the shared ProcessManager, and a rolling chat
    history capped at MAX_HISTORY entries.
    """
    def __init__(self, ws: WebSocket, user_claims: dict | None = None, origin: str = "",
                 broadcast: Callable | None = None):
        self.ws = ws
        # Rolling chat history of {"role", "content"} dicts; trimmed after each turn.
        self.history: list[dict] = []
        self.MAX_HISTORY = 40
        # No-op fallback so _send_hud can call the broadcaster unconditionally.
        self._broadcast = broadcast or (lambda e: None)
        self.input_node = InputNode(send_hud=self._send_hud)
        self.process_manager = ProcessManager(send_hud=self._send_hud)
        self.thinker = ThinkerNode(send_hud=self._send_hud, process_manager=self.process_manager)
        self.output_node = OutputNode(send_hud=self._send_hud)
        self.memorizer = MemorizerNode(send_hud=self._send_hud)
        self.sensor = SensorNode(send_hud=self._send_hud)
        self.sensor.start(get_memo_state=lambda: self.memorizer.state)
        claims = user_claims or {}
        log.info(f"[runtime] user_claims: {claims}")
        # Prefer the human-readable OIDC claims, in decreasing specificity.
        self.identity = claims.get("name") or claims.get("preferred_username") or claims.get("username") or "unknown"
        log.info(f"[runtime] resolved identity: {self.identity}")
        self.channel = origin or "unknown"
        # Seed the memorizer's state so prompts know who/where the user is.
        self.memorizer.state["user_name"] = self.identity
        self.memorizer.state["situation"] = f"authenticated on {self.channel}" if origin else "local session"
    async def _send_hud(self, data: dict):
        """Send a HUD event to this client, append it to trace.jsonl, and
        fan it out to the trace broadcaster.

        Trace file is rotated in place: once it exceeds ~500 KB it is
        rewritten keeping only the last 500 lines.
        """
        await self.ws.send_text(json.dumps({"type": "hud", **data}))
        # Timestamp with millisecond suffix, e.g. "2026-03-28 01:36:41.123".
        trace_entry = {"ts": time.strftime("%Y-%m-%d %H:%M:%S.") + f"{time.time() % 1:.3f}"[2:], **data}
        try:
            with open(TRACE_FILE, "a", encoding="utf-8") as f:
                f.write(json.dumps(trace_entry, ensure_ascii=False) + "\n")
            if TRACE_FILE.exists() and TRACE_FILE.stat().st_size > 500_000:
                lines = TRACE_FILE.read_text(encoding="utf-8").strip().split("\n")
                TRACE_FILE.write_text("\n".join(lines[-500:]) + "\n", encoding="utf-8")
        except Exception as e:
            # Tracing is best-effort: never let it break the HUD stream.
            log.error(f"trace write error: {e}")
        self._broadcast(trace_entry)
    async def handle_message(self, text: str):
        """Run one user message through the full pipeline:
        sensor context -> input -> thinker (optional tool) -> output,
        then update the memorizer and trim history.
        """
        # NOTE(review): user_id/session_id are hard-coded placeholders —
        # presumably these should come from claims/session; confirm.
        envelope = Envelope(
            text=text,
            user_id="nico",
            session_id="test",
            timestamp=time.strftime("%Y-%m-%d %H:%M:%S"),
        )
        self.sensor.note_user_activity()
        self.history.append({"role": "user", "content": text})
        sensor_lines = self.sensor.get_context_lines()
        mem_ctx = self.memorizer.get_context_block(sensor_lines=sensor_lines)
        command = await self.input_node.process(
            envelope, self.history, memory_context=mem_ctx,
            identity=self.identity, channel=self.channel)
        thought = await self.thinker.process(command, self.history, memory_context=mem_ctx)
        # Re-wrap the thinker's result as a Command for the output node,
        # preserving the original source text either way.
        if thought.tool_used:
            command = Command(
                instruction=f"Thinker used {thought.tool_used} and says: {thought.response}",
                source_text=command.source_text
            )
        else:
            command = Command(
                instruction=f"Thinker says: {thought.response}",
                source_text=command.source_text
            )
        response = await self.output_node.process(command, self.history, self.ws, memory_context=mem_ctx)
        self.history.append({"role": "assistant", "content": response})
        if thought.controls:
            await self.ws.send_text(json.dumps({"type": "controls", "controls": thought.controls}))
        await self.memorizer.update(self.history)
        if len(self.history) > self.MAX_HISTORY:
            self.history = self.history[-self.MAX_HISTORY:]

29
agent/types.py Normal file
View File

@ -0,0 +1,29 @@
"""Message types flowing between nodes."""
from dataclasses import dataclass, field
@dataclass
class Envelope:
    """What flows between nodes."""
    # Raw user message text.
    text: str
    # Sender identifier; "anon" when unauthenticated.
    user_id: str = "anon"
    # Conversation/session identifier; empty when not tracked.
    session_id: str = ""
    # Wall-clock time string, "%Y-%m-%d %H:%M:%S" format (set by the caller).
    timestamp: str = ""
@dataclass
class Command:
    """Input node's perception — describes what was heard."""
    # Natural-language instruction derived from the user's message.
    instruction: str
    # The verbatim user text the instruction was derived from.
    source_text: str
    # Optional extra context attached by the producing node.
    metadata: dict = field(default_factory=dict)
@dataclass
class ThoughtResult:
    """Thinker node's output — either a direct answer or tool results."""
    # The thinker's textual answer.
    response: str
    # Name of the tool invoked, or empty string when none was used.
    tool_used: str = ""
    # Raw output captured from the tool run (empty if no tool).
    tool_output: str = ""
    # UI control descriptors to push to the client, if any.
    controls: list = field(default_factory=list)