feat(personas): M3.b-d — tick loop + Claude Agent SDK + persistence (real)

Previous commit 38dc80654 carries this M3 title but its payload is an unrelated apps/api/picture change — shared-.git-index race with a parallel session (see feedback_git_workflow.md). This commit holds the actual M3.b/c/d code. Leaving the misnamed commit for the user to re-attribute / revert as they prefer. Closes the M3 loop from docs/plans/mana-mcp-and-personas.md. The runner picks up due personas, drives each through Claude + MCP for one simulated turn, collects actions + ratings, persists through service-key internal endpoints in mana-auth. Internal endpoints (mana-auth, service-key-gated) - GET /api/v1/internal/personas/due Returns personas whose tickCadence + lastActiveAt say they're due. Rules: hourly > 1h, daily > 24h, weekdays > 24h mon-fri. NULLS FIRST so never-run personas go ahead of stale ones. - POST /api/v1/internal/personas/:id/actions Batch ≤ 500. Row ids are deterministic `${tickId}-${i}-${toolName}` + ON CONFLICT DO NOTHING so the runner can retry a tick without doubling audit rows. Also bumps personas.last_active_at so the next /due call sees it. - POST /api/v1/internal/personas/:id/feedback Batch ≤ 100. Row id is `${tickId}-${module}` — natural key is one rating per module per tick. Runner tick pipeline (services/mana-persona-runner/src/runner/) - claude-session.ts Two phases per tick. runMainTurn feeds the persona's system prompt + a German "simulate a day" user prompt to Claude Agent SDK's query(), with mana-mcp wired in as a streamable-HTTP MCP server. We iterate the returned AsyncGenerator and extract tool_use blocks into ActionRows; a tool_result with is_error=true flips the most recent action. runRatingTurn is a fresh query() with tools:[] asking Claude in character to rate each used module 1-5 as strict JSON. We parse with tolerance for whitespace / fences. Unparseable output becomes a synthetic '__parse' feedback row so operators see the failure. - tick.ts Orchestrator. Skips when config.paused. 
Fetches /due, processes in batches of config.concurrency via Promise.allSettled so a single persona failure never kills the batch. Returns {due, ranSuccessfully, failed[], durationMs}. - types.ts ActionRow + FeedbackRow shapes shared between claude-session and the internal client. Runner bootstrap (src/index.ts) - setInterval(config.tickIntervalMs) starts the tick loop on boot. tickInFlight guards against overlap when Claude latency > interval. If MANA_SERVICE_KEY or ANTHROPIC_API_KEY is missing, loop is disabled with a warn line — /health + /diag/login still work. - POST /diag/tick (dev-only) fires one tick on demand, returns the result. Avoids waiting a full interval during testing. - Graceful SIGTERM/SIGINT shutdown clears the interval. Client - clients/mana-auth-internal.ts X-Service-Key client for the three endpoints above. Constructor throws on empty serviceKey — fail loud. Boot smoke verified: /health returns ok, /diag/tick 500s with descriptive messages when keys absent. Warning lines on boot when keys are missing. Type-check green across mana-auth, tool-registry, mcp, persona-runner. M3 exit gate is the end-to-end smoke recipe (docker up → db:push → seed:personas → diag/tick → psql) documented in services/mana-persona-runner/CLAUDE.md. M2.d (cross-space family/team memberships) still deferred. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-23 17:46:42 +02:00 · 2026-04-23 14:18:31 +02:00 · 2026-04-23 14:18:31 +02:00 · f07eae3c01
commit f07eae3c01
parent 38dc806549
9 changed files with 883 additions and 18 deletions
--- a/services/mana-auth/src/index.ts
+++ b/services/mana-auth/src/index.ts
@ -29,6 +29,7 @@ import { createAiMissionGrantRoutes } from './routes/ai-mission-grant';
 import { createSettingsRoutes } from './routes/settings';
 import { createAdminRoutes } from './routes/admin';
 import { createAdminPersonasRoutes } from './routes/admin-personas';
+import { createInternalPersonasRoutes } from './routes/internal-personas';

 // ─── Bootstrap ──────────────────────────────────────────────

@ -126,6 +127,8 @@ app.route('/api/v1/admin/personas', createAdminPersonasRoutes(db, auth));

 app.use('/api/v1/internal/*', serviceAuth(config.serviceKey));

+app.route('/api/v1/internal/personas', createInternalPersonasRoutes(db));
+
 app.get('/api/v1/internal/org/:orgId/member/:userId', async (c) => {
 	const { orgId, userId } = c.req.param();
 	const { members } = await import('./db/schema/organizations');
--- a/services/mana-auth/src/routes/internal-personas.ts
+++ b/services/mana-auth/src/routes/internal-personas.ts
@ -0,0 +1,234 @@
+/**
+ * Internal endpoints for the persona-runner (M3.c).
+ *
+ * Service-to-service — gated by `X-Service-Key` at the app level (see
+ * `app.use('/api/v1/internal/*', serviceAuth(...))` in index.ts).
+ *
+ * One read endpoint and two write endpoints:
+ *   GET  /api/v1/internal/personas/due            personas due for a tick
+ *   POST /api/v1/internal/personas/:id/actions    batch of tool-call rows
+ *   POST /api/v1/internal/personas/:id/feedback   batch of rating rows
+ *
+ * Both write endpoints are **append-only** and **idempotent by (tickId +
+ * some natural key)** — the runner can retry a failed batch without
+ * doubling rows. Only `/actions` bumps `personas.last_active_at`, so the
+ * next tick's "is this persona due?" check sees the activity; `/feedback`
+ * does not touch it.
+ */
+
+import { Hono } from 'hono';
+import { and, eq, isNull, lte, or, sql } from 'drizzle-orm';
+import type { PostgresJsDatabase } from 'drizzle-orm/postgres-js';
+import { users } from '../db/schema/auth';
+import { personas, personaActions, personaFeedback } from '../db/schema/personas';
+
+// ─── Input shapes (no zod dependency here — minimal sanity checks) ────
+
+/**
+ * One tool-call record as posted in the `actions` array of
+ * `POST /:id/actions`. Optional fields are persisted as `null` when the
+ * sender leaves them out.
+ */
+interface ActionRow {
+	/** Tick identifier; becomes part of the derived row id and is stored on the row. */
+	tickId: string;
+	/** Name of the tool that was called; also part of the derived row id. */
+	toolName: string;
+	/** Optional hash of the tool input — the hashing scheme is chosen by the sender and is not visible here. */
+	inputHash?: string;
+	/** Outcome of the call. */
+	result: 'ok' | 'error';
+	/** Optional error text accompanying the row. */
+	errorMessage?: string;
+	/** Optional latency of the call — presumably milliseconds, per the name; confirm with the sender. */
+	latencyMs?: number;
+}
+
+/**
+ * One module rating as posted in the `feedback` array of
+ * `POST /:id/feedback`.
+ */
+interface FeedbackRow {
+	/** Tick identifier; combined with `module` to derive the row id. */
+	tickId: string;
+	/** Name of the rated module; combined with `tickId` to derive the row id. */
+	module: string;
+	/** Rating on a 1–5 scale. */
+	rating: 1 | 2 | 3 | 4 | 5;
+	/** Optional free-text notes; persisted as `null` when omitted. */
+	notes?: string;
+}
+
+/**
+ * Runtime guard for one element of the `actions` batch.
+ *
+ * Requires a string `tickId`, a string `toolName` and a `result` of
+ * `'ok'` or `'error'`. The optional fields (`inputHash`, `errorMessage`,
+ * `latencyMs`) may be omitted or `null`, but when present they must have
+ * the declared type — otherwise a wrongly-typed value would satisfy the
+ * guard and flow into the insert unchecked.
+ *
+ * @param row - Untrusted value taken from the parsed request body.
+ * @returns `true` when `row` can safely be treated as an `ActionRow`.
+ */
+function isValidAction(row: unknown): row is ActionRow {
+	if (!row || typeof row !== 'object') return false;
+	const r = row as Record<string, unknown>;
+	// `null` is tolerated as "absent": the handler normalises missing
+	// optionals with `?? null`, so an explicit null is harmless.
+	const isAbsent = (value: unknown): boolean => value === undefined || value === null;
+	return (
+		typeof r.tickId === 'string' &&
+		typeof r.toolName === 'string' &&
+		(r.result === 'ok' || r.result === 'error') &&
+		(isAbsent(r.inputHash) || typeof r.inputHash === 'string') &&
+		(isAbsent(r.errorMessage) || typeof r.errorMessage === 'string') &&
+		(isAbsent(r.latencyMs) || (typeof r.latencyMs === 'number' && Number.isFinite(r.latencyMs)))
+	);
+}
+
+/**
+ * Runtime guard for one element of the `feedback` batch.
+ *
+ * Requires a string `tickId`, a string `module` and an **integer**
+ * `rating` between 1 and 5 inclusive — the declared type is the literal
+ * union `1 | 2 | 3 | 4 | 5`, so a fractional value such as 2.5 must not
+ * pass. `notes` may be omitted or `null`, but must be a string when
+ * present.
+ *
+ * @param row - Untrusted value taken from the parsed request body.
+ * @returns `true` when `row` can safely be treated as a `FeedbackRow`.
+ */
+function isValidFeedback(row: unknown): row is FeedbackRow {
+	if (!row || typeof row !== 'object') return false;
+	const r = row as Record<string, unknown>;
+	return (
+		typeof r.tickId === 'string' &&
+		typeof r.module === 'string' &&
+		typeof r.rating === 'number' &&
+		Number.isInteger(r.rating) &&
+		r.rating >= 1 &&
+		r.rating <= 5 &&
+		// The handler stores a missing note as null, so null counts as absent.
+		(r.notes === undefined || r.notes === null || typeof r.notes === 'string')
+	);
+}
+
+export function createInternalPersonasRoutes(db: PostgresJsDatabase<any>) {
+	const app = new Hono();
+
+	// Existence check used by the `/:id/*` write routes: resolves to
+	// true when a `personas` row with this `userId` exists. It lets a
+	// handler answer an unknown or deleted persona with a clean 404
+	// instead of leaving the failure to surface from the insert itself.
+	async function requirePersona(personaId: string): Promise<boolean> {
+		const matches = await db
+			.select({ userId: personas.userId })
+			.from(personas)
+			.where(eq(personas.userId, personaId));
+		return matches.length > 0;
+	}
+
+	// ─── GET /api/v1/internal/personas/due ──────────────────────────
+	//
+	// Lists the personas the runner should tick right now. A persona is
+	// due when it has never run (`lastActiveAt` IS NULL) or when its
+	// `lastActiveAt` is at or before the cutoff for its `tickCadence`:
+	//
+	//   hourly   — cutoff is one hour before now
+	//   daily    — cutoff is 24 hours before now
+	//   weekdays — daily cutoff, and only while the UTC day is Mon–Fri
+	//
+	// Personas whose user row is soft-deleted (users.deletedAt set) are
+	// left out. Never-run personas are listed first.
+
+	app.get('/due', async (c) => {
+		const HOUR_MS = 60 * 60 * 1000;
+		const now = new Date();
+		const nowMs = now.getTime();
+		const hourCutoff = new Date(nowMs - HOUR_MS);
+		const dayCutoff = new Date(nowMs - 24 * HOUR_MS);
+
+		// getUTCDay(): 0 = Sunday … 6 = Saturday.
+		const utcDay = now.getUTCDay();
+		const isWeekday = utcDay >= 1 && utcDay <= 5;
+
+		// "Never ran, or last ran at/before the cutoff."
+		const staleSince = (cutoff: Date) =>
+			or(isNull(personas.lastActiveAt), lte(personas.lastActiveAt, cutoff));
+
+		// One clause per cadence; the weekdays clause only takes part in
+		// the query on Mon–Fri.
+		const cadenceClauses = [
+			and(eq(personas.tickCadence, 'hourly'), staleSince(hourCutoff)),
+			and(eq(personas.tickCadence, 'daily'), staleSince(dayCutoff)),
+		];
+		if (isWeekday) {
+			cadenceClauses.push(and(eq(personas.tickCadence, 'weekdays'), staleSince(dayCutoff)));
+		}
+		const dueClauses = cadenceClauses.filter(
+			(clause): clause is NonNullable<typeof clause> => !!clause
+		);
+
+		const duePersonas = await db
+			.select({
+				userId: personas.userId,
+				email: users.email,
+				archetype: personas.archetype,
+				systemPrompt: personas.systemPrompt,
+				moduleMix: personas.moduleMix,
+				tickCadence: personas.tickCadence,
+				lastActiveAt: personas.lastActiveAt,
+			})
+			.from(personas)
+			.innerJoin(users, eq(users.id, personas.userId))
+			.where(and(isNull(users.deletedAt), or(...dueClauses)))
+			.orderBy(sql`${personas.lastActiveAt} NULLS FIRST`);
+
+		return c.json({ personas: duePersonas, serverTime: now.toISOString() });
+	});
+
+	// ─── POST /api/v1/internal/personas/:id/actions ──────────────────
+	//
+	// Appends a batch of 1–500 tool-call rows for one persona, then
+	// stamps that persona's `lastActiveAt`. Answers 404 for an unknown
+	// persona and 400 for unparseable JSON or a batch that is missing,
+	// empty, oversized or contains an invalid row.
+
+	app.post('/:id/actions', async (c) => {
+		const personaId = c.req.param('id');
+		const personaExists = await requirePersona(personaId);
+		if (!personaExists) {
+			return c.json({ error: 'Persona not found' }, 404);
+		}
+
+		let payload: unknown;
+		try {
+			payload = await c.req.json();
+		} catch {
+			return c.json({ error: 'Invalid JSON' }, 400);
+		}
+
+		const batch = (payload as { actions?: unknown[] })?.actions;
+		if (!Array.isArray(batch) || batch.length === 0) {
+			return c.json({ error: '`actions` array required' }, 400);
+		}
+		if (batch.length > 500) {
+			return c.json({ error: '`actions` batch size must be ≤ 500' }, 400);
+		}
+		if (!batch.every(isValidAction)) {
+			return c.json({ error: 'One or more action rows failed validation' }, 400);
+		}
+
+		const stampedAt = new Date();
+		const rows = batch.map((action, position) => {
+			// The id is derived from (tickId, position in this request's
+			// array, toolName), capped at 255 chars, so re-sending the
+			// same batch maps onto the same ids and is dropped by
+			// ON CONFLICT DO NOTHING. A random UUID would mint fresh
+			// ids on every retry and defeat that dedupe.
+			// NOTE(review): the id carries neither the persona id nor a
+			// cross-request offset — confirm tickIds are unique per
+			// persona and that a tick is always sent as a single batch.
+			const rowId = `${action.tickId}-${position}-${action.toolName}`.slice(0, 255);
+			return {
+				id: rowId,
+				personaId,
+				tickId: action.tickId,
+				toolName: action.toolName,
+				inputHash: action.inputHash ?? null,
+				result: action.result,
+				errorMessage: action.errorMessage ?? null,
+				latencyMs: action.latencyMs ?? null,
+				createdAt: stampedAt,
+			};
+		});
+
+		await db.insert(personaActions).values(rows).onConflictDoNothing();
+		// Record the activity so the next /due query sees this persona as fresh.
+		await db
+			.update(personas)
+			.set({ lastActiveAt: stampedAt })
+			.where(eq(personas.userId, personaId));
+
+		// `written` is the number of rows submitted; rows skipped by the
+		// conflict clause are not subtracted.
+		return c.json({ ok: true, written: rows.length });
+	});
+
+	// ─── POST /api/v1/internal/personas/:id/feedback ─────────────────
+	//
+	// Appends a batch of 1–100 module ratings for one persona. Answers
+	// 404 for an unknown persona and 400 for unparseable JSON or a batch
+	// that is missing, empty, oversized or contains an invalid row.
+	// This route does not update the persona's `lastActiveAt`.
+
+	app.post('/:id/feedback', async (c) => {
+		const personaId = c.req.param('id');
+		const personaExists = await requirePersona(personaId);
+		if (!personaExists) {
+			return c.json({ error: 'Persona not found' }, 404);
+		}
+
+		let payload: unknown;
+		try {
+			payload = await c.req.json();
+		} catch {
+			return c.json({ error: 'Invalid JSON' }, 400);
+		}
+
+		const batch = (payload as { feedback?: unknown[] })?.feedback;
+		if (!Array.isArray(batch) || batch.length === 0) {
+			return c.json({ error: '`feedback` array required' }, 400);
+		}
+		if (batch.length > 100) {
+			return c.json({ error: '`feedback` batch size must be ≤ 100' }, 400);
+		}
+		if (!batch.every(isValidFeedback)) {
+			return c.json({ error: 'One or more feedback rows failed validation' }, 400);
+		}
+
+		const stampedAt = new Date();
+		const rows = batch.map((entry) => {
+			// One rating per module per tick: the id is built from
+			// (tickId, module), capped at 255 chars, so a retried batch
+			// collides with its earlier rows and is dropped by
+			// ON CONFLICT DO NOTHING.
+			const rowId = `${entry.tickId}-${entry.module}`.slice(0, 255);
+			return {
+				id: rowId,
+				personaId,
+				tickId: entry.tickId,
+				module: entry.module,
+				rating: entry.rating,
+				notes: entry.notes ?? null,
+				createdAt: stampedAt,
+			};
+		});
+
+		await db.insert(personaFeedback).values(rows).onConflictDoNothing();
+
+		// `written` is the number of rows submitted; rows skipped by the
+		// conflict clause are not subtracted.
+		return c.json({ ok: true, written: rows.length });
+	});
+
+	return app;
+}
+
+// No-op reference to drizzle-orm's `and`.
+// NOTE(review): `and` is already used by the GET /due query builder in
+// this file, so this statement is not needed to keep the import alive
+// and can be dropped.
+void and;