feat(mana-ai): first live reminder producers — token budget + retry-loop

Wires the M1 reminderChannel into the mana-ai mission runner with two
initial producers in services/mana-ai/src/planner/reminders.ts:

- tokenBudgetReminder — warns at 75% of the agent's daily cap, emits a
  stronger "wrap up NOW" message at/above 100%. Uses pretick usage +
  accumulated round usage so the warning tracks drift during a long plan.
- retryLoopReminder — shape is in place (round≥3 + last 2 failures),
  currently limited to the single lastCall LoopState exposes. Extends
  cleanly once LoopState carries the full failure window.

buildReminderChannel composes active producers; the tick hoists
pretickUsage24h so the channel has the baseline. Each round the loop
re-evaluates the producers, so usage drift across rounds surfaces on the
NEXT turn.

Also exports LoopState + ReminderChannel from @mana/shared-ai top-level so
consumers don't need to reach into /planner.

Tests: 13 new bun tests covering thresholds, pretick+round summing,
composition, and per-round re-evaluation.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-28 13:37:44 +02:00 · 2026-04-23 14:00:04 +02:00 · 2026-04-23 14:00:04 +02:00 · faa472be91
commit faa472be91
parent e5d230e599
4 changed files with 330 additions and 4 deletions
--- a/services/mana-ai/src/cron/tick.ts
+++ b/services/mana-ai/src/cron/tick.ts
@ -50,6 +50,7 @@ import {
 import { unwrapMissionGrant } from '../crypto/unwrap-grant';
 import { detectInjectionMarker } from '@mana/tool-registry';
 import { NewsResearchClient } from '../planner/news-research-client';
+import { buildReminderChannel } from '../planner/reminders';
 import { ManaResearchClient, type DeepResearchProvider } from '../clients/mana-research';
 import {
 	deletePendingResearchJob,
@ -192,6 +193,12 @@ export async function runTickOnce(config: Config): Promise<TickStats> {
 				agentDecisionsTotal.inc({ decision: 'skipped-paused' });
 				continue;
 			}
+			// Pretick token usage is surfaced to the reminder channel so the
+			// planner sees a warning as it approaches the cap, rather than
+			// getting cut off without explanation. Stays 0 when there is no
+			// agent, the agent has no cap, or the query fails (reminder
+			// becomes a no-op for that mission).
+			let pretickUsage24h = 0;
 			if (agent) {
 				const used = activeRuns.get(agent.id) ?? 0;
 				if (used >= agent.maxConcurrentMissions) {
@ -200,8 +207,8 @@ export async function runTickOnce(config: Config): Promise<TickStats> {
 				}
 				// Budget enforcement: check rolling 24h token usage.
 				if (agent.maxTokensPerDay != null && agent.maxTokensPerDay >= 0) {
-					const windowUsage = await getAgentTokenUsage24h(sql, m.userId, agent.id);
-					if (windowUsage >= agent.maxTokensPerDay) {
+					pretickUsage24h = await getAgentTokenUsage24h(sql, m.userId, agent.id);
+					if (pretickUsage24h >= agent.maxTokensPerDay) {
 						agentDecisionsTotal.inc({ decision: 'skipped-budget' });
 						continue;
 					}
@ -219,7 +226,7 @@ export async function runTickOnce(config: Config): Promise<TickStats> {
 						'agent.id': agent?.id ?? 'legacy',
 						'agent.name': agent?.name ?? 'Mana',
 					},
-					() => planOneMission(m, llm, sql, agent, config)
+					() => planOneMission(m, llm, sql, agent, config, pretickUsage24h)
 				);
 				if (planResult.outcome === 'skipped') {
 					// Deep-research job still running — pick this mission
@ -309,7 +316,8 @@ async function planOneMission(
 	llm: ReturnType<typeof createServerLlmClient>,
 	sql: Sql,
 	agent: ServerAgent | null,
-	config: Config
+	config: Config,
+	pretickUsage24h: number
 ): Promise<PlanMissionOutcome> {
 	const mission = serverMissionToSharedMission(m);
 	// Resolve the mission's Key-Grant (if any) once per tick. An absent
@ -371,6 +379,17 @@ async function planOneMission(

 	const tools = filterToolsByAgentPolicy(SERVER_TOOLS, agent);

+	// Per-round reminder channel: injects transient hints (token-budget
+	// warnings and a limited retry-loop check today; stale-data signals later)
+	// into the NEXT LLM turn only. See `planner/reminders.ts` for the
+	// individual producers and the Claude-Code <system-reminder>
+	// rationale.
+	const reminderChannel = buildReminderChannel({
+		agent,
+		mission: m,
+		pretickUsage24h,
+	});
+
 	try {
 		const loopResult = await runPlannerLoop({
 			llm,
@ -379,6 +398,7 @@ async function planOneMission(
 				userPrompt,
 				tools,
 				model: 'google/gemini-2.5-flash',
+				reminderChannel,
 			},
 			// Server-side onToolCall: no execution, just acknowledge.
 			// The captured call lands in loopResult.executedCalls and