♻️ refactor: migrate bots and chat-backend to mana-llm

Migrate all LLM consumers from direct Ollama calls to the centralized mana-llm service, which exposes an OpenAI-compatible API.

Migrated services:
- matrix-ollama-bot
- telegram-ollama-bot
- chat-backend
- telegram-project-doc-bot

New env vars: MANA_LLM_URL, LLM_MODEL, LLM_TIMEOUT
Replaces: OLLAMA_URL, OLLAMA_MODEL, OLLAMA_TIMEOUT
2026-05-22 16:46:42 +02:00 · 2026-01-29 22:56:26 +01:00 · 2026-01-29 22:56:26 +01:00 · 384244fe50
commit 384244fe50
parent 7b2ac78032
11 changed files with 300 additions and 204 deletions
--- a/services/telegram-project-doc-bot/src/config/configuration.ts
+++ b/services/telegram-project-doc-bot/src/config/configuration.ts
@ -26,10 +26,10 @@ export default () => ({
 		model: process.env.STT_MODEL || 'whisper', // 'whisper' or 'voxtral'
 	},
 	llm: {
-		provider: process.env.LLM_PROVIDER || 'ollama',
-		ollama: {
-			url: process.env.OLLAMA_URL || 'http://localhost:11434',
-			model: process.env.OLLAMA_MODEL || 'gemma3:4b',
+		provider: process.env.LLM_PROVIDER || 'mana-llm',
+		manaLlm: {
+			url: process.env.MANA_LLM_URL || 'http://localhost:3025',
+			model: process.env.LLM_MODEL || 'ollama/gemma3:4b',
 		},
 	},
 });
--- a/services/telegram-project-doc-bot/src/generation/generation.service.ts
+++ b/services/telegram-project-doc-bot/src/generation/generation.service.ts
@ -14,8 +14,8 @@ type BlogStyle = keyof typeof BLOG_STYLES;
 export class GenerationService {
 	private readonly logger = new Logger(GenerationService.name);
 	private readonly llmProvider: string;
-	private readonly ollamaUrl: string;
-	private readonly ollamaModel: string;
+	private readonly manaLlmUrl: string;
+	private readonly manaLlmModel: string;
 	private readonly openai: OpenAI | null;

 	constructor(
@ -23,9 +23,10 @@ export class GenerationService {
 		private db: PostgresJsDatabase<typeof schema>,
 		private configService: ConfigService
 	) {
-		this.llmProvider = this.configService.get<string>('llm.provider') || 'ollama';
-		this.ollamaUrl = this.configService.get<string>('llm.ollama.url') || 'http://localhost:11434';
-		this.ollamaModel = this.configService.get<string>('llm.ollama.model') || 'gemma3:4b';
+		this.llmProvider = this.configService.get<string>('llm.provider') || 'mana-llm';
+		this.manaLlmUrl = this.configService.get<string>('llm.manaLlm.url') || 'http://localhost:3025';
+		this.manaLlmModel =
+			this.configService.get<string>('llm.manaLlm.model') || 'ollama/gemma3:4b';

 		const apiKey = this.configService.get<string>('openai.apiKey');
 		this.openai = apiKey ? new OpenAI({ apiKey }) : null;
@ -148,7 +149,7 @@ Beginne direkt mit dem Blogbeitrag (ohne Einleitung wie "Hier ist der Blogbeitra
 			return this.callOpenAI(prompt);
 		}

-		return this.callOllama(prompt);
+		return this.callManaLlm(prompt);
 	}

 	private async callOpenAI(prompt: string): Promise<string> {
@ -166,24 +167,27 @@ Beginne direkt mit dem Blogbeitrag (ohne Einleitung wie "Hier ist der Blogbeitra
 		return response.choices[0]?.message?.content || '';
 	}

-	private async callOllama(prompt: string): Promise<string> {
-		const response = await fetch(`${this.ollamaUrl}/api/generate`, {
+	private async callManaLlm(prompt: string): Promise<string> {
+		const response = await fetch(`${this.manaLlmUrl}/v1/chat/completions`, {
 			method: 'POST',
 			headers: { 'Content-Type': 'application/json' },
 			body: JSON.stringify({
-				model: this.ollamaModel,
-				prompt,
+				model: this.manaLlmModel,
+				messages: [{ role: 'user', content: prompt }],
+				temperature: 0.7,
+				max_tokens: 4000,
 				stream: false,
 			}),
 			signal: AbortSignal.timeout(180000), // 3 minutes timeout
 		});

 		if (!response.ok) {
-			throw new Error(`Ollama API error: ${response.status}`);
+			const errorText = await response.text();
+			throw new Error(`mana-llm API error: ${response.status} - ${errorText}`);
 		}

 		const data = await response.json();
-		return data.response || '';
+		return data.choices?.[0]?.message?.content || '';
 	}

 	async getLatestGeneration(projectId: string): Promise<Generation | undefined> {