mirror of
https://github.com/Memo-2023/mana-monorepo.git
synced 2026-05-19 11:01:24 +02:00
Python/FastAPI service providing a unified, OpenAI-compatible API for Ollama and cloud LLM providers (OpenRouter, Groq, Together). Features: chat completions with streaming (SSE); vision/multimodal support; embeddings generation; multi-provider routing (provider/model format); Prometheus metrics; optional Redis caching.
22 lines
481 B
Python
22 lines
481 B
Python
"""Pydantic models for OpenAI-compatible API."""
|
|
|
|
from .requests import ChatCompletionRequest, EmbeddingRequest
|
|
from .responses import (
|
|
ChatCompletionResponse,
|
|
ChatCompletionStreamResponse,
|
|
EmbeddingResponse,
|
|
ModelInfo,
|
|
ModelsResponse,
|
|
Usage,
|
|
)
|
|
|
|
# Public surface of this package: the names a star-import exposes.
# Every entry is imported at the top of this module from the sibling
# ``requests`` or ``responses`` module; the list is kept alphabetical.
__all__ = [
    "ChatCompletionRequest",  # from .requests
    "ChatCompletionResponse",  # from .responses
    "ChatCompletionStreamResponse",  # from .responses
    "EmbeddingRequest",  # from .requests
    "EmbeddingResponse",  # from .responses
    "ModelInfo",  # from .responses
    "ModelsResponse",  # from .responses
    "Usage",  # from .responses
]
|