mirror of
https://github.com/Memo-2023/mana-monorepo.git
synced 2026-05-20 07:03:36 +02:00
mana-stt: add WhisperX service with CUDA GPU support, speaker diarization, and auto-fallback chain. mana-notify: add locale fallback and default templates for task reminders. CD: update deployment pipeline and docker-compose configuration. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
35 lines
893 B
Text
35 lines
893 B
Text
# ManaCore STT Service Dependencies
|
|
# For GPU Server (NVIDIA RTX 3090 / CUDA)
|
|
|
|
# Web Framework
|
|
fastapi==0.115.6
|
|
uvicorn[standard]==0.34.0
|
|
python-multipart==0.0.20
|
|
|
|
# Audio Processing
|
|
pydub==0.25.1
|
|
soundfile==0.13.1
|
|
|
|
# WhisperX (CUDA) — pulls in faster-whisper and adds word-level alignment (unpinned: installs the repository's default branch)
|
|
whisperx @ git+https://github.com/m-bain/whisperX.git
|
|
|
|
# faster-whisper with CTranslate2 (CUDA backend)
|
|
faster-whisper>=1.1.0
|
|
|
|
# Speaker Diarization (pyannote.audio)
|
|
# Requires an HF_TOKEN from a Hugging Face account that has accepted the model terms at:
|
|
# https://huggingface.co/pyannote/speaker-diarization-3.1
|
|
# https://huggingface.co/pyannote/segmentation-3.0
|
|
pyannote.audio>=3.3.0
|
|
|
|
# PyTorch (CUDA build) — install the wheel matching your CUDA version first, so the requirements below are already satisfied:
|
|
# pip install torch torchaudio --index-url https://download.pytorch.org/whl/cu121
|
|
torch>=2.5.0
|
|
torchaudio>=2.5.0
|
|
|
|
# Utilities
|
|
numpy>=1.26.0
|
|
tqdm>=4.67.0
|
|
|
|
# External Auth (mana-core-auth integration)
|
|
httpx>=0.27.0
|