Changed STT to Parakeet — still experimental, though performance seems to be better

This commit is contained in:
2026-01-18 03:35:50 +02:00
parent 50e4f7a5f2
commit 0a8910fff8
10 changed files with 375 additions and 37 deletions

View File

@@ -6,7 +6,7 @@ uvicorn[standard]==0.32.1
websockets==14.1
aiohttp==3.11.11
# Audio processing
# Audio processing (install numpy first for sox dependency)
numpy==2.2.2
soundfile==0.12.1
librosa==0.10.2.post1
@@ -16,9 +16,12 @@ torch==2.9.1 # Latest PyTorch
torchaudio==2.9.1
silero-vad==5.1.2
# STT (GPU)
faster-whisper==1.2.1 # Latest version (Oct 31, 2025)
ctranslate2==4.5.0 # Required by faster-whisper
# STT (GPU) - NVIDIA NeMo for Parakeet
# Parakeet TDT 0.6b-v3 requires NeMo 2.4
# Fix huggingface-hub version conflict with transformers
huggingface-hub>=0.30.0,<1.0
nemo_toolkit[asr]==2.4.0
omegaconf==2.3.0
# Utilities
python-multipart==0.0.20