2025-03-01 20:37:52 -05:00
|
|
|
# OBS Recording Transcriber Dependencies
|
2025-07-23 14:45:19 -04:00
|
|
|
# Core dependencies (exact pins where compatibility matters, minimum versions otherwise)
|
2025-01-28 17:00:03 -05:00
|
|
|
streamlit==1.26.0
|
|
|
|
|
moviepy==1.0.3
|
2025-04-30 12:09:10 -04:00
|
|
|
openai-whisper==20231117
|
2025-03-01 20:37:52 -05:00
|
|
|
requests>=2.28.0
|
|
|
|
|
humanize>=4.6.0
|
|
|
|
|
|
2026-01-05 09:57:20 -05:00
|
|
|
# PyTorch ecosystem - updated for SpeechBrain 1.0 compatibility
|
|
|
|
|
# torchaudio >= 2.1.0 is REQUIRED for diarization to work properly
|
2026-01-05 10:50:20 -05:00
|
|
|
# NOTE: For Docker GPU builds, these are installed separately from cu118 index
|
|
|
|
|
torch>=2.1.0
|
|
|
|
|
torchaudio>=2.1.0
|
|
|
|
|
torchvision>=0.16.0
|
2025-03-01 20:37:52 -05:00
|
|
|
|
2025-07-23 14:45:19 -04:00
|
|
|
# Transformers ecosystem - compatible versions
|
2026-01-05 09:57:20 -05:00
|
|
|
transformers==4.35.0
|
|
|
|
|
tokenizers>=0.14.0
|
2025-07-23 14:45:19 -04:00
|
|
|
|
|
|
|
|
# ML dependencies with compatible versions
|
|
|
|
|
numpy==1.24.3
|
|
|
|
|
scipy==1.10.1
|
|
|
|
|
scikit-learn==1.3.0
|
|
|
|
|
|
|
|
|
|
# Audio processing and ML models
|
2026-01-05 09:57:20 -05:00
|
|
|
# Pin speechbrain for stability with pyannote.audio
|
|
|
|
|
speechbrain==1.0.0
|
2025-07-23 14:45:19 -04:00
|
|
|
pyannote.audio==3.1.1
|
2026-01-05 09:57:20 -05:00
|
|
|
pytorch-lightning==2.1.0
|
2025-07-23 14:45:19 -04:00
|
|
|
|
|
|
|
|
# Other dependencies
|
2025-03-01 20:37:52 -05:00
|
|
|
iso639>=0.1.4
|
2026-01-05 09:57:20 -05:00
|
|
|
protobuf>=3.20.0,<5.0.0
|
2025-03-01 20:37:52 -05:00
|
|
|
matplotlib>=3.5.0
|
|
|
|
|
soundfile>=0.10.3
|
|
|
|
|
ffmpeg-python>=0.2.0
|
|
|
|
|
|
|
|
|
|
# Optional: Ollama Python client (uncomment to install)
|
|
|
|
|
# ollama
|
|
|
|
|
|
|
|
|
|
# Installation notes:
|
|
|
|
|
# 1. For Windows users, you may need to install PyTorch separately (the cu118 index below provides CUDA 11.8 builds):
|
|
|
|
|
# pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118
|
|
|
|
|
#
|
|
|
|
|
# 2. If tokenizers fails to build on Windows, try installing Visual C++ Build Tools:
|
|
|
|
|
# https://visualstudio.microsoft.com/visual-cpp-build-tools/
|
|
|
|
|
#
|
|
|
|
|
# 3. For pyannote.audio, you'll need a HuggingFace token with access to:
|
|
|
|
|
# https://huggingface.co/pyannote/speaker-diarization-3.0
|
|
|
|
|
#
|
|
|
|
|
# 4. FFmpeg is required for audio processing:
|
|
|
|
|
# Windows: https://www.gyan.dev/ffmpeg/builds/
|
|
|
|
|
# Mac: brew install ffmpeg
|
|
|
|
|
# Linux (Debian/Ubuntu): sudo apt-get install ffmpeg
|