-
Notifications
You must be signed in to change notification settings - Fork 3
Expand file tree
/
Copy pathrequirements.txt
More file actions
48 lines (42 loc) · 1.48 KB
/
requirements.txt
File metadata and controls
48 lines (42 loc) · 1.48 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# Algorithmic Filmmaking - Pure Python MVP
# Core dependencies for scene detection and video processing
certifi>=2024.0.0
click>=8.0
PySide6>=6.6
python-mpv>=1.0.8
scenedetect[opencv]>=0.6.4
opencv-python>=4.8
numpy>=1.24
yt-dlp>=2024.1
scikit-learn>=1.3
transformers>=4.50,<5
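# torch and torchvision MUST be installed together: each torchvision release is
# built against one torch minor version (0.19 <-> 2.4, 0.20 <-> 2.5, 0.21 <-> 2.6),
# so keep the two version ranges below in lockstep.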
torch>=2.4,<2.7
torchvision>=0.19,<0.22
sentencepiece>=0.2.0
protobuf>=4.25,<6
Pillow>=10.0
faster-whisper>=1.0.0
# MLX packages (Apple Silicon) are installed on demand via the feature registry,
# not from this file: lightning-whisper-mlx conflicts with litellm over the
# tiktoken version, and mlx-vlm is heavy. Both are listed in requirements-optional.txt.
google-api-python-client>=2.100.0
keyring>=24.0
mcp[cli]>=1.2.0
# LLM Integration
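# The vendored wheel avoids a build-time dependency on PyPI-hosted LiteLLM artifacts.
# NOTE: pip resolves this relative path against the current working directory,
# so run the install from the repository root.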
./vendor/wheels/litellm-1.82.6-py3-none-any.whl
tenacity>=8.2.0
httpx>=0.25.0
# Content Analysis
ultralytics>=8.4.0 # YOLO26 (NMS-free; up to 43% faster CPU inference per Ultralytics)
insightface>=0.7.3,<1.0 # Face detection and ArcFace embeddings
onnxruntime>=1.16.0,<2.0 # InsightFace backend (supports Apple Silicon natively since 1.16)
einops>=0.7.0
# OCR / Text Extraction
paddleocr>=3.0.0 # PaddleOCR PP-OCRv5 for text extraction (replaces Tesseract)
rapidfuzz>=3.0.0 # Fast fuzzy string matching for text comparison
# Audio Analysis
librosa>=0.10.0 # Beat detection, tempo analysis, onset detection
# Development
watchdog>=3.0.0 # File watching for auto-restart (watchmedo)