OpenCut/requirements.txt at main · SysAdminDoc/OpenCut · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# OpenCut v1.25.1 Requirements
# Install: pip install -r requirements.txt
# For GPU (CUDA 12.1 builds; change the cu121 suffix to match your CUDA version):
#   pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121

# === CORE (required) ===
# Active (uncommented) requirements: installed by `pip install -r requirements.txt`.
click>=8.0
rich>=13.0
flask>=3.0
flask-cors>=4.0
# The <3 upper bound keeps python-json-logger on the 2.x series.
# NOTE(review): this is the only upper-bounded pin in this file; the reason is
# not recorded here — confirm before relaxing it.
python-json-logger>=2.0,<3
psutil>=5.9

# === STANDARD (recommended) ===
faster-whisper>=1.0
# Headless OpenCV build (no GUI bindings). Only one opencv-python* distribution
# should be installed per environment, since they all provide the same cv2 package.
opencv-python-headless>=4.8
Pillow>=10.0
numpy>=1.24
librosa>=0.10
pydub>=0.25
noisereduce>=3.0
deep-translator>=1.11
# Use the opencv-headless extra: scenedetect[opencv] depends on opencv-python,
# which would install a second, conflicting cv2 next to opencv-python-headless.
scenedetect[opencv-headless]>=0.6

# === AUDIO (optional) ===
# demucs>=4.0              # Stem separation (~1.5GB with models)
# pedalboard>=0.9          # Pro audio FX chain
# edge-tts>=6.1            # Text-to-speech (requires internet)

# === AI/ML (optional, GPU recommended) ===
# realesrgan>=0.3          # AI upscaling (~67MB model)
# rembg>=2.0               # Background removal (~170MB model)
# gfpgan>=1.3              # Face enhancement (~330MB model)
# insightface>=0.7         # Face detection/swap
# onnxruntime-gpu>=1.16    # GPU inference for InsightFace
# audiocraft>=1.0          # MusicGen AI music (1.2-13GB models)

# === ADVANCED (optional) ===
# whisperx>=3.0            # Word-level timestamps + alignment
# pyannote.audio>=3.1      # Speaker diarization (needs HuggingFace token)

# === POST-PRODUCTION FEATURES (optional) ===
# Color matching & auto-zoom use opencv-python-headless + numpy (already listed above)

# Loudness matching uses FFmpeg subprocess (external tool, not pip)
# Install FFmpeg from https://ffmpeg.org/download.html

# Footage search uses stdlib json only (no extra deps)

# LLM integration (for chapters, NLP commands) — optional
# ollama: run locally via https://ollama.com (no pip package required here)
# openai>=1.0.0            # For OpenAI provider
# anthropic>=0.20.0        # For Anthropic provider