File size: 1,643 Bytes
4b1c031
 
 
 
 
 
bac2101
 
4b1c031
 
 
bac2101
4b1c031
 
 
 
 
 
 
bac2101
 
4b1c031
 
 
 
 
bac2101
4b1c031
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
# --- Core Torch Stack ---
# NOTE(review): torch itself is not pinned in this file; presumably it comes from
# the base environment or as a dependency of the pins below — confirm it matches them.
torchaudio==2.8.0
torchvision==0.23.0
triton
deepspeed==0.17.1
# NOTE(review): prebuilt binary wheel fetched by direct URL from a non-PyPI host.
# The path follows the Hugging Face Hub "resolve" layout — confirm this host is the
# intended, trusted source before installing.
flash-attn-3 @ https://huggingface.co/alexnasa/flash-attn-3/resolve/main/128/flash_attn_3-3.0.0b1-cp39-abi3-linux_x86_64.whl
# Git dependencies: no tag or commit is given, so each install takes whatever the
# repository's default branch contains at that moment.
indextts @ git+https://github.com/OutofAi/index-tts-batch.git
latentsync @ git+https://github.com/OutofAi/LatentSync-batch.git

# --- Audio / Speech / Subtitles ---
pyannote.audio
ctranslate2
faster-whisper
pydub==0.25.1
srt
audio-separator==0.24.1
ffmpeg-python==0.2.0
python_speech_features==0.6
librosa==0.10.2.post1  # NOTE(review): pin is higher than 0.10.1; presumably the higher of two merged pins was kept — confirm

# --- Transformers / Text / Config utilities ---
accelerate==1.8.1        
transformers==4.52.3     
tokenizers==0.21.0
sentencepiece
g2p-en==2.1.0
cn2an==0.5.22
textstat
omegaconf==2.3.0         
munch==4.0.0
tqdm
json5==0.10.0

# --- Diffusion / Vision / Video ---
diffusers==0.33.1
# Upper bound only: any huggingface-hub release below 1.0 is accepted.
huggingface-hub<1.0
imageio==2.27.0
decord==0.6.0
opencv-python==4.9.0.80   # NOTE(review): presumably a duplicate entry with the same pin was removed here — confirm
mediapipe==0.10.11
av
torch-fidelity==0.3.0
torchmetrics==1.3.1
lpips==0.1.4
face-alignment==1.4.1
insightface==0.7.3
kornia==0.8.0
scenedetect==0.6.1
moviepy==1.0.3

# --- Numerical / Scientific ---
numpy==1.26.2   # NOTE(review): pin is higher than 1.24.4; presumably the higher of two merged pins was kept — confirm
matplotlib==3.8.2
numba==0.58.1
Cython==3.0.7
einops==0.7.0
ninja==1.11.1.1

# --- Model Repos & Tools ---
# The two git dependencies below carry no tag or commit, so each install takes
# whatever the repository's default branch contains at that moment.
descript-audiotools @ git+https://github.com/descriptinc/audiotools.git
tigersound @ git+https://github.com/OutofAi/tigersound.git
tensorboard
hf-xet==1.1.8
DeepCache==0.1.1
ultralytics
batch-face
modelscope==1.27.0
onnxruntime-gpu==1.21.0

# --- Language-specific packages ---
jieba==0.42.1

# --- Environment-specific ---
# Exactly one of the two packages below is selected, depending on the OS.
# `platform_system` is the marker that evaluates to "Darwin" on macOS;
# `platform_machine` is the CPU architecture (e.g. "x86_64", "arm64") and never
# equals "Darwin", so it must not be used for this check.
WeTextProcessing; platform_system != "Darwin"
wetext; platform_system == "Darwin"