File size: 1,285 Bytes
84fefb5
64d252e
 
 
 
 
 
 
 
84fefb5
64d252e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84fefb5
64d252e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84fefb5
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
Gradio<4.0.0,>=3.0.0  # Accepts any 3.x release; 4.0.0 and later are excluded
torch>=2.0.0
torchaudio>=2.0.0
librosa>=0.10.0
soundfile>=0.12.0
numpy>=1.24.0
scipy>=1.10.0
matplotlib>=3.7.0
seaborn>=0.12.0
pandas==1.5.3  # Pinned to a version compatible with spleeter and gradio
requests>=2.31.0
Pillow>=10.0.0
transformers>=4.30.0
accelerate>=0.20.0
datasets>=2.14.0
huggingface_hub>=0.16.0

# Audio processing and separation
demucs>=4.0.0
spleeter>=2.4.0
pedalboard>=0.7.0
pyrubberband>=0.3.0

# Voice synthesis and conversion
so-vits-svc-fork>=4.0.0
fairseq>=0.12.0
espnet>=202301
parler-tts>=0.1.0

# Additional audio processing
# librosa and soundfile are already listed in the first group, so they are not repeated here
audioread>=3.0.0
resampy>=0.4.0
numba>=0.57.0

# Machine learning utilities
scikit-learn>=1.3.0
joblib>=1.3.0
tensorboard>=2.13.0
wandb>=0.15.0

# Utilities
tqdm>=4.65.0
click>=8.1.0  # NOTE(review): spleeter's typer dependency may cap click below 7.2 - verify pip can resolve both
colorama>=0.4.6
pyyaml>=6.0
python-dotenv>=1.0.0
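pathlib2>=2.3.7  # NOTE(review): backport of the stdlib pathlib; likely redundant on Python 3 - confirm before removing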

# Optional dependencies for enhanced functionality
# Uncomment if needed:
# praat-parselmouth>=0.4.3  # For advanced pitch analysis
# crepe>=0.0.12  # For pitch tracking
# pysptk>=0.1.21  # For speech signal processing
# pyworld>=0.3.2  # For speech analysis and synthesis

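# GPU acceleration (CUDA): no extra package needs to be enabled here. CUDA support
# comes from installing CUDA-enabled builds of torch and torchaudio (see the
# PyTorch installation guide for the wheel index matching your CUDA version).
# NOTE(review): "torch-audio-cuda" does not appear to be a published package;
# leave the following line commented out unless that is confirmed otherwise.
# torch-audio-cuda>=2.0.0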