# zoengjyutgaai_tts / requirements.txt
# laubonghaudoi's picture
# Update requirements.txt
# 4f4edca
# Core dependencies for Cantonese TTS HF Space
# Based on original GPT-SoVITS requirements.txt
# Core ML frameworks, plus the Space runtime and UI packages
spaces>=0.19.0
torch>=2.0.0
torchaudio
pytorch-lightning>=2.4
gradio<5
# Audio processing
librosa==0.10.2
soundfile
ffmpeg-python
numba
scipy
av>=11
# Array processing
numpy<2.0
# NLP and text processing
transformers>=4.43,<=4.50
sentencepiece
tokenizers>=0.13,<1
jieba
jieba_fast
pypinyin
cn2an
ToJyutping
opencc
g2pk2
ko_pron
split-lang
fast_langdetect>=0.3.1
wordsegment
g2p_en
pyopenjtalk>=0.4.1
# Model related
peft
safetensors
huggingface_hub>=0.13
modelscope==1.10.0
funasr==1.0.27
# Additional ML tools
rotary_embedding_torch
x_transformers
torchmetrics<=1.5
tensorboard
# ONNX Runtime: onnxruntime-gpu on x86_64/AMD64, plain onnxruntime on aarch64/arm64
onnxruntime-gpu; platform_machine == "x86_64" or platform_machine == "AMD64"
onnxruntime; platform_machine == "aarch64" or platform_machine == "arm64"
# Web framework
fastapi[standard]>=0.115.2
pydantic<=2.10.6
# Utilities
tqdm
psutil
chardet
PyYAML
# Platform specific
python_mecab_ko; sys_platform != 'win32'
# Additional packages that might be needed
accelerate
ctranslate2>=4.0,<5
# Note: opencc might need to be built from source; if so, pass pip's --no-binary=opencc option when installing.