| numpy<2.0 | |
| scipy | |
| tensorboard | |
| librosa==0.10.2 | |
| numba | |
| pytorch-lightning>=2.4 | |
| gradio<5 | |
| ffmpeg-python | |
| onnxruntime; sys_platform == 'darwin' | |
| onnxruntime-gpu; sys_platform != 'darwin' | |
| tqdm | |
| funasr==1.0.27 | |
| cn2an | |
| pypinyin | |
| pyopenjtalk>=0.4.1 | |
| g2p_en | |
| torchaudio | |
| modelscope==1.10.0 | |
| sentencepiece | |
| transformers>=4.43 | |
| peft | |
| chardet | |
| PyYAML | |
| psutil | |
| jieba_fast | |
| jieba | |
| split-lang | |
| fast_langdetect>=0.3.1 | |
| wordsegment | |
| rotary_embedding_torch | |
| ToJyutping | |
| g2pk2 | |
| ko_pron | |
| opencc; sys_platform != 'linux' | |
| opencc==1.1.1; sys_platform == 'linux' | |
| python_mecab_ko; sys_platform != 'win32' | |
| fastapi[standard]>=0.115.2 | |
| x_transformers | |
| torchmetrics<=1.5 | |
| pydantic<=2.10.6 | |
| ctranslate2>=4.0,<5 | |
| huggingface_hub>=0.13 | |
| tokenizers>=0.13,<1 | |
| av>=11 | |