File size: 631 Bytes
e53ffe1
3e83551
e53ffe1
9118213
 
e53ffe1
 
 
 
 
 
 
 
 
 
 
 
9118213
e53ffe1
9118213
e53ffe1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
# Extra wheel listings that pip searches in addition to the package index.
# The first page is expected to provide piper_phonemize and the second the
# CUDA builds of k2 (both are required further down) - confirm if a URL changes.
--find-links https://k2-fsa.github.io/icefall/piper_phonemize.html
--find-links https://k2-fsa.github.io/k2/cuda-cn.html

# torch/torchaudio are pinned to 2.5.1 because the k2 wheel required below
# (version tag "+cuda12.4.torch2.5.1") is built for exactly that torch release.
# The previous "<=2.6.0" bound allowed pip to select 2.6.0, which does not
# match that k2 build. Update these pins together with the k2 pin.
torch==2.5.1
torchaudio==2.5.1
lhotse
tensorboard
vocos

# Text normalization packages (unpinned: pip installs the latest release).
cn2an
inflect
unidecode

# Tokenization. piper_phonemize is expected to come from the
# piper_phonemize.html --find-links page declared at the top of this file.
piper_phonemize

# Exact pre-built k2 wheel. The local version tag names the CUDA (12.4) and
# torch (2.5.1) versions this build targets, so the installed torch is
# expected to match - verify whenever this pin or the torch requirement changes.
k2==1.24.4.dev20250208+cuda12.4.torch2.5.1

# Remaining dependencies; version bounds are kept as originally specified.
# gradio used to be listed twice (once bare, once as ">=3.45.2"); only the
# bounded entry is kept so each package is declared exactly once.
transformers==4.41.0
bitsandbytes>0.37.0
vinorm
cached_path
huggingface_hub
accelerate>=0.33.0
click
datasets
ema_pytorch>=0.5.2
gradio>=3.45.2
hydra-core>=1.3.0
jieba
librosa
matplotlib
numpy<=1.26.4
pydub
pypinyin
safetensors
soundfile
tomli
torchdiffeq
tqdm>=4.65.0
transformers_stream_generator
wandb
x_transformers>=1.31.14