pip3 install -r requirements.txt
-
English
cd English
-
Chinese
cd Chinese
-
wav2vec 2.0
cd wav2vec2
-
HuBERT
cd hubert
-
WavLM
cd wavlm
-
English
bash dataset.sh
-
Chinese
Download the dataset from Common Voice, selecting "Chinese (Taiwan)" as the language and "Common Voice Corpus 17.0" as the version.
bash dataset.sh
python3 extract.py
python3 train.py
-
Without fast sampling
python3 inference.py
-
With fast sampling
python3 inference_2.py --C 0.99 --T 5