# text_to_speech_Vietnamese / requirements_eval.txt
# 3v324v23's picture
# up
# af11ce4
torch
numpy
# Audio processing
librosa
soundfile
# Model
s3prl
pyannote.audio
funasr
transformers
# Word error rate (WER) computation
jiwer==3.1.0
# Chinese text normalization (Simplified/Traditional conversion, punctuation constants)
zhconv
zhon