Spaces:
Running
on
Zero
Running
on
Zero
xieli
committed on
Commit
·
efe05ae
1
Parent(s):
96d377d
feat: remove useless code
Browse files
tts.py
CHANGED
|
@@ -123,8 +123,8 @@ class StepAudioTTS:
|
|
| 123 |
"""
|
| 124 |
try:
|
| 125 |
logger.debug(f"Starting voice cloning: {prompt_wav_path}")
|
| 126 |
-
prompt_wav,
|
| 127 |
-
vq0206_codes, vq02_codes_ori, vq06_codes_ori, speech_feat,
|
| 128 |
self.preprocess_prompt_wav(prompt_wav_path)
|
| 129 |
)
|
| 130 |
prompt_speaker = self.generate_clone_voice_id(prompt_text, prompt_wav)
|
|
@@ -135,7 +135,6 @@ class StepAudioTTS:
|
|
| 135 |
target_text,
|
| 136 |
prompt_text,
|
| 137 |
prompt_speaker,
|
| 138 |
-
vq0206_codes,
|
| 139 |
prompt_wav_tokens,
|
| 140 |
)
|
| 141 |
|
|
@@ -297,7 +296,7 @@ class StepAudioTTS:
|
|
| 297 |
return history
|
| 298 |
|
| 299 |
def _encode_audio_edit_clone_prompt(
|
| 300 |
-
self, text: str, prompt_text: str, prompt_speaker: str,
|
| 301 |
):
|
| 302 |
prompt = self.edit_clone_sys_prompt_tpl.format(
|
| 303 |
speaker=prompt_speaker,
|
|
|
|
| 123 |
"""
|
| 124 |
try:
|
| 125 |
logger.debug(f"Starting voice cloning: {prompt_wav_path}")
|
| 126 |
+
prompt_wav, _ = torchaudio.load(prompt_wav_path)
|
| 127 |
+
vq0206_codes, vq02_codes_ori, vq06_codes_ori, speech_feat, _, speech_embedding = (
|
| 128 |
self.preprocess_prompt_wav(prompt_wav_path)
|
| 129 |
)
|
| 130 |
prompt_speaker = self.generate_clone_voice_id(prompt_text, prompt_wav)
|
|
|
|
| 135 |
target_text,
|
| 136 |
prompt_text,
|
| 137 |
prompt_speaker,
|
|
|
|
| 138 |
prompt_wav_tokens,
|
| 139 |
)
|
| 140 |
|
|
|
|
| 296 |
return history
|
| 297 |
|
| 298 |
def _encode_audio_edit_clone_prompt(
|
| 299 |
+
self, text: str, prompt_text: str, prompt_speaker: str, prompt_wav_tokens: str
|
| 300 |
):
|
| 301 |
prompt = self.edit_clone_sys_prompt_tpl.format(
|
| 302 |
speaker=prompt_speaker,
|