Spaces:

gnosticdev
/

INVIDEO_BASIC

Running

App Files Community

gnosticdev committed on Jul 13

Commit

4ad7ee5

verified ·

1 Parent(s): 744ab6c

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -14

app.py CHANGED Viewed

@@ -491,21 +491,20 @@ def crear_video(prompt_type, input_text, selected_voice, musica_file=None):
         logger.info("Generando audio de voz...")
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
-        tts_voices_to_try = [selected_voice] # Intentar primero la voz seleccionada
-        # Añadir voces de respaldo si no están ya en la lista y son diferentes a la seleccionada
-        # Nos aseguramos de no añadir None o IDs vacíos a la lista de reintento
-        if "es-ES-JuanNeural" not in tts_voices_to_try and "es-ES-JuanNeural" is not None: tts_voices_to_try.append("es-ES-JuanNeural")
-        if "es-ES-ElviraNeural" not in tts_voices_to_try and "es-ES-ElviraNeural" is not None: tts_voices_to_try.append("es-ES-ElviraNeural")
-        # Si la lista de voces disponibles es fiable, podrías usar un subconjunto ordenado para reintentos más amplios
-        # Opcional: si AVAILABLE_VOICES es fiable, podrías usar un subconjunto ordenado para reintentos
-        # Ejemplo: for voice_id in [selected_voice] + sorted([v[1] for v in AVAILABLE_VOICES if v[1].startswith('es-') and v[1] != selected_voice]) + sorted([v[1] for v in AVAILABLE_VOICES if not v[1].startswith('es-') and v[1] != selected_voice]):
         tts_success = False
-        tried_voices = set() # Usar un set para rastrear voces intentadas de forma eficiente
         for current_voice in tts_voices_to_try:
-            if not current_voice or current_voice in tried_voices: continue # Evitar intentar IDs None/vacíos o duplicados
             tried_voices.add(current_voice)
             logger.info(f"Intentando TTS con voz: {current_voice}...")
@@ -513,12 +512,11 @@ def crear_video(prompt_type, input_text, selected_voice, musica_file=None):
                 tts_success = asyncio.run(text_to_speech(guion, voz_path, voice=current_voice))
                 if tts_success:
                     logger.info(f"TTS exitoso con voz '{current_voice}'.")
-                    break # Salir del bucle de reintento si tiene éxito
             except Exception as e:
                  logger.warning(f"Fallo al generar TTS con voz '{current_voice}': {str(e)}", exc_info=True)
-                 pass # Continuar al siguiente intento
-        # Verificar si el archivo fue creado después de todos los intentos
         if not tts_success or not os.path.exists(voz_path) or os.path.getsize(voz_path) <= 100:
              logger.error("Fallo en la generación de voz después de todos los intentos. Archivo de audio no creado o es muy pequeño.")
              raise ValueError("Error generando voz a partir del guion (fallo de TTS).")
@@ -532,6 +530,12 @@ def crear_video(prompt_type, input_text, selected_voice, musica_file=None):
             try: audio_tts_original.close()
             except: pass
             audio_tts_original = None
             raise ValueError("Audio de voz generado es inválido después de procesamiento inicial.")
         audio_tts = audio_tts_original
@@ -541,7 +545,6 @@ def crear_video(prompt_type, input_text, selected_voice, musica_file=None):
         if audio_duration < 1.0:
              logger.error(f"Duración audio voz ({audio_duration:.2f}s) es muy corta.")
              raise ValueError("Generated voice audio is too short (min 1 second required).")
         # 3. Extraer palabras clave
         logger.info("Extrayendo palabras clave...")
         try:

         logger.info("Generando audio de voz...")
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
+        tts_voices_to_try = [selected_voice]
+        fallback_juan = "es-ES-JuanNeural"
+        fallback_elvira = "es-ES-ElviraNeural"
+        if fallback_juan and fallback_juan != selected_voice and fallback_juan not in tts_voices_to_try:
+            tts_voices_to_try.append(fallback_juan)
+        if fallback_elvira and fallback_elvira != selected_voice and fallback_elvira not in tts_voices_to_try:
+            tts_voices_to_try.append(fallback_elvira)
         tts_success = False
+        tried_voices = set()
         for current_voice in tts_voices_to_try:
+            if not current_voice or current_voice in tried_voices: continue
             tried_voices.add(current_voice)
             logger.info(f"Intentando TTS con voz: {current_voice}...")
                 tts_success = asyncio.run(text_to_speech(guion, voz_path, voice=current_voice))
                 if tts_success:
                     logger.info(f"TTS exitoso con voz '{current_voice}'.")
+                    break
             except Exception as e:
                  logger.warning(f"Fallo al generar TTS con voz '{current_voice}': {str(e)}", exc_info=True)
+                 pass
         if not tts_success or not os.path.exists(voz_path) or os.path.getsize(voz_path) <= 100:
              logger.error("Fallo en la generación de voz después de todos los intentos. Archivo de audio no creado o es muy pequeño.")
              raise ValueError("Error generando voz a partir del guion (fallo de TTS).")
             try: audio_tts_original.close()
             except: pass
             audio_tts_original = None
+            if os.path.exists(voz_path):
+                try: os.remove(voz_path)
+                except: pass
+                if voz_path in temp_intermediate_files:
+                     temp_intermediate_files.remove(voz_path)
             raise ValueError("Audio de voz generado es inválido después de procesamiento inicial.")
         audio_tts = audio_tts_original
         if audio_duration < 1.0:
              logger.error(f"Duración audio voz ({audio_duration:.2f}s) es muy corta.")
              raise ValueError("Generated voice audio is too short (min 1 second required).")
         # 3. Extraer palabras clave
         logger.info("Extrayendo palabras clave...")
         try: