Spaces:

rjproz
/

maya1-txt2speech

Running

Rajkumar Pramanik "RJproz" committed 21 days ago

Commit

f8e32a0

1 Parent(s): 3dde740

bug fixes

Files changed (1) hide show

app.py CHANGED Viewed

@@ -196,24 +196,23 @@ def generate_speech(description, text, temperature, max_tokens):
         if len(audio) > 2048:
             audio = audio[2048:]
-        # Convert to WAV and save to temporary file
-        # import tempfile
-        # import soundfile as sf
-        # audio_int16 = (audio * 32767).astype(np.int16)
-        # # Create temporary file
-        # with tempfile.NamedTemporaryFile(delete=False, suffix='.wav') as tmp_file:
-        #     tmp_path = tmp_file.name
-        # # Save audio
-        # sf.write(tmp_path, audio_int16, AUDIO_SAMPLE_RATE)
-        # duration = len(audio) / AUDIO_SAMPLE_RATE
-        # status_msg = f"Generated {duration:.2f}s of emotional speech!"
-        tmp_path = "success"
-        status_msg = "success"
         return tmp_path, status_msg
     except Exception as e:
@@ -287,17 +286,17 @@ with gr.Blocks(title="Maya1 - Open Source Emotional TTS", theme=gr.themes.Soft()
         with gr.Column(scale=1):
             gr.Markdown("### Generated Audio")
-            # audio_output = gr.Audio(
-            #     label="Generated Speech",
-            #     type="filepath",
-            #     interactive=False
-            # )
-            audio_output = gr.Textbox(
-                label="Autio Path",
-                lines=3,
                 interactive=False
             )
             status_output = gr.Textbox(
                 label="Status",

         if len(audio) > 2048:
             audio = audio[2048:]
+        # Convert to WAV and save to temporary file
+        import tempfile
+        import soundfile as sf
+        audio_int16 = (audio * 32767).astype(np.int16)
+        # Create temporary file
+        with tempfile.NamedTemporaryFile(delete=False, suffix='.wav') as tmp_file:
+            tmp_path = tmp_file.name
+        # Save audio
+        sf.write(tmp_path, audio_int16, AUDIO_SAMPLE_RATE)
+        duration = len(audio) / AUDIO_SAMPLE_RATE
+        status_msg = f"Generated {duration:.2f}s of emotional speech!"
         return tmp_path, status_msg
     except Exception as e:
         with gr.Column(scale=1):
             gr.Markdown("### Generated Audio")
+            audio_output = gr.Audio(
+                label="Generated Speech",
+                type="filepath",
                 interactive=False
             )
+            # audio_output = gr.Textbox(
+            #     label="Autio Path",
+            #     lines=3,
+            #     interactive=False
+            # )
             status_output = gr.Textbox(
                 label="Status",