Spaces:

maya-research
/

maya1

Running on Zero

Veena committed on Nov 7

Commit

ab22398

1 Parent(s): e5b76b7

Update Maya1 Gradio app with preset characters

Files changed (1) hide show

app.py CHANGED Viewed

@@ -194,20 +194,23 @@ def generate_speech(preset_name, description, text, temperature, max_tokens):
         if len(audio) > 2048:
             audio = audio[2048:]
-        # Convert to WAV
         audio_int16 = (audio * 32767).astype(np.int16)
-        wav_buffer = io.BytesIO()
-        with wave.open(wav_buffer, 'wb') as wav_file:
-            wav_file.setnchannels(1)
-            wav_file.setsampwidth(2)
-            wav_file.setframerate(AUDIO_SAMPLE_RATE)
-            wav_file.writeframes(audio_int16.tobytes())
-        wav_buffer.seek(0)
-        duration = len(audio) / AUDIO_SAMPLE_RATE
         status_msg = f"Generated {duration:.2f}s of emotional speech!"
-        return wav_buffer, status_msg
     except Exception as e:
         import traceback

         if len(audio) > 2048:
             audio = audio[2048:]
+        # Convert to WAV and save to temporary file
+        import tempfile
+        import soundfile as sf
         audio_int16 = (audio * 32767).astype(np.int16)
+        # Create temporary file
+        with tempfile.NamedTemporaryFile(delete=False, suffix='.wav') as tmp_file:
+            tmp_path = tmp_file.name
+        # Save audio
+        sf.write(tmp_path, audio_int16, AUDIO_SAMPLE_RATE)
+        duration = len(audio) / AUDIO_SAMPLE_RATE
         status_msg = f"Generated {duration:.2f}s of emotional speech!"
+        return tmp_path, status_msg
     except Exception as e:
         import traceback