Update app.py
Browse files
app.py
CHANGED
|
@@ -24,15 +24,8 @@ def generate_audio(text, language, speaker_wav):
|
|
| 24 |
if speaker_wav is not None:
|
| 25 |
audio = tts.tts(text=text, speaker_wav=speaker_wav, language=language)
|
| 26 |
audio_np = np.array(audio, dtype=np.float16)
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
buffer = BytesIO()
|
| 30 |
-
sf.write(buffer, audio_np, 24000, format="WAV")
|
| 31 |
-
buffer.seek(0)
|
| 32 |
-
|
| 33 |
-
# Codificar a base64
|
| 34 |
-
audio_b64 = base64.b64encode(buffer.read()).decode("utf-8")
|
| 35 |
-
return f"data:audio/wav;base64,{audio_b64}"
|
| 36 |
|
| 37 |
# 🎛️ Interfaz
|
| 38 |
iface = gr.Interface(
|
|
@@ -42,7 +35,7 @@ iface = gr.Interface(
|
|
| 42 |
gr.Text(label="Idioma (ej: 'es', 'en')"),
|
| 43 |
gr.Audio(type="filepath", label="Audio de voz")
|
| 44 |
],
|
| 45 |
-
outputs=
|
| 46 |
)
|
| 47 |
|
| 48 |
iface.launch()
|
|
|
|
| 24 |
if speaker_wav is not None:
|
| 25 |
audio = tts.tts(text=text, speaker_wav=speaker_wav, language=language)
|
| 26 |
audio_np = np.array(audio, dtype=np.float16)
|
| 27 |
+
return (24000, audio_np)
|
| 28 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
|
| 30 |
# 🎛️ Interfaz
|
| 31 |
iface = gr.Interface(
|
|
|
|
| 35 |
gr.Text(label="Idioma (ej: 'es', 'en')"),
|
| 36 |
gr.Audio(type="filepath", label="Audio de voz")
|
| 37 |
],
|
| 38 |
+
outputs="audio"
|
| 39 |
)
|
| 40 |
|
| 41 |
iface.launch()
|