|
import gradio as gr |
|
import requests |
|
import os |
|
from dotenv import load_dotenv |
|
|
|
|
|
load_dotenv() |
|
|
|
|
|
CHUNK_SIZE = 1024 |
|
XI_API_KEY = os.getenv("XI_API_KEY") |
|
VOICE_ID = os.getenv("VOICE_ID") |
|
|
|
def text_to_speech(text): |
|
|
|
tts_url = f"https://api.elevenlabs.io/v1/text-to-speech/{VOICE_ID}/stream" |
|
|
|
|
|
headers = { |
|
"Accept": "application/json", |
|
"xi-api-key": XI_API_KEY |
|
} |
|
|
|
|
|
data = { |
|
"text": text, |
|
"model_id": "eleven_multilingual_v2", |
|
"voice_settings": { |
|
"stability": 0.5, |
|
"similarity_boost": 0.8, |
|
"style": 0.0, |
|
"use_speaker_boost": True |
|
} |
|
} |
|
|
|
|
|
response = requests.post(tts_url, headers=headers, json=data, stream=True) |
|
|
|
|
|
if response.ok: |
|
|
|
output_path = "output.mp3" |
|
with open(output_path, "wb") as f: |
|
|
|
for chunk in response.iter_content(chunk_size=CHUNK_SIZE): |
|
f.write(chunk) |
|
return output_path |
|
else: |
|
return f"Error: {response.text}" |
|
|
|
|
|
iface = gr.Interface( |
|
fn=text_to_speech, |
|
inputs="text", |
|
outputs="audio", |
|
title="", |
|
description="Texto a generar." |
|
) |
|
|
|
|
|
if __name__ == "__main__": |
|
iface.launch() |
|
|