fakevoice / app.py
seawolf2357's picture
Update app.py
65dcd62
raw
history blame
2.69 kB
import gradio as gr
import requests
def generate_audio(text, voice_name):
MAX_CHARS = 100
# ์ž…๋ ฅ๋œ ํ…์ŠคํŠธ ๊ธธ์ด ๊ฒ€์ฆ
if len(text) > MAX_CHARS:
text = text[:MAX_CHARS] # ์ตœ๋Œ€ ๊ธ€์ž์ˆ˜๋กœ ํ…์ŠคํŠธ ์ž๋ฅด๊ธฐ
voices = {
"๋‚จ์„ฑAI": "6uQD2RqeSgIey9LVBafG",
"์—ฌ์„ฑAI": "jeuEgCxtyEYkC3zsQODy",
"์ฐจ์Šน์›": "SKwm0HLYsVDCM2ruvw2p",
"๊น€์ •์€": "YPWL3nQPzBN1XaiZF4aj",
"๋…ธ๋ฌดํ˜„": "6JdivX36i1eJ3LqLmvwH",
"๊ถ์˜ˆ": "4kFrgJPCTjA6DyPM5Gr5",
"์œค์„์—ด": "Qrf03Q67kRgpFlj9fto3"
}
voice_id = voices[voice_name]
url = f"https://api.elevenlabs.io/v1/text-to-speech/{voice_id}"
model_id = "eleven_multilingual_v2"
payload = {
"model_id": model_id,
"text": text,
"voice_settings": {
"similarity_boost": 0.75,
"stability": 0.5,
"style": 0,
"use_speaker_boost": True
}
}
headers = {
"Content-Type": "application/json",
"xi-api-key": "c5fb99a2b25402f104d246379bcf819a"
}
response = requests.post(url, json=payload, headers=headers, stream=True)
if response.status_code == 200:
chunks = []
for chunk in response.iter_content(chunk_size=CHUNK_SIZE):
chunks.append(chunk)
return b''.join(chunks)
else:
raise Exception(f"์˜ค๋ฅ˜ ๋ฐœ์ƒ. ์ƒํƒœ ์ฝ”๋“œ: {response.status_code}")
CHUNK_SIZE = 1024
# Gradio ์ธํ„ฐํŽ˜์ด์Šค ์ •์˜
with gr.Blocks() as demo:
gr.Markdown("FakeVoice: AI๊ฐ€ ๋ณต์ œํ•œ ์œ ๋ช…์ธ์˜ ์Œ์„ฑ์œผ๋กœ, ํ…์ŠคํŠธ๋งŒ ์ž…๋ ฅํ•˜๋ฉด ์ž์—ฐ์Šค๋Ÿฝ๊ฒŒ ํ•ด๋‹น ์ธ๋ฌผ์˜ ์Œ์„ฑ์œผ๋กœ ์ƒ์„ฑํ•ฉ๋‹ˆ๋‹ค.")
gr.Markdown("์ง€๊ธˆ ์ปค๋ฎค๋‹ˆํ‹ฐ์— ์ฐธ์—ฌํ•˜์‹œ๋ฉด ๋”์šฑ ๋งŽ์€ ์ •๋ณด์™€ ๋‹ค์–‘ํ•œ ๊ธฐํšŒ๋ฅผ ์–ป์œผ์‹ค ๊ฒƒ์ž…๋‹ˆ๋‹ค. ์ปค๋ฎค๋‹ˆํ‹ฐ ์ฐธ์—ฌ ๋งํฌ https://open.kakao.com/o/gE6hK9Vf ")
gr.Markdown("์ƒ์„ฑ๋œ ์˜ค๋””์˜ค๋ฅผ ๋‹ค์šด๋กœ๋“œ ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๋‹ค์šด๋กœ๋“œ ๋ฐ›์œผ์‹  ํ›„ ๋‹ค์šด๋กœ๋“œ ๋ฐ›์€ ํŒŒ์ผ์˜ ํ™•์žฅ์ž๋ฅผ mp3๋กœ ๋ณ€๊ฒฝํ•˜์‹œ๋ฉด ๋ฉ๋‹ˆ๋‹ค. ")
text_input = gr.Textbox(label="์Œ์„ฑ์œผ๋กœ ์ƒ์„ฑํ•  ํ…์ŠคํŠธ๋ฅผ ์ž…๋ ฅํ•˜์„ธ์š”.(100๊ธ€์ž ์ด๋‚ด ์ œํ•œ ์„ค์ •๋˜์–ด, ์ดˆ๊ณผ์‹œ ์Œ์„ฑ ์ƒ์„ฑ์ด ์ œํ•œ๋ฉ๋‹ˆ๋‹ค.)")
voice_choice = gr.Dropdown(choices=["๋‚จ์„ฑAI", "์—ฌ์„ฑAI", "์ฐจ์Šน์›", "๊น€์ •์€", "๋…ธ๋ฌดํ˜„", "๊ถ์˜ˆ", "์œค์„์—ด"], label="์Œ์„ฑ ์„ ํƒ")
submit_button = gr.Button("์ƒ์„ฑ")
audio_output = gr.Audio(label="์ƒ์„ฑ๋œ ์˜ค๋””์˜ค")
submit_button.click(
fn=generate_audio,
inputs=[text_input, voice_choice],
outputs=audio_output
)
if __name__ == "__main__":
demo.launch()