TriNguyenPO committed on
Commit
5cc86b0
·
verified ·
1 Parent(s): e4c0c4b

Create app.py

Browse files

import gradio as gr
from transformers import AutoModelForSpeechSeq2Seq, AutoTokenizer, pipeline

# Hub repository id shared by the tokenizer and the model weights.
MODEL_ID = "MarcNg/fastspeech2-vi-infore"

# Both artifacts are fetched once at import time so that every request served
# by the UI reuses the same in-memory objects.
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
# NOTE(review): AutoModelForSpeechSeq2Seq is normally the auto class for
# speech-to-text checkpoints -- confirm it resolves to a text-to-speech
# architecture for this repository.
model = AutoModelForSpeechSeq2Seq.from_pretrained(MODEL_ID)

# Module-level pipeline object that the request handler calls with raw text.
tts_pipeline = pipeline(
    task="text-to-speech",
    model=model,
    tokenizer=tokenizer,
)

def text_to_speech(text):
    """Synthesize speech for *text* and return it in Gradio's audio format.

    Args:
        text: The sentence(s) to speak, as typed into the UI text box.

    Returns:
        ``None`` when *text* is empty or whitespace-only (the audio output is
        simply left blank), otherwise a ``(sampling_rate, waveform)`` tuple,
        which is the form Gradio's ``"audio"`` output component accepts for
        in-memory audio.
    """
    # Nothing to synthesize; avoid sending an empty prompt to the model.
    if not text or not text.strip():
        return None

    output = tts_pipeline(text)
    audio = output["audio"]

    # The pipeline normally hands back a NumPy array, which has no .numpy()
    # method. Only convert when a tensor-like object is actually returned.
    if hasattr(audio, "detach"):
        audio = audio.detach().cpu().numpy()

    # Drop singleton batch/channel axes so mono audio becomes 1-D.
    audio = audio.squeeze()
    # The pipeline documents a (channels, samples) layout while Gradio expects
    # (samples, channels), so flip genuinely multi-channel output.
    if audio.ndim == 2:
        audio = audio.T

    # Gradio needs the sample rate alongside the waveform to play it back.
    return output["sampling_rate"], audio

# User-facing copy shown at the top of the demo page.
_TITLE = "Vietnamese Text-to-Speech"
_DESCRIPTION = "Enter Vietnamese text to convert to speech using FastSpeech 2 model."

# Single text box in, single audio player out, wired to the synthesis handler.
iface = gr.Interface(
    text_to_speech,
    inputs="text",
    outputs="audio",
    title=_TITLE,
    description=_DESCRIPTION,
)

# Start the web server for the demo.
iface.launch()

Files changed (1) hide show
  1. app.py +3 -0
app.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ transformers
2
+ gradio
3
+ soundfile