Spaces:

englissi
/

bgtts

Running

englissi committed on Oct 30, 2024

Commit

8d444a7

verified ·

1 Parent(s): ca7f474

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,24 +2,25 @@ import gradio as gr
 import torch
 from transformers import pipeline
-# Use a pipeline as a high-level helper
-from transformers import pipeline
-pipe = pipeline("automatic-speech-recognition", model="infinitejoy/wav2vec2-large-xls-r-300m-bulgarian")
-# TTS conversion function
-# NOTE(review): `tts` is not defined in the visible lines; the only pipeline
-# created above is `pipe`, an automatic-speech-recognition pipeline — confirm.
-def tts_generate(text):
-    audio = tts(text, return_tensors=True)
-    return (audio['speech'].numpy(), 22050)  # sampling rate and audio data to return
 # Gradio 인터페이스 생성
-# Text input -> tts_generate -> audio output.
-iface = gr.Interface(fn=tts_generate,
-                     inputs="text",
-                     outputs="audio",
-                     title="Bulgarian TTS Generator",
-                     description="Enter text to generate speech in Bulgarian.")
 # 인터페이스 실행
 if __name__ == "__main__":
     iface.launch()

 import torch
 from transformers import pipeline
+# Initialize the ASR pipeline for Bulgarian
+asr_pipeline = pipeline("automatic-speech-recognition", model="infinitejoy/wav2vec2-large-xls-r-300m-bulgarian")
+# ASR function (speech-to-text conversion)
+def asr_generate(audio):
+    """Transcribe an audio file to text with the Bulgarian ASR pipeline.
+
+    Args:
+        audio: Path of the audio file supplied by the Gradio Audio input
+            (configured with type="filepath"), or None when the user
+            submitted without providing any audio.
+
+    Returns:
+        The "text" field of the pipeline result, or an empty string when
+        no audio was provided.
+    """
+    # Gradio passes None when nothing was recorded; forwarding that to the
+    # pipeline would raise instead of producing a clean empty result.
+    if audio is None:
+        return ""
+    return asr_pipeline(audio)["text"]
 # Gradio 인터페이스 생성
+# Audio input -> asr_generate -> text output.
+iface = gr.Interface(
+    fn=asr_generate,
+    # The description promises "Upload or record", so both input sources are
+    # enabled. `sources` (a list) replaced the single-valued `source` keyword
+    # in Gradio 4. NOTE(review): confirm the Space runs Gradio >= 4.
+    inputs=gr.Audio(sources=["microphone", "upload"], type="filepath"),
+    outputs="text",
+    title="Bulgarian Speech Recognition",
+    description="Upload or record audio in Bulgarian to get the transcription."
+)
 # 인터페이스 실행
 if __name__ == "__main__":
     iface.launch()