File size: 548 Bytes
4db9758
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
from transformers import pipeline
import gradio as gr

# Fine-tuned Whisper checkpoint used for recognition; the task is passed
# explicitly together with the checkpoint id.
_MODEL_ID = "erkhem-gantulga/whisper-medium-mn"
pipe = pipeline(
    model=_MODEL_ID,
    task="automatic-speech-recognition",
)

def transcribe(audio):
    """Transcribe one audio recording to text with the module-level pipeline.

    Args:
        audio: The value supplied by the audio input. The interface in this
            file configures that input with ``type="filepath"``, so this is
            expected to be a path string. It may be ``None`` or empty when
            the form is submitted without a recording.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        no audio was supplied.
    """
    # Nothing to recognise: return an empty transcript instead of handing
    # a missing input to the model and surfacing an error to the user.
    if audio is None or audio == "":
        return ""
    return pipe(audio)["text"]

# Audio can be uploaded or recorded from the microphone; the component is
# configured to hand the callback a file path.
audio_input = gr.Audio(type="filepath", sources=["upload", "microphone"])

# Single-input, single-output UI: audio in, transcript text out.
iface = gr.Interface(
    title="Whisper Medium Mongolian",
    description="Realtime demo for Mongolian speech recognition using a fine-tuned Whisper medium model.",
    fn=transcribe,
    inputs=audio_input,
    outputs="text",
)

# Start serving the interface.
iface.launch()