import gradio as gr import librosa from asr import transcribe, ASR_EXAMPLES, ASR_NOTE # Define only English and Swahili languages ASR_LANGUAGES = { "eng": "English", "swh": "Swahili", } # Speech-to-Text Interface mms_transcribe = gr.Interface( fn=transcribe, inputs=[ gr.Audio(), gr.Dropdown( [f"{k} ({v})" for k, v in ASR_LANGUAGES.items()], label="Language", value="eng English", ), ], outputs="text", examples=ASR_EXAMPLES, title="Speech-to-Text", description="Transcribe audio in either English or Swahili.", article=ASR_NOTE, allow_flagging="never", ) # Main Gradio App with gr.Blocks() as demo: gr.Markdown("
MMS Speech-to-Text
") gr.HTML("