# Scraped page header (not part of the program): chaouch's picture · try · e18ea74
import gradio as gr
from transformers import pipeline
# Fine-tuned Whisper checkpoint to load; update with your model id.
_MODEL_ID = "chaouch/whisper-small-dv"

# Pipelines that have already been built, keyed by model id, so the model is
# loaded once per process instead of once per transcription request.
_PIPELINE_CACHE = {}


def _get_asr_pipeline(model_id):
    """Return the speech-recognition pipeline for *model_id*, building it on first use."""
    if model_id not in _PIPELINE_CACHE:
        _PIPELINE_CACHE[model_id] = pipeline(
            "automatic-speech-recognition", model=model_id
        )
    return _PIPELINE_CACHE[model_id]


def transcribe_speech(filepath):
    """Transcribe the audio file at *filepath* and return the recognised text.

    Args:
        filepath: Path to an audio file. May be ``None`` or empty when the
            caller has no recording to transcribe.

    Returns:
        The ``"text"`` field of the pipeline output, or an empty string when
        no audio was supplied.
    """
    # Nothing was recorded/uploaded: return early rather than handing an
    # invalid input to the pipeline.
    if not filepath:
        return ""

    pipe = _get_asr_pipeline(_MODEL_ID)
    output = pipe(
        filepath,
        max_new_tokens=256,
        generate_kwargs={
            "task": "transcribe",
            "language": "sinhalese",
        },  # update with the language you've fine-tuned on
        chunk_length_s=30,
        batch_size=8,
    )
    return output["text"]
if __name__ == "__main__":
    # Build a microphone -> text demo around transcribe_speech.
    # type="filepath" makes Gradio hand the callback a path to the recorded
    # audio, which is what transcribe_speech forwards to the pipeline;
    # "file" is not an accepted value for gr.Audio's `type` argument.
    demo = gr.Interface(
        fn=transcribe_speech,
        inputs=gr.Audio(sources=["microphone"], type="filepath"),
        outputs=gr.Textbox(),
    )
    # debug=True keeps the process attached and surfaces errors in the console.
    demo.launch(debug=True)