Spaces:
Build error
Build error
# -*- coding: utf-8 -*- | |
"""whisper_youtube.ipynb | |
Automatically generated by Colaboratory. | |
Original file is located at | |
https://colab.research.google.com/drive/1spmA-7Un5TA6ahuCeO62BUS_ME6zPuUx | |
# Using gradio for making a nice UI. | |
Youtube link version. | |
Installing requirements. | |
""" | |
#!pip install gradio | |
#!pip install git+https://github.com/huggingface/transformers | |
#!pip install pytube | |
from pytube import YouTube | |
from transformers import pipeline | |
import gradio as gr | |
import os | |
"""## Building a Demo | |
Now that we've fine-tuned our model, we can build a demo to show
off its ASR capabilities! We'll make use of 🤗 Transformers
`pipeline`, which will take care of the entire ASR pipeline,
right from pre-processing the audio inputs to decoding the
model predictions.
Running the example below will generate a Gradio demo where you can enter the
URL of a YouTube video and have our fine-tuned Whisper model transcribe its audio:
""" | |
# Speech-recognition pipeline wrapping the fine-tuned Whisper checkpoint.
# Whisper works on 30-second windows, so chunk_length_s=30 lets the pipeline
# split longer recordings into chunks and transcribe the whole audio instead
# of only its beginning.
pipe = pipeline(
    task="automatic-speech-recognition",
    model="Victorlopo21/whisper-medium-gl-30",  # change to "your-username/the-name-you-picked"
    chunk_length_s=30,
)
def get_audio(url):
    """Download the audio track of a YouTube video and return its local path.

    The stream is downloaded into the current working directory and the
    resulting file is renamed so that its extension becomes ``.wav``.  Only
    the file name changes; no audio conversion is performed here.

    Args:
        url: Address of the YouTube video.

    Returns:
        Path of the renamed audio file.

    Raises:
        ValueError: If the video offers no audio-only stream.
    """
    audio_streams = list(YouTube(url).streams.filter(only_audio=True))
    if not audio_streams:
        raise ValueError(f"No audio-only stream available for {url!r}")

    # Keep the original preference for the second audio-only stream, but fall
    # back to the first one instead of failing with IndexError when the video
    # exposes a single stream.
    stream = audio_streams[1] if len(audio_streams) > 1 else audio_streams[0]

    downloaded_path = stream.download(output_path=".")
    base, _ext = os.path.splitext(downloaded_path)
    wav_path = base + ".wav"

    # os.replace overwrites a file left over from an earlier request on every
    # platform, whereas os.rename raises on Windows when the target exists.
    os.replace(downloaded_path, wav_path)
    return wav_path
def transcribe_url(url):
    """Transcribe the audio of a YouTube video.

    Args:
        url: Address of the YouTube video, as entered in the demo's text box.

    Returns:
        The ``'text'`` entry of the result that the module-level ``pipe``
        produces for the downloaded audio file.
    """
    audio_path = get_audio(url)
    try:
        return pipe(audio_path)["text"]
    finally:
        # Every request downloads a new file into the working directory;
        # delete it once transcription is done (or has failed) so that a
        # long-running demo does not fill the disk.
        try:
            os.remove(audio_path)
        except FileNotFoundError:
            pass
# Gradio front end: a single text input (the YouTube URL) is passed to
# transcribe_url and the returned transcript is shown in a text output.
iface = gr.Interface(
    title="Whisper Medium Galician",
    description="Realtime demo for Galician speech recognition of a YouTube video using a fine-tuned Whisper medium model.",
    fn=transcribe_url,
    inputs="text",
    outputs="text",
)

# Start the web app; debug=True is forwarded to Gradio's launch().
iface.launch(debug=True)
# Short youtube video to hear | |
# https://www.youtube.com/watch?v=Z2SjeZJZi6s&ab_channel=rimc7 | |
# TO TRY |