Spaces:

Victorlopo21
/

Lab2Youtube

Build error

App Files Files Community

Victorlopo21 committed on Dec 8, 2022

Commit

6fa0583

•

1 Parent(s): 32c6ac4

Upload whisper_youtube.py

Browse files

Files changed (1) hide show

whisper_youtube.py +75 -0

whisper_youtube.py ADDED Viewed

	@@ -0,0 +1,75 @@

+# -*- coding: utf-8 -*-
+"""whisper_youtube.ipynb
+Automatically generated by Colaboratory.
+Original file is located at
+    https://colab.research.google.com/drive/1spmA-7Un5TA6ahuCeO62BUS_ME6zPuUx
+# Using gradio for making a nice UI.
+Youtube link version.
+Installing requirements.
+"""
+!pip install gradio
+!pip install git+https://github.com/huggingface/transformers
+!pip install pytube
+from pytube import YouTube
+from transformers import pipeline
+import gradio as gr
+import os
+from transformers import WhisperProcessor
+processor = WhisperProcessor.from_pretrained("openai/whisper-small", language="Galician", task="transcribe")
+from transformers import WhisperTokenizer
+tokenizer = WhisperTokenizer.from_pretrained("openai/whisper-small", language="Galician", task="transcribe")
+"""## Building a Demo
+Now that we've fine-tuned our model we can build a demo to show
+off its ASR capabilities! We'll make use of 🤗 Transformers
+`pipeline`, which will take care of the entire ASR pipeline,
+right from pre-processing the audio inputs to decoding the
+model predictions.
+Running the example below will generate a Gradio demo where we can input audio to
+our fine-tuned Whisper model to transcribe the corresponding text:
+"""
+pipe = pipeline(model="Victorlopo21/whisper-medium-gl-30")  # change to "your-username/the-name-you-picked"
+def get_audio(url):
+  yt = YouTube(url)
+  video = yt.streams.filter(only_audio=True)[1]
+  out_file=video.download(output_path=".")
+  base, ext = os.path.splitext(out_file)
+  new_file = base+'.wav'
+  os.rename(out_file, new_file)
+  a = new_file
+  return a
+def transcribe_url(url):
+    text = pipe(get_audio(url))['text']
+    return text
+iface = gr.Interface(
+    fn=transcribe_url,
+    inputs='text',
+    outputs="text",
+    title="Whisper Medium Galician",
+    description="Realtime demo for Galician speech recognition using a fine-tuned Whisper medium model.",
+)
+iface.launch(debug=True)
+# Short youtube video to hear
+# https://www.youtube.com/watch?v=Z2SjeZJZi6s&ab_channel=rimc7
+# TO TRY