Spaces:
Sleeping
Sleeping
File size: 2,336 Bytes
69bf66b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 |
from pytube import YouTube
from transformers import pipeline
import streamlit as st
import os
model = whisper.load_model("base")
summarizer = pipeline("summarization")
def get_audio_from_video(file_path):
# You can use a library like moviepy or ffmpeg to extract audio from the video
# For simplicity, I'm assuming the video is already in a format that the model can transcribe
return file_path
def get_audio(url):
yt = YouTube(url)
video = yt.streams.filter(only_audio=True).first()
out_file = video.download(output_path=".")
base, ext = os.path.splitext(out_file)
new_file = base + '.mp3'
os.rename(out_file, new_file)
return new_file
def get_text(url=None, file_path=None):
if url:
result = model.transcribe(get_audio(url))
elif file_path:
result = model.transcribe(get_audio_from_video(file_path))
return result['text']
def get_summary(url=None, file_path=None):
article = get_text(url, file_path)
b = summarizer(article)
b = b[0]['summary_text']
return b
st.title("Youtube video transcription with OpenAI's Whisper")
st.write("Enter the link of any youtube video or upload a video file to get the transcription and a summary in the form of text.")
option = st.radio('Choose an option', ['Get the transcription of any Youtube video', 'Summary of Youtube video', 'Upload a video file'])
if option == 'Get the transcription of any Youtube video':
url1 = st.text_input('Enter the Youtube video URL')
if st.button('Get Transcription'):
transcription = get_text(url1)
st.text_area('Transcription of the video', transcription)
elif option == 'Summary of Youtube video':
url2 = st.text_input('Enter the Youtube video URL')
if st.button('Get Summary'):
summary = get_summary(url2)
st.text_area('Summary text of the Youtube Video', summary)
elif option == 'Upload a video file':
uploaded_file = st.file_uploader("Choose a video file", type=["mp4"])
if uploaded_file:
video_path = "temp_video_file.mp4"
with open(video_path, "wb") as f:
f.write(uploaded_file.getvalue())
if st.button('Transcribe Uploaded Video'):
transcription = get_text(file_path=video_path)
st.text_area('Transcription of the uploaded video file', transcription) |