Spaces:

Nathanotal
/

GuessTheTranscription

Runtime error

App Files Files Community

Nathanotal committed on Dec 3, 2022

Commit

d8b182e

1 Parent(s): 6b90fe2

initial

Browse files

Files changed (2) hide show

requirements.txt +5 -0
spel.py +170 -0

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+yt_dlp
+ffmpeg-python
+gradio
+huggingface_hub
+transformers

spel.py ADDED Viewed

	@@ -0,0 +1,170 @@

+"""## Divide the video into one 10s before and one 10s after"""
+# Login to HuggingFace somehow (todo)
+"""## Convert to audio
+## Get model
+"""
+from transformers import pipeline
+# Build the "Nathanotal/whisper-small-hi" pipeline once at module import;
+# transcribe() below calls it and reads the "text" field of its result.
+pipe = pipeline(model="Nathanotal/whisper-small-hi")  # change to "your-username/the-name-you-picked"
+def transcribe(audio):
+    text = pipe(audio)["text"]
+    return text
+"""## Download and trim the video"""
+# Commented out IPython magic to ensure Python compatibility.
+def downloadAndTranscribeVideo(source_url):
+  """**Input url to youtube video**"""
+  if "=" in source_url:
+    id = source_url.split('=', 1)[1]
+  else:
+    id = source_url.split('/')[-1]
+  # Empty folder
+#   %rm -rf '/content/drive/My Drive/ID2223/LAB2/'
+  """**Create output folder**"""
+  # change this to /content/drive/My Drive/folder_you_want
+  output_folder = '/content/drive/My Drive/ID2223/LAB2/'
+  import os
+  def my_mkdirs(folder):
+    if os.path.exists(folder)==False:
+      os.makedirs(folder)
+  my_mkdirs('/content/tmp/')
+  my_mkdirs(output_folder)
+  # Get URLs to video file and audio file
+  # Attempt to get 720p clip, else get best possible quality
+  try:
+    video_url, audio_url = !yt-dlp -g -f bv[height=720][ext=webm]+ba[ext=m4a] "{source_url}"
+  except:
+    video_url, audio_url = !yt-dlp -g -f bv[ext=webm]+ba[ext=m4a] "{source_url}"
+  print('Video:', video_url)
+  print('Audio:', audio_url)
+  """**Download part of video and audio files**"""
+  temp_video = "temp_video.mkv"
+  temp_audio = "temp_audio.m4a"
+  # Download video file (first 10 seconds)
+  !ffmpeg -probesize 10M -y -i "{video_url}" -ss 00:00:00 -t 00:00:10 -c copy "{output_folder}{temp_video}"
+  # Download audio file (first 10 seconds)
+  !ffmpeg -probesize 10M -y -i "{audio_url}" -ss 00:00:00 -t 00:00:10 -c copy "{output_folder}{temp_audio}"
+  """**MUX video and audio files**"""
+  temp_output = "output.mp4"
+  # MUX video and audio files into final output [mkv]
+  !ffmpeg  -hide_banner -loglevel error -y -i "{output_folder}{temp_video}" -i "{output_folder}{temp_audio}" -c copy "{output_folder}{temp_output}"
+  first10Video = "first10Video.mp4"
+  second10Video = "second10Video.mp4"
+  !ffmpeg -hide_banner -loglevel error -y -i "{output_folder}{temp_output}" -ss 00:00:00 -to 00:00:05 -c copy "{output_folder}{first10Video}"
+  !ffmpeg -hide_banner -loglevel error -y -i "{output_folder}{temp_output}" -ss 00:00:05 -to 00:00:10 -c copy "{output_folder}{second10Video}"
+  first10Audio = "first10Audio.m4a"
+  second10Audio = "second10Audio.m4a"
+  !ffmpeg -hide_banner -loglevel error -y -i "{output_folder}{first10Video}" -vn -acodec copy "{output_folder}{first10Audio}"
+  !ffmpeg -hide_banner -loglevel error -y -i "{output_folder}{second10Video}" -vn -acodec copy "{output_folder}{second10Audio}"
+  first10AudioFinal = "first10AudioFinal.mp3"
+  second10AudioFinal = "second10AudioFinal.mp3"
+  !ffmpeg -i "{output_folder}{first10Audio}" -c:v copy -c:a libmp3lame -q:a 4 "{output_folder}{first10AudioFinal}"
+  !ffmpeg -i "{output_folder}{second10Audio}" -c:v copy -c:a libmp3lame -q:a 4 "{output_folder}{second10AudioFinal}"
+  firstVideoText = transcribe('/content/drive/My Drive/ID2223/LAB2/first10AudioFinal.mp3')
+  secondVideoText = transcribe('/content/drive/My Drive/ID2223/LAB2/second10AudioFinal.mp3')
+  # Delete temporary files
+  !rm "{output_folder}{temp_video}"
+  !rm "{output_folder}{temp_audio}"
+  return firstVideoText, secondVideoText
+# print(downloadAndTranscribeVideo('https://www.youtube.com/watch?v=93WrIPY4_4E'))
+"""## Build UI"""
+from transformers import pipeline
+import gradio as gr
+def calculateSimilarity(texta, actualText):
+  texta = texta.lower().strip()
+  actualText = actualText.lower().strip()
+  textaL = texta.split(" ")
+  actualTextL = actualText.split(" ")
+  totalWords = len(actualTextL)
+  matchingWords = 0
+  for word in textaL:
+    if word in actualTextL:
+      matchingWords += 1
+  return int(100*(matchingWords / totalWords))
+def game(videoLink, loadVideo, audio1, audio2, theState):
+  theState = theState or []
+  firstText = "test"
+  secondText = "test"
+  if loadVideo:
+    firstText, secondText = downloadAndTranscribeVideo(videoLink)
+    theState = [firstText, secondText]
+    return "/content/drive/My Drive/ID2223/LAB2/first10Video.mp4", firstText, "", "", "", "", "", "/content/drive/My Drive/ID2223/LAB2/second10Video.mp4", "", theState
+  elif len(theState) == 0:
+    return "/content/drive/My Drive/ID2223/LAB2/first10Video.mp4", "", "", "", "", "", "", "/content/drive/My Drive/ID2223/LAB2/second10Video.mp4", "", theState
+  else:
+    firstText, secondText = theState[0], theState[1]
+  t1 = transcribe(audio1)
+  t2 = transcribe(audio2)
+  t1Res = calculateSimilarity(t1, secondText)
+  t2Res = calculateSimilarity(t2, secondText)
+  res = 'The game is even, everybody wins!'
+  if t1Res > t2Res:
+    res = 'Player 1 won!'
+  elif t1Res < t2Res:
+    res = 'Player 2 won!'
+  return "/content/drive/My Drive/ID2223/LAB2/first10Video.mp4", firstText, t1, str(t1Res) + '% match', t2, str(t2Res) + '% match', res, "/content/drive/My Drive/ID2223/LAB2/second10Video.mp4", secondText, theState
+# exInputs = [[None], [None], ["/content/ut.webm"]]
+# Gradio UI wired to game(). The five inputs map positionally onto game()'s
+# parameters (videoLink, loadVideo, audio1, audio2, theState) and the ten
+# outputs map positionally onto the tuple game() returns, so the order of
+# both lists must stay in sync with that function.
+gameInterface = gr.Interface(fn=game,
+                    inputs=[gr.Textbox(label='Link to video'),
+                            gr.Checkbox(label='Load a new video'),
+                            gr.Audio(source="microphone", type="filepath", label='Player 1\'s guess'),
+                            gr.Audio(source="microphone", type="filepath", label='Player 2\'s guess'),
+                            "state"],
+                    outputs=[gr.Video(label='First ten seconds'),
+                             gr.Textbox(label='Transcription of first ten seconds'),
+                             gr.Textbox(label='Transcription for player 1'),
+                             gr.Textbox(label='Percentage match:'),
+                             gr.Textbox(label='Transcription for player 2'),
+                             gr.Textbox(label='Percentage match:'),
+                             gr.Textbox(label='Result:'),
+                             gr.Video(label='Next ten seconds'),
+                             gr.Textbox(label='Transcription of next ten seconds'),
+                             "state"],
+                    title="Game",
+                    description="Description of game"
+                    )
+# Start the app as soon as the module is executed.
+gameInterface.launch()