Spaces:

Kr08
/

ASR_gradio

Build error

Kr08 committed on Aug 27, 2024

Commit

7dccca6

verified ·

1 Parent(s): 605a998

Update audio_processing.py

Files changed (1) hide show

audio_processing.py CHANGED Viewed

@@ -3,6 +3,7 @@ import whisper
 import numpy as np
 import torchaudio as ta
 import gradio as gr
 from model_utils import get_processor, get_model, get_whisper_model_small, get_device
 from config import SAMPLING_RATE, CHUNK_LENGTH_S
 import subprocess
@@ -10,12 +11,14 @@ import subprocess
 import subprocess
 import torchaudio as ta
 def resample_with_ffmpeg(input_file, output_file, target_sr=16000):
     """Resample an audio file by invoking the ``ffmpeg`` command-line tool.

     Runs ``ffmpeg -i <input_file> -ar <target_sr> <output_file>`` and waits
     for the process to finish.

     Args:
         input_file: Path handed to ffmpeg's ``-i`` option.
         output_file: Path ffmpeg is asked to write.
         target_sr: Value handed to ffmpeg's ``-ar`` option (default 16000).

     Raises:
         subprocess.CalledProcessError: If ffmpeg exits with a non-zero status.
     """
     ffmpeg_args = ['ffmpeg']
     ffmpeg_args += ['-i', input_file]
     ffmpeg_args += ['-ar', str(target_sr)]
     ffmpeg_args.append(output_file)
     # check=True converts a non-zero ffmpeg exit status into an exception.
     subprocess.run(ffmpeg_args, check=True)
 def detect_language(audio):
     whisper_model = get_whisper_model_small()
@@ -50,6 +53,7 @@ def detect_language(audio):
     return detected_lang
 def process_long_audio(audio, task="transcribe", language=None):
     if audio[0] != SAMPLING_RATE:
         # Save the input audio to a file for ffmpeg processing
@@ -106,6 +110,7 @@ def process_long_audio(audio, task="transcribe", language=None):
     return " ".join(results)
 def process_audio(audio):
     if audio is None:
         return "No file uploaded", "", ""

 import numpy as np
 import torchaudio as ta
 import gradio as gr
+import spaces
 from model_utils import get_processor, get_model, get_whisper_model_small, get_device
 from config import SAMPLING_RATE, CHUNK_LENGTH_S
 import subprocess
 import subprocess
 import torchaudio as ta
 def resample_with_ffmpeg(input_file, output_file, target_sr=16000):
     """Resample an audio file by invoking the ``ffmpeg`` command-line tool.

     Runs ``ffmpeg -i <input_file> -ar <target_sr> <output_file>`` and waits
     for the process to finish.

     Args:
         input_file: Path handed to ffmpeg's ``-i`` option.
         output_file: Path ffmpeg is asked to write.
         target_sr: Value handed to ffmpeg's ``-ar`` option (default 16000).

     Raises:
         subprocess.CalledProcessError: If ffmpeg exits with a non-zero status.
     """
     ffmpeg_args = ['ffmpeg']
     ffmpeg_args += ['-i', input_file]
     ffmpeg_args += ['-ar', str(target_sr)]
     ffmpeg_args.append(output_file)
     # check=True converts a non-zero ffmpeg exit status into an exception.
     subprocess.run(ffmpeg_args, check=True)
++@spaces.GPU
 def detect_language(audio):
     whisper_model = get_whisper_model_small()
     return detected_lang
++@spaces.GPU
 def process_long_audio(audio, task="transcribe", language=None):
     if audio[0] != SAMPLING_RATE:
         # Save the input audio to a file for ffmpeg processing
     return " ".join(results)
++@spaces.GPU
 def process_audio(audio):
     if audio is None:
         return "No file uploaded", "", ""