Spaces:

morsczx
/

asr_pipeline

Sleeping

Manjot Singh committed on Sep 1, 2024

Commit

cf21473

1 Parent(s): 5865692

asr_transcription

Files changed (5) hide show

.gitignore ADDED Viewed

+__pycache__/
+.venv/
+*.pyc

app.py CHANGED Viewed

@@ -1,7 +1,24 @@
 import gradio as gr
-def greet(name):
-    return "Hello " + name + "!!"
-demo = gr.Interface(fn=greet, inputs="text", outputs="text")
-demo.launch()

 import gradio as gr
+from audio_processing import process_audio, print_results
+def transcribe_audio(audio_file):
+    language_segments, text_segments = process_audio(audio_file)
+    output = "Detected language changes:\n\n"
+    for lang_segment in language_segments:
+        output += f"Language: {lang_segment['language']}\n"
+        output += f"Time: {lang_segment['start']:.2f}s - {lang_segment['end']:.2f}s\n\n"
+    output += "Transcription:\n\n"
+    for segment in text_segments:
+        output += f"[{segment['start']:.2f}s - {segment['end']:.2f}s] {segment['text']}\n"
+    return output
+# Web UI: one audio input wired to transcribe_audio, with the returned
+# report displayed as plain text.
+iface = gr.Interface(
+    fn=transcribe_audio,
+    # type="filepath": the callback receives the audio as a path string
+    # (per the Gradio Audio component docs) rather than raw samples.
+    inputs=gr.Audio(type="filepath"),
+    outputs="text",
+    title="WhisperX Audio Transcription"
+)
+# NOTE: launched at module top level (no __main__ guard), so importing this
+# module starts the app.
+iface.launch()

flagged/audio_file/e6332957799e9944ecd7/audio.wav ADDED Viewed

Binary file (238 kB). View file

flagged/log.csv ADDED Viewed


1	+ audio_file,output,flag,username,timestamp
2	+ flagged/audio_file/e6332957799e9944ecd7/audio.wav,,,,2024-08-31 11:46:39.944110

requirements.txt CHANGED Viewed

@@ -1,9 +1,14 @@
-torch
-torchaudio
 transformers
 git+https://github.com/m-bain/whisperx.git
 numpy
 pandas
 pyannote.audio
 pyperclip
-sentencepiece

 transformers
 git+https://github.com/m-bain/whisperx.git
 numpy
 pandas
 pyannote.audio
 pyperclip
+sentencepiece
+gradio
+speechbrain
+torch>=2
+torchaudio>=2
+faster-whisper==1.0.0
+setuptools>=65
+nltk