Update app.py
Browse files
app.py
CHANGED
@@ -5,9 +5,9 @@ from pydub.silence import detect_nonsilent
|
|
5 |
from pydub import AudioSegment
|
6 |
|
7 |
|
8 |
-
def get_labels(audio_fp, min_speech_duration_ms, min_silence_duration_ms, auto_merge, uppper_merge_threshold, max_segment_length, end_extension, extend_small_segments, show_duration_label):
|
9 |
audio = AudioSegment.from_file(audio_fp.name).set_channels(1)
|
10 |
-
speech_timestamps = detect_nonsilent(audio, min_silence_len=min_silence_duration_ms, silence_thresh
|
11 |
speech_timestamps = list(filter(lambda x: x[1]-x[0] > min_speech_duration_ms, speech_timestamps))
|
12 |
speech_timestamps = [{"start": s[0]/1000, "end": s[1]/1000} for s in speech_timestamps]
|
13 |
labels_str = []
|
@@ -81,7 +81,8 @@ interface = gr.Interface(
|
|
81 |
gr.Number(label="Approx Max Segment Length", value=7),
|
82 |
gr.Number(label="Extend end by (seconds)", value=0),
|
83 |
gr.Checkbox(label="Extend small segments (minimum 1.02 seconds)", value=False),
|
84 |
-
gr.Checkbox(label="Show only duration in labels", value=False)
|
|
|
85 |
],
|
86 |
[
|
87 |
gr.File(label="VAD Labels"),
|
|
|
5 |
from pydub import AudioSegment
|
6 |
|
7 |
|
8 |
+
def get_labels(audio_fp, min_speech_duration_ms, min_silence_duration_ms, auto_merge, uppper_merge_threshold, max_segment_length, end_extension, extend_small_segments, show_duration_label, sil_thresh):
|
9 |
audio = AudioSegment.from_file(audio_fp.name).set_channels(1)
|
10 |
+
speech_timestamps = detect_nonsilent(audio, min_silence_len=min_silence_duration_ms, silence_thresh=int(sil_thresh))
|
11 |
speech_timestamps = list(filter(lambda x: x[1]-x[0] > min_speech_duration_ms, speech_timestamps))
|
12 |
speech_timestamps = [{"start": s[0]/1000, "end": s[1]/1000} for s in speech_timestamps]
|
13 |
labels_str = []
|
|
|
81 |
gr.Number(label="Approx Max Segment Length", value=7),
|
82 |
gr.Number(label="Extend end by (seconds)", value=0),
|
83 |
gr.Checkbox(label="Extend small segments (minimum 1.02 seconds)", value=False),
|
84 |
+
gr.Checkbox(label="Show only duration in labels", value=False),
|
85 |
+
gr.Textbox(label="Silence Threshold", value="-45")
|
86 |
],
|
87 |
[
|
88 |
gr.File(label="VAD Labels"),
|