deepsync committed on
Commit
75da7a9
·
verified ·
1 Parent(s): 01a403c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -5,9 +5,9 @@ from pydub.silence import detect_nonsilent
5
  from pydub import AudioSegment
6
 
7
 
8
- def get_labels(audio_fp, min_speech_duration_ms, min_silence_duration_ms, auto_merge, uppper_merge_threshold, max_segment_length, end_extension, extend_small_segments, show_duration_label):
9
  audio = AudioSegment.from_file(audio_fp.name).set_channels(1)
10
- speech_timestamps = detect_nonsilent(audio, min_silence_len=min_silence_duration_ms, silence_thresh=-60)
11
  speech_timestamps = list(filter(lambda x: x[1]-x[0] > min_speech_duration_ms, speech_timestamps))
12
  speech_timestamps = [{"start": s[0]/1000, "end": s[1]/1000} for s in speech_timestamps]
13
  labels_str = []
@@ -81,7 +81,8 @@ interface = gr.Interface(
81
  gr.Number(label="Approx Max Segment Length", value=7),
82
  gr.Number(label="Extend end by (seconds)", value=0),
83
  gr.Checkbox(label="Extend small segments (minimum 1.02 seconds)", value=False),
84
- gr.Checkbox(label="Show only duration in labels", value=False)
 
85
  ],
86
  [
87
  gr.File(label="VAD Labels"),
 
5
  from pydub import AudioSegment
6
 
7
 
8
+ def get_labels(audio_fp, min_speech_duration_ms, min_silence_duration_ms, auto_merge, uppper_merge_threshold, max_segment_length, end_extension, extend_small_segments, show_duration_label, sil_thresh):
9
  audio = AudioSegment.from_file(audio_fp.name).set_channels(1)
10
+ speech_timestamps = detect_nonsilent(audio, min_silence_len=min_silence_duration_ms, silence_thresh=int(sil_thresh))
11
  speech_timestamps = list(filter(lambda x: x[1]-x[0] > min_speech_duration_ms, speech_timestamps))
12
  speech_timestamps = [{"start": s[0]/1000, "end": s[1]/1000} for s in speech_timestamps]
13
  labels_str = []
 
81
  gr.Number(label="Approx Max Segment Length", value=7),
82
  gr.Number(label="Extend end by (seconds)", value=0),
83
  gr.Checkbox(label="Extend small segments (minimum 1.02 seconds)", value=False),
84
+ gr.Checkbox(label="Show only duration in labels", value=False).
85
+ gr.Textbox(label="Silence Threshold", value="-45")
86
  ],
87
  [
88
  gr.File(label="VAD Labels"),