Set "whisper_implementation" to "faster-whisper" in config.json5
Browse files- config.json5 +4 -4
config.json5
CHANGED
@@ -48,7 +48,7 @@
|
|
48 |
// * WEBUI options *
|
49 |
|
50 |
// Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
|
51 |
-
"input_audio_max_duration":
|
52 |
// True to share the app on HuggingFace.
|
53 |
"share": false,
|
54 |
// The host or IP to bind to. If None, bind to localhost.
|
@@ -65,10 +65,10 @@
|
|
65 |
// The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
|
66 |
// Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
|
67 |
// or whisper (requirements.txt)
|
68 |
-
"whisper_implementation": "whisper",
|
69 |
|
70 |
// The default model name.
|
71 |
-
"default_model_name": "
|
72 |
// The default VAD.
|
73 |
"default_vad": "silero-vad",
|
74 |
// A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
|
@@ -94,7 +94,7 @@
|
|
94 |
// The window size (in seconds) to merge voice segments
|
95 |
"vad_merge_window": 5,
|
96 |
// The maximum size (in seconds) of a voice segment
|
97 |
-
"vad_max_merge_size":
|
98 |
// The padding (in seconds) to add to each voice segment
|
99 |
"vad_padding": 1,
|
100 |
// Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)
|
|
|
48 |
// * WEBUI options *
|
49 |
|
50 |
// Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
|
51 |
+
"input_audio_max_duration": 1800,
|
52 |
// True to share the app on HuggingFace.
|
53 |
"share": false,
|
54 |
// The host or IP to bind to. If None, bind to localhost.
|
|
|
65 |
// The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
|
66 |
// Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
|
67 |
// or whisper (requirements.txt)
|
68 |
+
"whisper_implementation": "faster-whisper",
|
69 |
|
70 |
// The default model name.
|
71 |
+
"default_model_name": "large-v2",
|
72 |
// The default VAD.
|
73 |
"default_vad": "silero-vad",
|
74 |
// A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
|
|
|
94 |
// The window size (in seconds) to merge voice segments
|
95 |
"vad_merge_window": 5,
|
96 |
// The maximum size (in seconds) of a voice segment
|
97 |
+
"vad_max_merge_size": 90,
|
98 |
// The padding (in seconds) to add to each voice segment
|
99 |
"vad_padding": 1,
|
100 |
// Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)
|