Set "whisper_implementation" to "faster-whisper" in config.json5
Browse files- config.json5 +4 -4
config.json5
CHANGED
|
@@ -48,7 +48,7 @@
|
|
| 48 |
// * WEBUI options *
|
| 49 |
|
| 50 |
// Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
|
| 51 |
-
"input_audio_max_duration":
|
| 52 |
// True to share the app on HuggingFace.
|
| 53 |
"share": false,
|
| 54 |
// The host or IP to bind to. If None, bind to localhost.
|
|
@@ -65,10 +65,10 @@
|
|
| 65 |
// The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
|
| 66 |
// Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
|
| 67 |
// or whisper (requirements.txt)
|
| 68 |
-
"whisper_implementation": "whisper",
|
| 69 |
|
| 70 |
// The default model name.
|
| 71 |
-
"default_model_name": "
|
| 72 |
// The default VAD.
|
| 73 |
"default_vad": "silero-vad",
|
| 74 |
// A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
|
|
@@ -94,7 +94,7 @@
|
|
| 94 |
// The window size (in seconds) to merge voice segments
|
| 95 |
"vad_merge_window": 5,
|
| 96 |
// The maximum size (in seconds) of a voice segment
|
| 97 |
-
"vad_max_merge_size":
|
| 98 |
// The padding (in seconds) to add to each voice segment
|
| 99 |
"vad_padding": 1,
|
| 100 |
// Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)
|
|
|
|
| 48 |
// * WEBUI options *
|
| 49 |
|
| 50 |
// Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
|
| 51 |
+
"input_audio_max_duration": 1800,
|
| 52 |
// True to share the app on HuggingFace.
|
| 53 |
"share": false,
|
| 54 |
// The host or IP to bind to. If None, bind to localhost.
|
|
|
|
| 65 |
// The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
|
| 66 |
// Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
|
| 67 |
// or whisper (requirements.txt)
|
| 68 |
+
"whisper_implementation": "faster-whisper",
|
| 69 |
|
| 70 |
// The default model name.
|
| 71 |
+
"default_model_name": "large-v2",
|
| 72 |
// The default VAD.
|
| 73 |
"default_vad": "silero-vad",
|
| 74 |
// A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
|
|
|
|
| 94 |
// The window size (in seconds) to merge voice segments
|
| 95 |
"vad_merge_window": 5,
|
| 96 |
// The maximum size (in seconds) of a voice segment
|
| 97 |
+
"vad_max_merge_size": 90,
|
| 98 |
// The padding (in seconds) to add to each voice segment
|
| 99 |
"vad_padding": 1,
|
| 100 |
// Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)
|