avans06 committed on
Commit
2a5f69c
1 Parent(s): 4c650d7

Set "whisper_implementation" to "faster-whisper" in config.json5

Browse files
Files changed (1) hide show
  1. config.json5 +4 -4
config.json5 CHANGED
@@ -48,7 +48,7 @@
48
  // * WEBUI options *
49
 
50
  // Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
51
- "input_audio_max_duration": 600,
52
  // True to share the app on HuggingFace.
53
  "share": false,
54
  // The host or IP to bind to. If None, bind to localhost.
@@ -65,10 +65,10 @@
65
  // The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
66
  // Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
67
  // or whisper (requirements.txt)
68
- "whisper_implementation": "whisper",
69
 
70
  // The default model name.
71
- "default_model_name": "medium",
72
  // The default VAD.
73
  "default_vad": "silero-vad",
74
  // A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
@@ -94,7 +94,7 @@
94
  // The window size (in seconds) to merge voice segments
95
  "vad_merge_window": 5,
96
  // The maximum size (in seconds) of a voice segment
97
- "vad_max_merge_size": 30,
98
  // The padding (in seconds) to add to each voice segment
99
  "vad_padding": 1,
100
  // Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)
 
48
  // * WEBUI options *
49
 
50
  // Maximum audio file length in seconds, or -1 for no limit. Ignored by CLI.
51
+ "input_audio_max_duration": 1800,
52
  // True to share the app on HuggingFace.
53
  "share": false,
54
  // The host or IP to bind to. If None, bind to localhost.
 
65
  // The default implementation to use for Whisper. Can be "whisper" or "faster-whisper".
66
  // Note that you must either install the requirements for faster-whisper (requirements-fasterWhisper.txt)
67
  // or whisper (requirements.txt)
68
+ "whisper_implementation": "faster-whisper",
69
 
70
  // The default model name.
71
+ "default_model_name": "large-v2",
72
  // The default VAD.
73
  "default_vad": "silero-vad",
74
  // A comma-delimited list of CUDA devices to use for parallel processing. If None, disable parallel processing.
 
94
  // The window size (in seconds) to merge voice segments
95
  "vad_merge_window": 5,
96
  // The maximum size (in seconds) of a voice segment
97
+ "vad_max_merge_size": 90,
98
  // The padding (in seconds) to add to each voice segment
99
  "vad_padding": 1,
100
  // Whether or not to prepend the initial prompt to each VAD segment (prepend_all_segments), or just the first segment (prepend_first_segment)