Better whisper-ctranslate vad filter option

pull/6527/head
Chocobozzz 2024-07-03 17:08:32 +02:00
parent efa58350eb
commit 07058e17c3
No known key found for this signature in database
GPG Key ID: 583A612D890159BE
1 changed file with 4 additions and 0 deletions

View File

@ -37,6 +37,10 @@ export class Ctranslate2Transcriber extends OpenaiTranscriber {
'True', 'True',
'--vad_filter', '--vad_filter',
'true', 'true',
// Better precision with 5s of audio
// We mainly use vad_filter to improve language detection: it relies on the first 30 seconds of the video, so having no voice in that window is problematic
'--vad_min_silence_duration_ms',
'5000',
'--output_format', '--output_format',
'all', 'all',
'--output_dir', '--output_dir',