Better whisper-ctranslate vad filter option

2024-07-03 17:08:32 +02:00 · 2024-07-03 17:08:32 +02:00 · 07058e17c3
parent efa58350eb
commit 07058e17c3
1 changed files with 4 additions and 0 deletions
--- a/packages/transcription/src/whisper/transcriber/ctranslate2-transcriber.ts
+++ b/packages/transcription/src/whisper/transcriber/ctranslate2-transcriber.ts
@@ -37,6 +37,10 @@ export class Ctranslate2Transcriber extends OpenaiTranscriber {
      'True',
      '--vad_filter',
      'true',
      // Use a 5s minimum silence duration for the VAD filter: this gives better precision
      // We mainly use vad_filter to improve language detection, which relies on the first 30 seconds of the video (so an intro without any voice is problematic)
      '--vad_min_silence_duration_ms',
      '5000',
      '--output_format',
      'all',
      '--output_dir',