jhj0517 commited on
Commit
eec0c16
·
1 Parent(s): ddbe0b6

Fix VAD syntax & add vad handling case

Browse files
modules/whisper/base_transcription_pipeline.py CHANGED
@@ -135,12 +135,17 @@ class BaseTranscriptionPipeline(ABC):
135
  speech_pad_ms=vad_params.speech_pad_ms
136
  )
137
 
138
- audio, speech_chunks = self.vad.run(
139
  audio=audio,
140
  vad_parameters=vad_options,
141
  progress=progress
142
  )
143
 
 
 
 
 
 
144
  result, elapsed_time = self.transcribe(
145
  audio,
146
  progress,
@@ -150,7 +155,7 @@ class BaseTranscriptionPipeline(ABC):
150
  if vad_params.vad_filter:
151
  result = self.vad.restore_speech_timestamps(
152
  segments=result,
153
- speech_chunks=vad_params.speech_chunks,
154
  )
155
 
156
  if diarization_params.is_diarize:
 
135
  speech_pad_ms=vad_params.speech_pad_ms
136
  )
137
 
138
+ vad_processed, speech_chunks = self.vad.run(
139
  audio=audio,
140
  vad_parameters=vad_options,
141
  progress=progress
142
  )
143
 
144
+ if vad_processed.size > 0:
145
+ audio = vad_processed
146
+ else:
147
+ vad_params.vad_filter = False
148
+
149
  result, elapsed_time = self.transcribe(
150
  audio,
151
  progress,
 
155
  if vad_params.vad_filter:
156
  result = self.vad.restore_speech_timestamps(
157
  segments=result,
158
+ speech_chunks=speech_chunks,
159
  )
160
 
161
  if diarization_params.is_diarize: