Spaces:
Running
Running
jhj0517
committed on
Commit
·
eec0c16
1
Parent(s):
ddbe0b6
Fix VAD syntax & add VAD handling case
Browse files
modules/whisper/base_transcription_pipeline.py
CHANGED
|
@@ -135,12 +135,17 @@ class BaseTranscriptionPipeline(ABC):
|
|
| 135 |
speech_pad_ms=vad_params.speech_pad_ms
|
| 136 |
)
|
| 137 |
|
| 138 |
-
|
| 139 |
audio=audio,
|
| 140 |
vad_parameters=vad_options,
|
| 141 |
progress=progress
|
| 142 |
)
|
| 143 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 144 |
result, elapsed_time = self.transcribe(
|
| 145 |
audio,
|
| 146 |
progress,
|
|
@@ -150,7 +155,7 @@ class BaseTranscriptionPipeline(ABC):
|
|
| 150 |
if vad_params.vad_filter:
|
| 151 |
result = self.vad.restore_speech_timestamps(
|
| 152 |
segments=result,
|
| 153 |
-
speech_chunks=
|
| 154 |
)
|
| 155 |
|
| 156 |
if diarization_params.is_diarize:
|
|
|
|
| 135 |
speech_pad_ms=vad_params.speech_pad_ms
|
| 136 |
)
|
| 137 |
|
| 138 |
+
vad_processed, speech_chunks = self.vad.run(
|
| 139 |
audio=audio,
|
| 140 |
vad_parameters=vad_options,
|
| 141 |
progress=progress
|
| 142 |
)
|
| 143 |
|
| 144 |
+
if vad_processed.size > 0:
|
| 145 |
+
audio = vad_processed
|
| 146 |
+
else:
|
| 147 |
+
vad_params.vad_filter = False
|
| 148 |
+
|
| 149 |
result, elapsed_time = self.transcribe(
|
| 150 |
audio,
|
| 151 |
progress,
|
|
|
|
| 155 |
if vad_params.vad_filter:
|
| 156 |
result = self.vad.restore_speech_timestamps(
|
| 157 |
segments=result,
|
| 158 |
+
speech_chunks=speech_chunks,
|
| 159 |
)
|
| 160 |
|
| 161 |
if diarization_params.is_diarize:
|