Skip to content

Commit 5d4fdaa

Browse files
committed
fix VAD timestamp conversion (bug introduced in 1.15.2)
1 parent 9f903c7 commit 5d4fdaa

File tree

1 file changed: +3 -3 lines changed

whisper_timestamped/transcribe.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
   3    3  __author__ = "Jérôme Louradour"
   4    4  __credits__ = ["Jérôme Louradour"]
   5    5  __license__ = "GPLv3"
   6      -__version__ = "1.15.2"
        6 +__version__ = "1.15.3"
   7    7
   8    8  # Set some environment variables
   9    9  import os
@@ -2106,7 +2106,7 @@ def remove_non_speech(audio,
2106 2106          if avoid_empty_speech:
2107 2107              segments = [(0, audio.shape[-1])]
2108 2108          else:
2109      -            return torch.Tensor([]), [], lambda t, t2 = None: do_convert_timestamps(segments, t, t2)
     2109 +            return torch.Tensor([]), [], lambda t, t2 = None: t if t2 is None else [t, t2]
2110 2110
2111 2111      audio_speech = torch.cat([audio[..., s:e] for s,e in segments], dim=-1)
2112 2112
@@ -2127,7 +2127,7 @@ def remove_non_speech(audio,
2127 2127      if not use_sample:
2128 2128          segments = [(float(s)/sample_rate, float(e)/sample_rate) for s,e in segments]
2129 2129
2130      -    return audio_speech, segments, lambda t, t2 = None: t if t2 is None else [t, t2]
     2130 +    return audio_speech, segments, lambda t, t2 = None: do_convert_timestamps(segments, t, t2)
2131 2131
2132 2132  def do_convert_timestamps(segments, t, t2 = None):
2133 2133      """

0 commit comments

Comments
 (0)