From f53a161d55bc6cffc2aab066697be14753cd85c7 Mon Sep 17 00:00:00 2001
From: Jong Wook Kim
Date: Fri, 5 May 2023 01:40:00 -0700
Subject: [PATCH] Fix #1293

---
 whisper/timing.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/whisper/timing.py b/whisper/timing.py
index 1a73eaa..979d9d0 100644
--- a/whisper/timing.py
+++ b/whisper/timing.py
@@ -215,6 +215,8 @@ def find_alignment(
 
     words, word_tokens = tokenizer.split_to_word_tokens(text_tokens + [tokenizer.eot])
     word_boundaries = np.pad(np.cumsum([len(t) for t in word_tokens[:-1]]), (1, 0))
+    if len(word_boundaries) <= 1:
+        return []
 
     jumps = np.pad(np.diff(text_indices), (1, 0), constant_values=1).astype(bool)
     jump_times = time_indices[jumps] / TOKENS_PER_SECOND