Transcribe on GPU

2025-11-24 14:35:57 +00:00 · 2024-09-09 19:38:39 +09:00 · 2024-09-09 19:38:39 +09:00 · 2448c6f749
commit 2448c6f749
parent ba3f3cd54b
1 changed file with 3 additions and 1 deletion
--- a/whisper/transcribe.py
+++ b/whisper/transcribe.py
@@ -130,7 +130,9 @@ def transcribe(
        decode_options["fp16"] = False
    # Pad 30-seconds of silence to the input audio, for slicing
-    mel = log_mel_spectrogram(audio, model.dims.n_mels, padding=N_SAMPLES)
+    mel = log_mel_spectrogram(
+        audio, model.dims.n_mels, padding=N_SAMPLES, device=model.device
+    )
    content_frames = mel.shape[-1] - N_FRAMES
    content_duration = float(content_frames * HOP_LENGTH / SAMPLE_RATE)