Transcribe on GPU

This commit is contained in:
take0x 2024-09-09 19:38:39 +09:00
parent ba3f3cd54b
commit 2448c6f749

View File

@@ -130,7 +130,9 @@ def transcribe(
decode_options["fp16"] = False decode_options["fp16"] = False
# Pad 30-seconds of silence to the input audio, for slicing # Pad 30-seconds of silence to the input audio, for slicing
mel = log_mel_spectrogram(audio, model.dims.n_mels, padding=N_SAMPLES) mel = log_mel_spectrogram(
audio, model.dims.n_mels, padding=N_SAMPLES, device=model.device
)
content_frames = mel.shape[-1] - N_FRAMES content_frames = mel.shape[-1] - N_FRAMES
content_duration = float(content_frames * HOP_LENGTH / SAMPLE_RATE) content_duration = float(content_frames * HOP_LENGTH / SAMPLE_RATE)