Merge 089f08945b4934eb6a453c61492fe2d7835e115a into c0d2f624c09dc18e709e37c2ad90c039a4eb72a2

This commit is contained in:
Yuekai Zhang 2025-06-27 02:27:48 +00:00 committed by GitHub
commit 32bd171005
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -730,7 +730,8 @@ class DecodingTask:
)
]
-# repeat text tensors by the group size, for beam search or best-of-n sampling
+# repeat the audio & text tensors by the group size, for beam search or best-of-n sampling
+audio_features = audio_features.repeat_interleave(self.n_group, dim=0)
tokens = tokens.repeat_interleave(self.n_group, dim=0).to(audio_features.device)
# call the main sampling loop