This commit is contained in:
unknown
2025-12-28 15:06:32 -08:00
parent 1a52dabf09
commit 5979a2484c

View File

@@ -142,7 +142,7 @@ class XTTSv2(TTSUtils, TTSRegistry, name='xtts'):
audio_sentence = result.get('wav')
if is_audio_data_valid(audio_sentence):
if isinstance(audio_sentence, torch.Tensor):
audio_tensor = audio_sentence.detach().cpu().unsqueeze(0)
audio_tensor = audio_sentence.detach().unsqueeze(0)
elif isinstance(audio_sentence, np.ndarray):
audio_tensor = torch.from_numpy(audio_sentence).unsqueeze(0)
elif isinstance(audio_sentence, (list, tuple)):
@@ -151,7 +151,7 @@ class XTTSv2(TTSUtils, TTSRegistry, name='xtts'):
error = f"Unsupported XTTSv2 wav type: {type(audio_sentence)}"
print(error)
return False
audio_tensor = audio_tensor.detach().cpu()
audio_tensor = audio_tensor.cpu()
if sentence[-1].isalnum() or sentence[-1] == '':
audio_tensor = trim_audio(audio_tensor.squeeze(), self.params['samplerate'], 0.001, trim_audio_buffer).unsqueeze(0)
if audio_tensor is not None and audio_tensor.numel() > 0: