This commit is contained in:
unknown
2025-05-17 03:45:29 -07:00
parent 38868147d1
commit 7defcf92cf
4 changed files with 12 additions and 9 deletions

View File

@@ -27,5 +27,6 @@ translate
tqdm
unidic
pymupdf4llm
-coqui-tts>=0.26.1
+torch
+coqui-tts
torchvggish

View File

@@ -483,7 +483,7 @@ class TTSManager:
speakers_path = hf_hub_download(repo_id=models[self.session['tts_engine']]['internal']['repo'], filename="speakers_xtts.pth", cache_dir=self.cache_dir)
loaded_builtin_speakers[self.session['tts_engine']] = torch.load(speakers_path)
speakers_list = loaded_builtin_speakers[self.session['tts_engine']]
-if processed_voice_key in loaded_processed_voices.keys():
+if processed_voice_key is not None and loaded_processed_voices[processed_voice_key]:
self.params['gpt_cond_latent'], self.params['speaker_embedding'] = loaded_processed_voices[processed_voice_key].values()
else:
msg = 'Computing speaker latents...'
@@ -526,7 +526,7 @@ class TTSManager:
msg = f"{self.session['tts_engine']} custom model not implemented yet!"
print(msg)
else:
-if processed_voice_key in loaded_processed_voices.keys():
+if processed_voice_key is not None and loaded_processed_voices[processed_voice_key]:
bark_dir, speaker = loaded_processed_voices[processed_voice_key].values()
else:
if self.params['voice_path'] is not None:
@@ -568,7 +568,7 @@ class TTSManager:
file_path=tmp_in_wav,
**speaker_argument
)
-if processed_voice_key in loaded_processed_voices.keys():
+if processed_voice_key is not None and loaded_processed_voices[processed_voice_key]:
self.params['semitones'] = loaded_processed_voices[processed_voice_key]
else:
self.params['voice_path_gender'] = self._detect_gender(self.params['voice_path'])
@@ -630,7 +630,7 @@ class TTSManager:
text=self.params['sentence'],
file_path=tmp_in_wav
)
-if processed_voice_key in loaded_processed_voices.keys():
+if processed_voice_key is not None and loaded_processed_voices[processed_voice_key]:
self.params['semitones'] = loaded_processed_voices[processed_voice_key]
else:
self.params['voice_path_gender'] = self._detect_gender(self.params['voice_path'])
@@ -683,7 +683,7 @@ class TTSManager:
else:
speaker_argument = {}
language = self.session['language_iso1'] if self.session['language_iso1'] == 'en' else 'fr-fr' if self.session['language_iso1'] == 'fr' else 'pt-br' if self.session['language_iso1'] == 'pt' else 'en'
-if processed_voice_key in loaded_processed_voices.keys():
+if processed_voice_key is not None and loaded_processed_voices[processed_voice_key]:
speaker_argument = loaded_processed_voices[processed_voice_key]
else:
if self.params['voice_path'] is not None:

View File

@@ -45,8 +45,9 @@ dependencies = [
"translate",
"tqdm",
"unidic",
-"pymupdf4llm",
-"coqui-tts>=0.26.1",
+"pymupdf4llm",
+"torch",
+"coqui-tts",
"torchvggish"
]
readme = "README.md"

View File

@@ -27,5 +27,6 @@ translate
tqdm
unidic
pymupdf4llm
-coqui-tts>=0.26.1
+torch
+coqui-tts
torchvggish