mirror of
https://github.com/DrewThomasson/ebook2audiobook.git
synced 2026-01-10 14:28:15 -05:00
...
This commit is contained in:
@@ -13,11 +13,12 @@ class Bark(TTSUtils, TTSRegistry, name='bark'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
@@ -13,11 +13,12 @@ class Fairseq(TTSUtils, TTSRegistry, name='fairseq'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {"semitones":{}}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
@@ -13,11 +13,12 @@ class Tacotron2(TTSUtils, TTSRegistry, name='tacotron'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {"semitones":{}}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
@@ -13,11 +13,12 @@ class Vits(TTSUtils, TTSRegistry, name='vits'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {"semitones":{}}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
@@ -13,11 +13,12 @@ class XTTSv2(TTSUtils, TTSRegistry, name='xtts'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {"latent_embedding":{}}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
@@ -13,12 +13,12 @@ class YourTTS(TTSUtils, TTSRegistry, name='yourtts'):
|
||||
self.pth_voice_file = None
|
||||
self.sentences_total_time = 0.0
|
||||
self.sentence_idx = 1
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
self.models = load_engine_presets(self.session['tts_engine'])
|
||||
self.params = {}
|
||||
self.params['samplerate'] = self.models[self.session['fine_tuned']]['samplerate']
|
||||
self.vtt_path = os.path.join(self.session['process_dir'],Path(self.session['final_name']).stem+'.vtt')
|
||||
self.resampler_cache = {}
|
||||
self.audio_segments = []
|
||||
using_gpu = self.session['device'] != devices['CPU']['proc']
|
||||
enough_vram = self.session['free_vram_gb'] > 4.0
|
||||
seed = 123456
|
||||
|
||||
Reference in New Issue
Block a user