mirror of
https://github.com/DrewThomasson/ebook2audiobook.git
synced 2026-04-21 03:00:19 -04:00
200 lines
8.8 KiB
Python
200 lines
8.8 KiB
Python
import os, tempfile, sys, re
|
|
|
|
debug_mode = False
|
|
|
|
DEVICE_SYSTEM = sys.platform
|
|
|
|
systems = {
|
|
"LINUX": "linux",
|
|
"MACOS": "darwin",
|
|
"WINDOWS": "win32"
|
|
}
|
|
|
|
cli_options = [
|
|
'--script_mode', '--docker_mode', '--session', '--share', '--headless',
|
|
'--ebook', '--ebooks_dir', '--text', '--language', '--voice', '--device', '--tts_engine',
|
|
'--custom_model', '--fine_tuned', '--output_format', '--output_channel',
|
|
'--temperature', '--length_penalty', '--num_beams', '--repetition_penalty',
|
|
'--top_k', '--top_p', '--speed', '--enable_text_splitting', '--text_temp',
|
|
'--waveform_temp', '--output_dir', '--version', '--docker_device', '--workflow', '--help'
|
|
]
|
|
|
|
workflow_id = 'ba800d22-ee51-11ef-ac34-d4ae52cfd9ce'
|
|
fernet_key = '0TkxI0iP0jmhT0vJ-AUpM2U4SAX3urVtrx1q8lwTynI='
|
|
fernet_data = b'gAAAAABptJuHZS_rMQRTmqzy-i5UFTh6HqcbklSV6oZsRpZXa7uSEveAMv1daIFzzeeWZW0wDV-frFlzk_gJPc5tr_YVKW-Eg8evw9Wll1rWrvIAfT0YQywaUe188qP1dg-GOJDM7Ul1'
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Version and runtime config
|
|
# ---------------------------------------------------------------------
|
|
prog_version = (lambda: open('VERSION.txt').read().strip())()
|
|
|
|
NATIVE = 'native'
|
|
FULL_DOCKER = 'full_docker'
|
|
BUILD_DOCKER = 'build_docker'
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Python environment references
|
|
# ---------------------------------------------------------------------
|
|
min_python_version = (3,10)
|
|
max_python_version = (3,12)
|
|
python_env_dir = os.path.abspath(os.path.join('.','python_env'))
|
|
requirements_file = os.path.abspath(os.path.join('.','requirements.txt'))
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Hardware mappings
|
|
# ---------------------------------------------------------------------
|
|
devices = {
|
|
"CPU": {"proc": "cpu", "found": True},
|
|
"CUDA": {"proc": "cuda", "found": False},
|
|
"MPS": {"proc": "mps", "found": False},
|
|
"ROCM": {"proc": "rocm", "found": False},
|
|
"XPU": {"proc": "xpu", "found": False},
|
|
"JETSON": {"proc": "jetson", "found": False},
|
|
}
|
|
|
|
default_device = devices['CPU']['proc']
|
|
|
|
default_gpu_wiki = '<a href="https://github.com/DrewThomasson/ebook2audiobook/wiki/GPU-ISSUES">GPU howto wiki</a>'
|
|
|
|
default_py_major = sys.version_info.major
|
|
default_py_minor = sys.version_info.minor
|
|
|
|
default_pytorch_url = 'https://download.pytorch.org/whl'
|
|
default_jetson_url = 'https://www.e-blokos.com/whl/jetson' # TODO: find a permanent website where to upload the jetpack torch
|
|
|
|
torch_matrix = {
|
|
# CPU
|
|
"cpu": {"url": None, "base": ((lambda m:m.group(1) if m else '')(re.search(r'(?m)^\s*torch\s*==\s*([0-9]+\.[0-9]+\.[0-9]+)',open(requirements_file).read())))},
|
|
# CUDA
|
|
"cu118": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
"cu121": {"url": default_pytorch_url, "base": "2.5.1"},
|
|
"cu124": {"url": default_pytorch_url, "base": "2.6.0"},
|
|
"cu126": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
"cu128": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
# ROCm
|
|
"rocm5.7": {"url": default_pytorch_url, "base": "2.3.1"},
|
|
"rocm6.0": {"url": default_pytorch_url, "base": "2.4.1"},
|
|
"rocm6.1": {"url": default_pytorch_url, "base": "2.6.0"},
|
|
"rocm6.2": {"url": default_pytorch_url, "base": "2.5.1"},
|
|
"rocm6.2.4": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
"rocm6.3": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
# MPS
|
|
"mps": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
# XPU
|
|
"xpu": {"url": default_pytorch_url, "base": "2.7.1"},
|
|
# JETSON
|
|
"jetson51": {"url": default_jetson_url, "base": "2.4.1"},
|
|
"jetson60": {"url": default_jetson_url, "base": "2.4.0"},
|
|
"jetson61": {"url": default_jetson_url, "base": "2.5.0"}
|
|
}
|
|
|
|
cuda_version_range = {"min": (11,8), "max": (12,8)}
|
|
rocm_version_range = {"min": (5,7), "max": (6,3)}
|
|
mps_version_range = {"min": (0,0), "max": (0,0)}
|
|
xpu_version_range = {"min": (0,0), "max": (0,0)}
|
|
jetson_version_range = {"min": (5,1), "max": (6,1)}
|
|
|
|
############### SETTINGS BELOW CAN BE MODIFIED ###############
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Global paths
|
|
# ---------------------------------------------------------------------
|
|
root_dir = os.path.dirname(os.path.abspath(__file__))
|
|
tmp_dir = os.path.abspath('tmp')
|
|
run_dir = os.path.abspath('run')
|
|
gradio_cache_dir = os.path.normpath(os.path.join(run_dir, 'gradio'))
|
|
models_dir = os.path.abspath('models')
|
|
ebooks_dir = os.path.abspath('ebooks')
|
|
voices_dir = os.path.abspath('voices')
|
|
tts_dir = os.path.join(models_dir, 'tts')
|
|
components_dir = os.path.abspath('components')
|
|
tempfile.tempdir = run_dir
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Environment setup
|
|
# ---------------------------------------------------------------------
|
|
os.environ['PYTHONUTF8'] = '1'
|
|
os.environ['PYTHONIOENCODING'] = 'utf-8'
|
|
os.environ['COQUI_TOS_AGREED'] = '1'
|
|
os.environ['PYTHONIOENCODING'] = 'utf-8'
|
|
os.environ['CALIBRE_NO_NATIVE_FILEDIALOGS'] = '1'
|
|
os.environ['CALIBRE_TEMP_DIR'] = run_dir
|
|
os.environ['CALIBRE_CACHE_DIRECTORY'] = run_dir
|
|
os.environ['CALIBRE_CONFIG_DIRECTORY'] = run_dir
|
|
os.environ['TMPDIR'] = run_dir
|
|
os.environ['GRADIO_DEBUG'] = '0'
|
|
os.environ['DO_NOT_TRACK'] = 'True'
|
|
os.environ['HUGGINGFACE_HUB_CACHE'] = tts_dir
|
|
os.environ['HF_HOME'] = tts_dir
|
|
os.environ['HF_DATASETS_CACHE'] = tts_dir
|
|
os.environ['HF_HUB_DISABLE_SYMLINKS_WARNING'] = '1'
|
|
os.environ['BARK_CACHE_DIR'] = tts_dir
|
|
os.environ['TTS_CACHE'] = tts_dir
|
|
os.environ['TORCH_HOME'] = tts_dir
|
|
os.environ['TTS_HOME'] = models_dir
|
|
os.environ['XDG_CACHE_HOME'] = models_dir
|
|
os.environ['MPLCONFIGDIR'] = f'{models_dir}/matplotlib'
|
|
os.environ['TESSDATA_PREFIX'] = f'{models_dir}/tessdata'
|
|
os.environ['STANZA_RESOURCES_DIR'] = os.path.join(models_dir, 'stanza')
|
|
os.environ['ARGOS_TRANSLATE_PACKAGE_PATH'] = os.path.join(models_dir, 'argostranslate')
|
|
os.environ['TORCH_FORCE_NO_WEIGHTS_ONLY_LOAD'] = '1'
|
|
os.environ['PYTORCH_ENABLE_MPS_FALLBACK'] = '1'
|
|
os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'expandable_segments:True'
|
|
os.environ['CUDA_MODULE_LOADING'] = 'LAZY'
|
|
os.environ['CUDA_DEVICE_ORDER'] = 'PCI_BUS_ID'
|
|
os.environ['CUDA_CACHE_MAXSIZE'] = '2147483648'
|
|
os.environ['SUNO_OFFLOAD_CPU'] = 'False'
|
|
os.environ['SUNO_USE_SMALL_MODELS'] = 'False'
|
|
if DEVICE_SYSTEM == systems['WINDOWS']:
|
|
os.environ['ESPEAK_DATA_PATH'] = os.path.expandvars(r"%USERPROFILE%\scoop\apps\espeak-ng\current\espeak-ng-data")
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Global settings
|
|
# ---------------------------------------------------------------------
|
|
max_upload_size = '6GB' # MB or GB
|
|
tmp_expire = 60 # days
|
|
max_ebook_textarea_length = 1024 # chars
|
|
|
|
# ---------------------------------------------------------------------
|
|
# Interface configuration
|
|
# ---------------------------------------------------------------------
|
|
interface_host = '0.0.0.0'
|
|
interface_port = 7860
|
|
interface_shared_tmp_expire = 3 # in days
|
|
interface_concurrency_limit = 1 # or None for unlimited multiple parallele user conversion
|
|
|
|
interface_component_options = {
|
|
"gr_tab_xtts_params": True,
|
|
"gr_tab_bark_params": True,
|
|
"gr_group_voice_file": True,
|
|
"gr_group_custom_model": True
|
|
}
|
|
|
|
# ---------------------------------------------------------------------
|
|
# UI directories
|
|
# ---------------------------------------------------------------------
|
|
audiobooks_gradio_dir = os.path.abspath(os.path.join('audiobooks','gui','gradio'))
|
|
audiobooks_host_dir = os.path.abspath(os.path.join('audiobooks','gui','host'))
|
|
audiobooks_cli_dir = os.path.abspath(os.path.join('audiobooks','cli'))
|
|
|
|
# ---------------------------------------------------------------------
|
|
# files and audio supported formats
|
|
# ---------------------------------------------------------------------
|
|
ebook_formats = [
|
|
".epub", ".mobi", ".azw3", ".fb2", ".lrf", ".rb", ".snb", ".tcr", ".pdf",
|
|
".txt", ".rtf", ".doc", ".docx", ".html", ".odt", ".azw", ".tiff", ".tif",
|
|
".png", ".jpg", ".jpeg", ".bmp", ".pptx"
|
|
]
|
|
voice_formats = [
|
|
".mp4", ".m4b", ".m4a", ".mp3", ".wav", ".aac", ".flac", ".alac", ".ogg",
|
|
".aiff", ".aif", ".wma", ".dsd", ".opus", ".pcmu", ".pcma", ".gsm"
|
|
]
|
|
output_formats = [
|
|
"aac", "flac", "mp3", "m4b", "m4a", "mp4", "mov", "ogg", "wav", "webm"
|
|
]
|
|
default_audio_proc_samplerate = 24000
|
|
default_audio_proc_format = 'flac' # or 'mp3', 'aac', 'm4a', 'm4b', 'amr', '3gp', 'alac'. 'wav' format is ok but limited to process files < 4GB
|
|
default_output_format = 'm4b'
|
|
default_output_channel = 'mono' # mono or stereo
|
|
default_output_split = False
|
|
default_output_split_hours = '6' # if the final ouput esceed outpout_split_hours * 2 hours the final file will be splitted by outpout_split_hours + the end if any. |