audiblez/audiblez.py

#!/usr/bin/env python3
# audiblez - A program to convert e-books into audiobooks using
# Kokoro-82M model for high-quality text-to-speech synthesis.
# by Claudio Santini 2025 - https://claudio.uk

import argparse
import sys
import time
import shutil
import subprocess
import soundfile as sf
import ebooklib
import warnings
import re
from pathlib import Path
from string import Formatter
from bs4 import BeautifulSoup
from kokoro_onnx import config
from kokoro_onnx import Kokoro
from ebooklib import epub
from pydub import AudioSegment
from pick import pick
import onnxruntime as ort
from tempfile import NamedTemporaryFile

# File names of the Kokoro model and voices data. They are used as relative
# paths, so both files are looked up in the current working directory.
MODEL_FILE = 'kokoro-v0_19.onnx'
VOICES_FILE = 'voices.json'
# Override a kokoro_onnx setting at import time.
# NOTE(review): presumably this caps how many phonemes go into one inference
# call - confirm against the kokoro_onnx documentation.
config.MAX_PHONEME_LENGTH = 128


def _first_metadata(book, name, default=''):
    """Return the first Dublin Core `name` value of `book`, or `default` when the book has none."""
    entries = book.get_metadata('DC', name)
    return entries[0][0] if entries else default


def main(kokoro, file_path, lang, voice, pick_manually, speed, providers):
    """Read an EPUB aloud chapter by chapter and assemble the result into an audiobook.

    Each selected chapter is synthesised to `<book>_chapter_<n>.wav` in the current
    directory. Chapters whose WAV file already exists are not synthesised again, so
    an interrupted run can be resumed. When ffmpeg is on the PATH, a chapter index
    file and the final .m4b are created afterwards.

    Args:
        kokoro: TTS engine; must provide `create(text, voice=, speed=, lang=)`
            returning `(samples, sample_rate)` and a `sess.set_providers` method.
        file_path: Path to the .epub file.
        lang: Language code passed to the engine.
        voice: Voice name passed to the engine.
        pick_manually: If true, ask the user which documents to read instead of
            selecting chapters automatically.
        speed: Speech speed passed to the engine.
        providers: Optional list of ONNX Runtime provider names. The process
            exits with status 1 if any of them is not available.
    """
    # Set ONNX providers if specified
    if providers:
        available_providers = ort.get_available_providers()
        invalid_providers = [p for p in providers if p not in available_providers]
        if invalid_providers:
            print(f"Invalid ONNX providers: {', '.join(invalid_providers)}")
            print(f"Available providers: {', '.join(available_providers)}")
            sys.exit(1)
        kokoro.sess.set_providers(providers)
        print(f"Using ONNX providers: {', '.join(providers)}")

    # Build output names from the stem. Replacing '.epub' inside the name breaks for
    # 'book.EPUB' or extension-less files: the "chapter" name would equal the input file.
    stem = Path(file_path).stem
    # create_m4b() derives its own names from a '*.epub' name, so hand it a normalised one.
    filename = f'{stem}.epub'

    warnings.simplefilter("ignore")
    book = epub.read_epub(file_path)
    # Not every EPUB declares a title/creator; fall back instead of raising IndexError.
    title = _first_metadata(book, 'title', default=stem)
    creator = _first_metadata(book, 'creator')

    cover_maybe = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_COVER]
    cover_image = cover_maybe[0].get_content() if cover_maybe else b""
    if cover_maybe:
        print(f'Found cover image {cover_maybe[0].file_name} in {cover_maybe[0].media_type} format')

    intro = f'{title} by {creator}' if creator else title
    print(intro)
    print('Found Chapters:', [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT])
    if pick_manually:
        chapters = pick_chapters(book)
        print('Selected chapters:', [c.get_name() for c in chapters])
    else:
        chapters = find_chapters(book)
        print('Automatically selected chapters:', [c.get_name() for c in chapters])
    texts = extract_texts(chapters)

    has_ffmpeg = shutil.which('ffmpeg') is not None
    if not has_ffmpeg:
        print('\033[91m' + 'ffmpeg not found. Please install ffmpeg to create mp3 and m4b audiobook files.' + '\033[0m')

    total_chars, processed_chars = sum(map(len, texts)), 0
    print('Started at:', time.strftime('%H:%M:%S'))
    print(f'Total characters: {total_chars:,}')
    print('Total words:', len(' '.join(texts).split()))

    chapter_mp3_files = []  # WAV files, in reading order, that make up the audiobook
    durations = {}  # WAV file name -> length in seconds, for chapters synthesised in this run

    for i, text in enumerate(texts, start=1):
        chapter_filename = f'{stem}_chapter_{i}.wav'
        chapter_chars = len(text)
        if Path(chapter_filename).exists():
            print(f'File for chapter {i} already exists. Skipping')
            chapter_mp3_files.append(chapter_filename)
            # Count it as done so progress/ETA stay meaningful on resumed runs.
            processed_chars += chapter_chars
            continue
        if len(text.strip()) < 10:
            print(f'Skipping empty chapter {i}')
            processed_chars += chapter_chars
            continue
        print(f'Reading chapter {i} ({chapter_chars:,} characters)...')
        if i == 1:
            # The first chapter is prefixed with a spoken "<title> by <author>" introduction.
            text = intro + '.\n\n' + text
        start_time = time.time()
        samples, sample_rate = kokoro.create(text, voice=voice, speed=speed, lang=lang)
        sf.write(chapter_filename, samples, sample_rate)
        chapter_mp3_files.append(chapter_filename)
        durations[chapter_filename] = len(samples) / sample_rate
        delta_seconds = time.time() - start_time
        chars_per_sec = len(text) / delta_seconds
        # Use the chapter's own length (without the intro) so the sum can reach total_chars exactly.
        processed_chars += chapter_chars
        remaining_chars = total_chars - processed_chars
        remaining_time = remaining_chars / chars_per_sec
        print(f'Estimated time remaining: {strfdelta(remaining_time)}')
        print('Chapter written to', chapter_filename)
        print(f'Chapter {i} read in {delta_seconds:.2f} seconds ({chars_per_sec:.0f} characters per second)')
        progress = processed_chars * 100 // total_chars
        print('Progress:', f'{progress}%\n')

    if has_ffmpeg:
        create_index_file(title, creator, chapter_mp3_files, durations)
        create_m4b(chapter_mp3_files, filename, title, creator, cover_image)


def extract_texts(chapters):
    """Return one plain-text string per chapter, in the same order as `chapters`.

    The body markup of each chapter is parsed and the stripped text of every
    title, paragraph and h1-h4 element is emitted on its own line. Elements
    whose text is empty after stripping are left out.
    """
    content_tags = ['title', 'p', 'h1', 'h2', 'h3', 'h4']

    def chapter_to_text(chapter):
        # Parse the chapter body and keep only the non-empty text fragments.
        soup = BeautifulSoup(chapter.get_body_content(), features='lxml')
        fragments = (
            element.text.strip() if element.text else ""
            for element in soup.find_all(content_tags)
        )
        return ''.join(fragment + '\n' for fragment in fragments if fragment)

    return [chapter_to_text(chapter) for chapter in chapters]


def is_chapter(c):
    """Tell whether the item's name looks like a chapter file name.

    The name is compared case-insensitively. It matches when it contains the
    word 'chapter', or 'part', 'ch' or 'chap' directly followed by a digit.
    """
    lowered = c.get_name().lower()
    if 'chapter' in lowered:
        return True
    numbered_markers = (r'part\d{1,3}', r'ch\d{1,3}', r'chap\d{1,3}')
    return any(re.search(marker, lowered) for marker in numbered_markers)


def find_chapters(book, verbose=False):
    """Select the document items of `book` whose names look like chapters.

    If no document name matches, every document item is returned instead.
    With `verbose` set, the name and body size of each document are printed.
    """
    documents = [item for item in book.get_items() if item.get_type() == ebooklib.ITEM_DOCUMENT]
    chapters = [document for document in documents if is_chapter(document)]
    if verbose:
        for document in documents:
            print(f"'{document.get_name()}'" + ', #' + str(len(document.get_body_content())))
    if not chapters:
        print('Not easy to find the chapters, defaulting to all available documents.')
        chapters = list(documents)
    return chapters


def pick_chapters(book):
    """Let the user choose interactively which documents of `book` to read.

    All document item names are offered in a multi-select menu (at least one
    must be chosen); the items of the book carrying a chosen name are returned.
    """
    document_names = [item.get_name() for item in book.get_items() if item.get_type() == ebooklib.ITEM_DOCUMENT]
    picked = pick(
        document_names,
        'Select which chapters to read in the audiobook',
        multiselect=True,
        min_selection_count=1,
    )
    # Only the first element of each returned entry (the chosen name) is needed.
    wanted_names = [entry[0] for entry in picked]
    return [item for item in book.get_items() if item.get_name() in wanted_names]


def strfdelta(tdelta, fmt='{D:02}d {H:02}h {M:02}m {S:02}s'):
    """Format a duration given in seconds using the fields named in `fmt`.

    Supported fields are W (weeks), D (days), H (hours), M (minutes) and
    S (seconds). Only the fields that appear in `fmt` are computed, largest
    unit first, each one consuming its share of the remaining seconds. The
    duration is truncated to whole seconds before formatting.
    """
    seconds_left = int(tdelta)
    formatter = Formatter()
    requested = {field_name for _, field_name, _, _ in formatter.parse(fmt)}
    unit_sizes = (('W', 604800), ('D', 86400), ('H', 3600), ('M', 60), ('S', 1))
    parts = {}
    for unit, size in unit_sizes:
        if unit in requested:
            parts[unit], seconds_left = divmod(seconds_left, size)
    return formatter.format(fmt, **parts)


def create_m4b(chapter_files, filename, title, author, cover_image):
    """Merge the chapter WAV files into a single .m4b audiobook using ffmpeg.

    The chapters are first concatenated and encoded to an intermediate
    `<book>.tmp.mp4` (skipped if that file already exists). ffmpeg then remuxes
    it together with `chapters.txt` and, when given, the cover image into
    `<book>.m4b`. The intermediate file is removed afterwards.

    Args:
        chapter_files: WAV file names, in reading order.
        filename: Name of the source book (e.g. 'book.epub'); output names are
            derived from its stem.
        title: Book title, stored as the title of the cover stream.
        author: Author name, stored as the `artist` tag.
        cover_image: Raw bytes of the cover image; empty for no cover.
    """
    # Derive names from the stem rather than str.replace('.epub', ...): for a name
    # without a lower-case '.epub' the replace is a no-op, and the "temporary" file
    # unlinked below would then be the caller's input file.
    source = Path(filename)
    tmp_filename = str(source.with_name(f'{source.stem}.tmp.mp4'))
    final_filename = str(source.with_name(f'{source.stem}.m4b'))

    if not Path(tmp_filename).exists():
        combined_audio = AudioSegment.empty()
        for wav_file in chapter_files:
            combined_audio += AudioSegment.from_wav(wav_file)
        print('Converting to Mp4...')
        combined_audio.export(tmp_filename, format="mp4", codec="aac", bitrate="64k")
    print('Creating M4B file...')

    cover_path = None
    cover_image_args = []
    if cover_image:
        # Write and close the file before ffmpeg runs: this flushes the buffered
        # bytes to disk and lets ffmpeg open the file on platforms that refuse to
        # reopen a temporary file that is still held open. delete=False because
        # the file must outlive the `with`; it is removed in the `finally` below.
        with NamedTemporaryFile("wb", delete=False) as cover_image_file:
            cover_image_file.write(cover_image)
        cover_path = cover_image_file.name
        # Inputs are numbered in -i order: 0 = audio, 1 = chapters.txt, 2 = cover image.
        cover_image_args = ["-i", cover_path, "-map", "0:a", "-map", "2:v"]

    try:
        proc = subprocess.run([
            'ffmpeg',
            '-i', f'{tmp_filename}',
            '-i', 'chapters.txt',
            *cover_image_args,
            '-c:a', 'copy',
            '-c:v', 'copy',
            '-disposition:v', 'attached_pic',
            '-metadata:s:v', f'title={title}',
            '-metadata', f'artist={author}',
            '-c', 'copy',
            '-f', 'mp4',
            f'{final_filename}'
        ])
    finally:
        if cover_path is not None:
            Path(cover_path).unlink()
    Path(tmp_filename).unlink()
    if proc.returncode == 0:
        print(f'{final_filename} created. Enjoy your audiobook.')
        print('Feel free to delete the intermediary .wav chapter files, the .m4b is all you need.')


def probe_duration(file_name):
    """Return the duration of the media file `file_name` in seconds, as reported by ffprobe.

    Raises:
        subprocess.CalledProcessError: if ffprobe exits with a non-zero status.
        ValueError: if ffprobe's output cannot be parsed as a float.
    """
    command = [
        'ffprobe',
        '-i', file_name,
        '-show_entries', 'format=duration',
        '-v', 'quiet',
        '-of', 'default=noprint_wrappers=1:nokey=1',
    ]
    completed = subprocess.run(command, capture_output=True, text=True, check=True)
    duration_text = completed.stdout.strip()
    return float(duration_text)


def _escape_ffmetadata(value):
    """Backslash-escape the characters that are special in an FFMETADATA file (= ; # \\ and newline)."""
    return re.sub(r'([=;#\\\n])', r'\\\1', str(value))


def create_index_file(title, creator, chapter_mp3_files, durations):
    """Write `chapters.txt`, an FFMETADATA file with one chapter marker per audio file.

    Chapters are laid out back to back in the order of `chapter_mp3_files`,
    with millisecond timestamps, and are titled 'Chapter 0', 'Chapter 1', ...

    Args:
        title: Book title written to the global `title` tag.
        creator: Author written to the global `artist` tag.
        chapter_mp3_files: Chapter audio file names, in reading order.
        durations: Mapping of file name to length in seconds. Files missing
            from it are measured with probe_duration() and added to the mapping.
    """
    # FFMETADATA files are UTF-8; do not depend on the platform's default encoding.
    with open("chapters.txt", "w", encoding="utf-8") as f:
        # Unescaped special characters in a value would corrupt the file.
        f.write(f";FFMETADATA1\ntitle={_escape_ffmetadata(title)}\nartist={_escape_ffmetadata(creator)}\n\n")
        start = 0
        for i, c in enumerate(chapter_mp3_files):
            if c not in durations:
                durations[c] = probe_duration(c)
            end = start + int(durations[c] * 1000)
            f.write(f"[CHAPTER]\nTIMEBASE=1/1000\nSTART={start}\nEND={end}\ntitle=Chapter {i}\n\n")
            start = end


def cli_main():
    """Command-line entry point: check the model files, parse arguments and run main().

    Exits with status 1 when the model or voices file is missing from the
    current directory, or when the program is started without any argument
    (the help text is then printed to stderr).
    """
    model_files_present = Path(MODEL_FILE).exists() and Path(VOICES_FILE).exists()
    if not model_files_present:
        print('Error: kokoro-v0_19.onnx and voices.json must be in the current directory. Please download them with:')
        print('wget https://github.com/thewh1teagle/kokoro-onnx/releases/download/model-files/kokoro-v0_19.onnx')
        print('wget https://github.com/thewh1teagle/kokoro-onnx/releases/download/model-files/voices.json')
        sys.exit(1)

    # The engine is loaded before argument parsing because the list of voices
    # shown in the help text (and the default voice) comes from it.
    kokoro = Kokoro(MODEL_FILE, VOICES_FILE)
    voices = list(kokoro.get_voices())
    if 'af_sky' in voices:
        default_voice = 'af_sky'
    else:
        default_voice = voices[0]

    # Get available ONNX providers
    provider_names = ', '.join(ort.get_available_providers())
    providers_help = f"Available ONNX providers: {provider_names}"

    parser = argparse.ArgumentParser(
        epilog='example:\n' + '  audiblez book.epub -l en-us -v af_sky',
        formatter_class=argparse.RawDescriptionHelpFormatter,
    )
    parser.add_argument('epub_file_path', help='Path to the epub file')
    parser.add_argument('-l', '--lang', default='en-gb', help='Language code: en-gb, en-us, fr-fr, ja, ko, cmn')
    parser.add_argument('-v', '--voice', default=default_voice, help=f"Choose narrating voice: {', '.join(voices)}")
    parser.add_argument(
        '-p', '--pick',
        action='store_true',
        default=False,
        help='Interactively select which chapters to read in the audiobook',
    )
    parser.add_argument('-s', '--speed', type=float, default=1.0, help='Set speed from 0.5 to 2.0')
    parser.add_argument('--providers', nargs='+', metavar='PROVIDER', help=f"Specify ONNX providers. {providers_help}")

    if len(sys.argv) == 1:
        parser.print_help(sys.stderr)
        sys.exit(1)
    options = parser.parse_args()
    main(
        kokoro,
        options.epub_file_path,
        options.lang,
        options.voice,
        options.pick,
        options.speed,
        options.providers,
    )


# Run the command-line interface only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    cli_main()
m4b 2025-01-14 17:45:04 +01:00			`#!/usr/bin/env python3`
fix 2025-01-14 22:57:31 +01:00			`# audiblez - A program to convert e-books into audiobooks using`
			`# Kokoro-82M model for high-quality text-to-speech synthesis.`
			`# by Claudio Santini 2025 - https://claudio.uk`
init 2025-01-14 15:35:10 +01:00
			`import argparse`
m4b 2025-01-14 17:45:04 +01:00			`import sys`
init 2025-01-14 15:35:10 +01:00			`import time`
			`import shutil`
			`import subprocess`
			`import soundfile as sf`
			`import ebooklib`
			`import warnings`
fixed chapters 2025-01-15 09:31:50 +01:00			`import re`
init 2025-01-14 15:35:10 +01:00			`from pathlib import Path`
			`from string import Formatter`
			`from bs4 import BeautifulSoup`
Adds support for cuda accelerated computations 2025-01-15 23:36:52 +01:00			`from kokoro_onnx import config`
init 2025-01-14 15:35:10 +01:00			`from kokoro_onnx import Kokoro`
			`from ebooklib import epub`
m4b 2025-01-14 18:38:26 +01:00			`from pydub import AudioSegment`
manual pick 2025-01-15 19:12:48 +01:00			`from pick import pick`
Support for onnxruntime-gpu and documentation. 2025-01-16 20:01:16 -08:00			`import onnxruntime as ort`
Set the cover image 2025-01-22 22:17:02 +05:30			`from tempfile import NamedTemporaryFile`
init 2025-01-14 15:35:10 +01:00
fix 2025-01-23 21:59:20 +01:00			`MODEL_FILE = 'kokoro-v0_19.onnx'`
			`VOICES_FILE = 'voices.json'`
Adds support for cuda accelerated computations 2025-01-15 23:36:52 +01:00			`config.MAX_PHONEME_LENGTH = 128`
init 2025-01-14 15:35:10 +01:00
Support for onnxruntime-gpu and documentation. 2025-01-16 20:01:16 -08:00
			`def main(kokoro, file_path, lang, voice, pick_manually, speed, providers):`
			`# Set ONNX providers if specified`
			`if providers:`
			`available_providers = ort.get_available_providers()`
			`invalid_providers = [p for p in providers if p not in available_providers]`
			`if invalid_providers:`
			`print(f"Invalid ONNX providers: {', '.join(invalid_providers)}")`
			`print(f"Available providers: {', '.join(available_providers)}")`
			`sys.exit(1)`
			`kokoro.sess.set_providers(providers)`
			`print(f"Using ONNX providers: {', '.join(providers)}")`
m4b 2025-01-14 17:45:04 +01:00			`filename = Path(file_path).name`
cleanup 2025-01-23 21:44:26 +01:00			`warnings.simplefilter("ignore")`
			`book = epub.read_epub(file_path)`
init 2025-01-14 15:35:10 +01:00			`title = book.get_metadata('DC', 'title')[0][0]`
			`creator = book.get_metadata('DC', 'creator')[0][0]`
Set the cover image 2025-01-22 22:17:02 +05:30
			`cover_maybe = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_COVER]`
			`cover_image = cover_maybe[0].get_content() if cover_maybe else b""`
			`if cover_maybe:`
			`print(f'Found cover image {cover_maybe[0].file_name} in {cover_maybe[0].media_type} format')`

init 2025-01-14 15:35:10 +01:00			`intro = f'{title} by {creator}'`
			`print(intro)`
manual pick 2025-01-15 19:12:48 +01:00			`print('Found Chapters:', [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT])`
			`if pick_manually:`
			`chapters = pick_chapters(book)`
			`else:`
			`chapters = find_chapters(book)`
cleanup 2025-01-23 21:44:26 +01:00			`print('Automatically selected chapters:', [c.get_name() for c in chapters])`
init 2025-01-14 15:35:10 +01:00			`texts = extract_texts(chapters)`
Set the cover image 2025-01-22 22:17:02 +05:30
init 2025-01-14 15:35:10 +01:00			`has_ffmpeg = shutil.which('ffmpeg') is not None`
m4b 2025-01-14 17:45:04 +01:00			`if not has_ffmpeg:`
			`print('\033[91m' + 'ffmpeg not found. Please install ffmpeg to create mp3 and m4b audiobook files.' + '\033[0m')`
Set the cover image 2025-01-22 22:17:02 +05:30
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`total_chars, processed_chars = sum(map(len, texts)), 0`
m4b 2025-01-14 17:45:04 +01:00			`print('Started at:', time.strftime('%H:%M:%S'))`
			`print(f'Total characters: {total_chars:,}')`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`print('Total words:', len(' '.join(texts).split()))`
init 2025-01-14 15:35:10 +01:00
m4b 2025-01-14 18:38:26 +01:00			`chapter_mp3_files = []`
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`durations = {}`
cleanup 2025-01-23 21:44:26 +01:00
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`for i, text in enumerate(texts, start=1):`
m4b 2025-01-14 17:45:04 +01:00			`chapter_filename = filename.replace('.epub', f'_chapter_{i}.wav')`
m4b 2025-01-14 18:38:26 +01:00			`chapter_mp3_files.append(chapter_filename)`
cleanup 2025-01-14 18:41:15 +01:00			`if Path(chapter_filename).exists():`
init 2025-01-14 15:35:10 +01:00			`print(f'File for chapter {i} already exists. Skipping')`
			`continue`
fix 2025-01-23 21:59:20 +01:00			`if len(text.strip()) < 10:`
			`print(f'Skipping empty chapter {i}')`
			`chapter_mp3_files.remove(chapter_filename)`
			`continue`
init 2025-01-14 15:35:10 +01:00			`print(f'Reading chapter {i} ({len(text):,} characters)...')`
m4b 2025-01-14 17:45:04 +01:00			`if i == 1:`
			`text = intro + '.\n\n' + text`
init 2025-01-14 15:35:10 +01:00			`start_time = time.time()`
Add a speed argument 2025-01-15 22:05:49 +02:00			`samples, sample_rate = kokoro.create(text, voice=voice, speed=speed, lang=lang)`
init 2025-01-14 15:35:10 +01:00			`sf.write(f'{chapter_filename}', samples, sample_rate)`
cleanup 2025-01-23 21:44:26 +01:00			`durations[chapter_filename] = len(samples) / sample_rate`
init 2025-01-14 15:35:10 +01:00			`end_time = time.time()`
			`delta_seconds = end_time - start_time`
m4b 2025-01-14 17:45:04 +01:00			`chars_per_sec = len(text) / delta_seconds`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`processed_chars += len(text)`
			`remaining_chars = total_chars - processed_chars`
m4b 2025-01-14 17:45:04 +01:00			`remaining_time = remaining_chars / chars_per_sec`
init 2025-01-14 15:35:10 +01:00			`print(f'Estimated time remaining: {strfdelta(remaining_time)}')`
fix 2025-01-14 19:04:45 +01:00			`print('Chapter written to', chapter_filename)`
			`print(f'Chapter {i} read in {delta_seconds:.2f} seconds ({chars_per_sec:.0f} characters per second)')`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`progress = processed_chars * 100 // total_chars`
cleanup 2025-01-23 21:44:26 +01:00			`print('Progress:', f'{progress}%\n')`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30
m4b 2025-01-14 17:45:04 +01:00			`if has_ffmpeg:`
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`create_index_file(title, creator, chapter_mp3_files, durations)`
Set the cover image 2025-01-22 22:17:02 +05:30			`create_m4b(chapter_mp3_files, filename, title, creator, cover_image)`
init 2025-01-14 15:35:10 +01:00

			`def extract_texts(chapters):`
			`texts = []`
			`for chapter in chapters:`
			`xml = chapter.get_body_content()`
			`soup = BeautifulSoup(xml, features='lxml')`
			`chapter_text = ''`
			`html_content_tags = ['title', 'p', 'h1', 'h2', 'h3', 'h4']`
			`for child in soup.find_all(html_content_tags):`
			`inner_text = child.text.strip() if child.text else ""`
			`if inner_text:`
			`chapter_text += inner_text + '\n'`
			`texts.append(chapter_text)`
			`return texts`


fixed chapters 2025-01-15 09:31:50 +01:00			`def is_chapter(c):`
			`name = c.get_name().lower()`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`return bool(`
			`'chapter' in name.lower()`
			`or re.search(r'part\d{1,3}', name)`
			`or re.search(r'ch\d{1,3}', name)`
			`or re.search(r'chap\d{1,3}', name)`
			`)`
fixed chapters 2025-01-15 09:31:50 +01:00

manual pick 2025-01-15 19:12:48 +01:00			`def find_chapters(book, verbose=False):`
init 2025-01-14 15:35:10 +01:00			`chapters = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT and is_chapter(c)]`
			`if verbose:`
			`for item in book.get_items():`
			`if item.get_type() == ebooklib.ITEM_DOCUMENT:`
dracula fix 2025-01-15 11:00:59 +01:00			`print(f"'{item.get_name()}'" + ', #' + str(len(item.get_body_content())))`
			`# print(f'{item.get_name()}'.ljust(60), str(len(item.get_body_content())).ljust(15), 'X' if item in chapters else '-')`
			`if len(chapters) == 0:`
			`print('Not easy to find the chapters, defaulting to all available documents.')`
			`chapters = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT]`
init 2025-01-14 15:35:10 +01:00			`return chapters`


manual pick 2025-01-15 19:12:48 +01:00			`def pick_chapters(book):`
fix 2025-01-16 15:24:32 +01:00			`all_chapters_names = [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT]`
manual pick 2025-01-15 19:12:48 +01:00			`title = 'Select which chapters to read in the audiobook'`
			`selected_chapters_names = pick(all_chapters_names, title, multiselect=True, min_selection_count=1)`
			`selected_chapters_names = [c[0] for c in selected_chapters_names]`
			`selected_chapters = [c for c in book.get_items() if c.get_name() in selected_chapters_names]`
			`return selected_chapters`


init 2025-01-14 15:35:10 +01:00			`def strfdelta(tdelta, fmt='{D:02}d {H:02}h {M:02}m {S:02}s'):`
			`remainder = int(tdelta)`
			`f = Formatter()`
			`desired_fields = [field_tuple[1] for field_tuple in f.parse(fmt)]`
			`possible_fields = ('W', 'D', 'H', 'M', 'S')`
			`constants = {'W': 604800, 'D': 86400, 'H': 3600, 'M': 60, 'S': 1}`
			`values = {}`
			`for field in possible_fields:`
			`if field in desired_fields and field in constants:`
			`values[field], remainder = divmod(remainder, constants[field])`
			`return f.format(fmt, **values)`


Set the cover image 2025-01-22 22:17:02 +05:30			`def create_m4b(chapter_files, filename, title, author, cover_image):`
			`tmp_filename = filename.replace('.epub', '.tmp.mp4')`
m4b 2025-01-14 18:38:26 +01:00			`if not Path(tmp_filename).exists():`
			`combined_audio = AudioSegment.empty()`
Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`for wav_file in chapter_files:`
m4b 2025-01-14 18:38:26 +01:00			`audio = AudioSegment.from_wav(wav_file)`
			`combined_audio += audio`
cleanup 2025-01-14 18:41:15 +01:00			`print('Converting to Mp4...')`
m4b 2025-01-14 18:38:26 +01:00			`combined_audio.export(tmp_filename, format="mp4", codec="aac", bitrate="64k")`
			`final_filename = filename.replace('.epub', '.m4b')`
m4b 2025-01-14 17:45:04 +01:00			`print('Creating M4B file...')`
Set the cover image 2025-01-22 22:17:02 +05:30
			`if cover_image:`
			`cover_image_file = NamedTemporaryFile("wb")`
			`cover_image_file.write(cover_image)`
cleanup 2025-01-23 21:44:26 +01:00			`cover_image_args = ["-i", cover_image_file.name, "-map", "0:a", "-map", "1:v"]`
Set the cover image 2025-01-22 22:17:02 +05:30			`else:`
			`cover_image_args = []`

Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`proc = subprocess.run([`
cleanup 2025-01-23 21:44:26 +01:00			`'ffmpeg',`
			`'-i', f'{tmp_filename}',`
			`'-i', 'chapters.txt',`
			`# '-map', '0',`
			`# '-map_metadata', '1',`
			`*cover_image_args,`
			`'-c:a', 'copy',`
			`'-c:v', 'copy',`
Merge branch 'main' into feat/cover-image 2025-01-23 21:32:10 +01:00			`'-disposition:v', 'attached_pic',`
Set the cover image 2025-01-22 22:17:02 +05:30			`'-metadata:s:v', f'title={title}',`
			`'-metadata', f'artist={author}',`
cleanup 2025-01-23 21:44:26 +01:00			`'-c', 'copy',`
Merge branch 'main' into main 2025-01-23 21:25:25 +01:00			`'-f', 'mp4',`
Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`f'{final_filename}'`
			`])`
m4b 2025-01-14 18:38:26 +01:00			`Path(tmp_filename).unlink()`
			`if proc.returncode == 0:`
			`print(f'{final_filename} created. Enjoy your audiobook.')`
			`print('Feel free to delete the intermediary .wav chapter files, the .m4b is all you need.')`
init 2025-01-14 15:35:10 +01:00
cleanup 2025-01-23 21:44:26 +01:00
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`def probe_duration(file_name):`
			`args = ['ffprobe', '-i', file_name, '-show_entries', 'format=duration', '-v', 'quiet', '-of', 'default=noprint_wrappers=1:nokey=1']`
			`proc = subprocess.run(args, capture_output=True, text=True, check=True)`
			`return float(proc.stdout.strip())`

cleanup 2025-01-23 21:44:26 +01:00
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`def create_index_file(title, creator, chapter_mp3_files, durations):`
			`with open("chapters.txt", "w") as f:`
			`f.write(f";FFMETADATA1\ntitle={title}\nartist={creator}\n\n")`
			`start = 0`
			`i = 0`
			`for c in chapter_mp3_files:`
			`if c not in durations:`
			`durations[c] = probe_duration(c)`
			`end = start + (int)(durations[c] * 1000)`
			`f.write(f"[CHAPTER]\nTIMEBASE=1/1000\nSTART={start}\nEND={end}\ntitle=Chapter {i}\n\n")`
			`i += 1`
			`start = end`

init 2025-01-14 15:35:10 +01:00
fix 2025-01-15 00:06:05 +01:00			`def cli_main():`
fix 2025-01-23 21:59:20 +01:00			`if not Path(MODEL_FILE).exists() or not Path(VOICES_FILE).exists():`
fix 2025-01-14 23:22:06 +01:00			`print('Error: kokoro-v0_19.onnx and voices.json must be in the current directory. Please download them with:')`
			`print('wget https://github.com/thewh1teagle/kokoro-onnx/releases/download/model-files/kokoro-v0_19.onnx')`
			`print('wget https://github.com/thewh1teagle/kokoro-onnx/releases/download/model-files/voices.json')`
			`sys.exit(1)`
fix 2025-01-23 21:59:20 +01:00			`kokoro = Kokoro(MODEL_FILE, VOICES_FILE)`
init 2025-01-14 15:35:10 +01:00			`voices = list(kokoro.get_voices())`
			`voices_str = ', '.join(voices)`
			`epilog = 'example:\n' + \`
			`' audiblez book.epub -l en-us -v af_sky'`
m4b 2025-01-14 17:45:04 +01:00			`default_voice = 'af_sky' if 'af_sky' in voices else voices[0]`
Support for onnxruntime-gpu and documentation. 2025-01-16 20:01:16 -08:00
			`# Get available ONNX providers`
			`available_providers = ort.get_available_providers()`
			`providers_help = f"Available ONNX providers: {', '.join(available_providers)}"`

init 2025-01-14 15:35:10 +01:00			`parser = argparse.ArgumentParser(epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter)`
			`parser.add_argument('epub_file_path', help='Path to the epub file')`
			`parser.add_argument('-l', '--lang', default='en-gb', help='Language code: en-gb, en-us, fr-fr, ja, ko, cmn')`
m4b 2025-01-14 17:45:04 +01:00			`parser.add_argument('-v', '--voice', default=default_voice, help=f'Choose narrating voice: {voices_str}')`
fix 2025-01-16 15:25:04 +01:00			`parser.add_argument('-p', '--pick', default=False, help=f'Interactively select which chapters to read in the audiobook',`
manual pick 2025-01-15 19:12:48 +01:00			`action='store_true')`
merge 2025-01-16 15:20:51 +01:00			`parser.add_argument('-s', '--speed', default=1.0, help=f'Set speed from 0.5 to 2.0', type=float)`
Support for onnxruntime-gpu and documentation. 2025-01-16 20:01:16 -08:00			`parser.add_argument('--providers', nargs='+', metavar='PROVIDER', help=f"Specify ONNX providers. {providers_help}")`
cleanup 2025-01-23 21:44:26 +01:00
m4b 2025-01-14 17:45:04 +01:00			`if len(sys.argv) == 1:`
			`parser.print_help(sys.stderr)`
			`sys.exit(1)`
init 2025-01-14 15:35:10 +01:00			`args = parser.parse_args()`
Support for onnxruntime-gpu and documentation. 2025-01-16 20:01:16 -08:00			`main(kokoro, args.epub_file_path, args.lang, args.voice, args.pick, args.speed, args.providers)`
fix 2025-01-15 00:06:05 +01:00

			`if __name__ == '__main__':`
			`cli_main()`