audiblez/audiblez.py

#!/usr/bin/env python3
# audiblez - A program to convert e-books into audiobooks using
# Kokoro-82M model for high-quality text-to-speech synthesis.
# by Claudio Santini 2025 - https://claudio.uk
import argparse
import sys
import time
import shutil
import subprocess
import numpy as np
import soundfile
import ebooklib
import warnings
import re
import torch
from pathlib import Path
from string import Formatter
from bs4 import BeautifulSoup
from kokoro import KPipeline
from ebooklib import epub
from pydub import AudioSegment
from pick import pick
from tempfile import NamedTemporaryFile

from voices import voices, available_voices_str

# Sample rate (in Hz) passed to soundfile.write when saving each chapter's WAV file.
sample_rate = 24000


def main(pipeline, file_path, voice, pick_manually, speed):
    """Convert an epub into per-chapter WAV files and, if ffmpeg is found, an M4B audiobook.

    Output files are named after the epub's file name (without its directory),
    so they are created relative to the current working directory.

    Args:
        pipeline: Callable handed to gen_audio_segments to synthesize speech.
        file_path: Path to the epub file to read.
        voice: Voice name forwarded to the pipeline.
        pick_manually: When true, chapters are chosen interactively through
            pick_chapters; otherwise find_chapters selects them.
        speed: Speed value forwarded to the pipeline.
    """
    filename = Path(file_path).name
    warnings.simplefilter("ignore")
    book = epub.read_epub(file_path)
    meta_title = book.get_metadata('DC', 'title')
    title = meta_title[0][0] if meta_title else ''
    meta_creator = book.get_metadata('DC', 'creator')
    by_creator = 'by ' + meta_creator[0][0] if meta_creator else ''

    cover_maybe = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_COVER]
    cover_image = cover_maybe[0].get_content() if cover_maybe else b""
    if cover_maybe:
        print(f'Found cover image {cover_maybe[0].file_name} in {cover_maybe[0].media_type} format')

    intro = f'{title} {by_creator}'
    print(intro)
    print('Found Chapters:', [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT])
    if pick_manually:
        chapters = pick_chapters(book)
        # Do not claim the selection was automatic when the user made it.
        print('Manually selected chapters:', [c.get_name() for c in chapters])
    else:
        chapters = find_chapters(book)
        print('Automatically selected chapters:', [c.get_name() for c in chapters])
    texts = extract_texts(chapters)

    has_ffmpeg = shutil.which('ffmpeg') is not None
    if not has_ffmpeg:
        print('\033[91m' + 'ffmpeg not found. Please install ffmpeg to create mp3 and m4b audiobook files.' + '\033[0m')

    total_chars, processed_chars = sum(map(len, texts)), 0
    print('Started at:', time.strftime('%H:%M:%S'))
    print(f'Total characters: {total_chars:,}')
    print('Total words:', len(' '.join(texts).split()))
    chars_per_sec = 500 if torch.cuda.is_available() else 50
    print(f'Estimated time remaining (assuming {chars_per_sec} chars/sec): {strfdelta((total_chars - processed_chars) / chars_per_sec)}')

    # Only chapters that actually have a WAV file on disk end up in this list.
    chapter_wav_files = []
    for i, text in enumerate(texts, start=1):
        # total_chars was computed from the raw chapter texts, so progress must be
        # accounted with the raw length too (not the length after the intro is added).
        chapter_chars = len(text)
        chapter_filename = filename.replace('.epub', f'_chapter_{i}.wav')
        if Path(chapter_filename).exists():
            print(f'File for chapter {i} already exists. Skipping')
            chapter_wav_files.append(chapter_filename)
            # Skipped chapters still count as done, otherwise a resumed run
            # never reaches 100% and over-estimates the remaining time.
            processed_chars += chapter_chars
            continue
        if len(text.strip()) < 10:
            print(f'Skipping empty chapter {i}')
            processed_chars += chapter_chars
            continue
        print(f'Reading chapter {i} ({chapter_chars:,} characters)...')
        if i == 1:
            text = intro + '.\n\n' + text
        start_time = time.time()

        audio_segments = gen_audio_segments(pipeline, text, voice, speed)
        processed_chars += chapter_chars
        if not audio_segments:
            print(f'Warning: No audio generated for chapter {i}')
            continue

        final_audio = np.concatenate(audio_segments)
        soundfile.write(chapter_filename, final_audio, sample_rate)
        chapter_wav_files.append(chapter_filename)
        delta_seconds = time.time() - start_time
        # Throughput is measured on the text that was actually synthesized.
        chars_per_sec = len(text) / delta_seconds
        print(f'Estimated time remaining: {strfdelta((total_chars - processed_chars) / chars_per_sec)}')
        print('Chapter written to', chapter_filename)
        print(f'Chapter {i} read in {delta_seconds:.2f} seconds ({chars_per_sec:.0f} characters per second)')
        progress = processed_chars * 100 // total_chars
        print('Progress:', f'{progress}%\n')

    if has_ffmpeg:
        if chapter_wav_files:
            create_index_file(title, by_creator, chapter_wav_files)
            create_m4b(chapter_wav_files, filename, cover_image)
        else:
            # Nothing to concatenate: avoid asking ffmpeg to package an empty audiobook.
            print('No chapter audio files available. Skipping audiobook creation.')


def gen_audio_segments(pipeline, text, voice, speed):
    """Run the pipeline over the text and collect the audio part of every result.

    The pipeline is called with the text plus ``voice``, ``speed`` and a
    ``split_pattern`` of one or more newlines. Each item it yields is unpacked
    as a 3-tuple; only the third element (the audio) is kept.

    Returns:
        A list with one audio entry per yielded item (empty if nothing was yielded).
    """
    results = pipeline(text, voice=voice, speed=speed, split_pattern=r'\n+')
    return [audio for _graphemes, _phonemes, audio in results]


def extract_texts(chapters):
    """Extract the readable text of each chapter as one newline-separated string.

    Every chapter's body content is parsed with BeautifulSoup (lxml feature) and
    the stripped text of each title, paragraph, h1-h4 heading and list-item
    element is collected, one per line. Elements with no text are ignored.

    Returns:
        A list of strings, one per chapter, in the same order as ``chapters``.
    """
    content_tags = ['title', 'p', 'h1', 'h2', 'h3', 'h4', 'li']
    texts = []
    for chapter in chapters:
        soup = BeautifulSoup(chapter.get_body_content(), features='lxml')
        lines = []
        for node in soup.find_all(content_tags):
            stripped = node.text.strip() if node.text else ""
            if stripped:
                lines.append(stripped + '\n')
        texts.append(''.join(lines))
    return texts


def is_chapter(c):
    """Tell whether an item's name looks like a chapter file name.

    The name (from ``c.get_name()``) is lower-cased and accepted when it
    contains ``chapter``, or ``part``, ``ch`` or ``chap`` immediately followed
    by a digit.
    """
    lowered = c.get_name().lower()
    if 'chapter' in lowered:
        return True
    numbered_markers = (r'part\d{1,3}', r'ch\d{1,3}', r'chap\d{1,3}')
    return any(re.search(marker, lowered) for marker in numbered_markers)


def find_chapters(book, verbose=False):
    """Select the document items of the book whose names look like chapters.

    When ``verbose`` is true, the name and body-content length of every
    document item is printed. If no document passes ``is_chapter``, all
    document items are returned instead.
    """
    documents = [item for item in book.get_items() if item.get_type() == ebooklib.ITEM_DOCUMENT]
    chapters = [doc for doc in documents if is_chapter(doc)]
    if verbose:
        for doc in documents:
            print(f"'{doc.get_name()}'" + ', #' + str(len(doc.get_body_content())))
    if chapters:
        return chapters
    print('Not easy to find the chapters, defaulting to all available documents.')
    return documents


def pick_chapters(book):
    """Let the user interactively choose which documents of the book to read.

    The names of all document items are offered in a multi-select prompt (at
    least one must be chosen); the book items whose names were chosen are
    returned in book order.
    """
    document_names = [
        item.get_name()
        for item in book.get_items()
        if item.get_type() == ebooklib.ITEM_DOCUMENT
    ]
    prompt = 'Select which chapters to read in the audiobook'
    picked = pick(document_names, prompt, multiselect=True, min_selection_count=1)
    # Each picked entry is indexed at 0 to obtain the chosen name.
    chosen_names = [entry[0] for entry in picked]
    return [item for item in book.get_items() if item.get_name() in chosen_names]


def strfdelta(tdelta, fmt='{D:02}d {H:02}h {M:02}m {S:02}s'):
    """Format a duration given in seconds using W/D/H/M/S fields.

    Args:
        tdelta: Duration in seconds; it is truncated to an int.
        fmt: Format string whose fields may be W (weeks), D (days), H (hours),
            M (minutes) and S (seconds). Only the units named in ``fmt`` take
            part in the breakdown, from largest to smallest.

    Returns:
        The formatted string.
    """
    formatter = Formatter()
    wanted = {field_name for _, field_name, _, _ in formatter.parse(fmt)}
    units = (('W', 604800), ('D', 86400), ('H', 3600), ('M', 60), ('S', 1))
    seconds_left = int(tdelta)
    parts = {}
    for unit, unit_seconds in units:
        if unit not in wanted:
            continue
        parts[unit], seconds_left = divmod(seconds_left, unit_seconds)
    return formatter.format(fmt, **parts)


def create_m4b(chapter_files, filename, cover_image):
    """Concatenate the chapter WAV files and package them as an .m4b with ffmpeg.

    The chapters are first merged into a temporary AAC ``.tmp.mp4`` file (reused
    if it already exists), then ffmpeg combines it with the metadata from
    ``chapters.txt`` and, when provided, the cover image. The temporary mp4 is
    deleted afterwards regardless of ffmpeg's exit status.

    Args:
        chapter_files: Paths of the chapter WAV files, in playback order.
        filename: Name of the source epub; output names are derived from it by
            replacing ``.epub``.
        cover_image: Raw cover image bytes, or an empty value for no cover.
    """
    tmp_filename = filename.replace('.epub', '.tmp.mp4')
    if not Path(tmp_filename).exists():
        combined_audio = AudioSegment.empty()
        for wav_file in chapter_files:
            combined_audio += AudioSegment.from_wav(wav_file)
        print('Converting to Mp4...')
        combined_audio.export(tmp_filename, format="mp4", codec="aac", bitrate="64k")
    final_filename = filename.replace('.epub', '.m4b')
    print('Creating M4B file...')

    cover_image_path = None
    cover_image_args = []
    try:
        if cover_image:
            # ffmpeg opens the cover by name, so the bytes must be fully written
            # and the handle closed before it runs: an unflushed file may look
            # empty, and a still-open temp file cannot be reopened on Windows.
            # delete=False keeps the file on disk after closing; it is removed
            # explicitly in the finally block.
            with NamedTemporaryFile("wb", delete=False) as cover_image_file:
                cover_image_path = cover_image_file.name
                cover_image_file.write(cover_image)
            cover_image_args = ["-i", cover_image_path, "-map", "0:a", "-map", "2:v"]

        proc = subprocess.run([
            'ffmpeg',
            '-i', f'{tmp_filename}',
            '-i', 'chapters.txt',
            *cover_image_args,
            '-map', '0',
            '-map_metadata', '1',
            '-c:a', 'copy',
            '-c:v', 'copy',
            '-disposition:v', 'attached_pic',
            '-c', 'copy',
            '-f', 'mp4',
            f'{final_filename}'
        ])
    finally:
        if cover_image_path is not None:
            Path(cover_image_path).unlink()
    Path(tmp_filename).unlink()
    if proc.returncode == 0:
        print(f'{final_filename} created. Enjoy your audiobook.')
        print('Feel free to delete the intermediary .wav chapter files, the .m4b is all you need.')


def probe_duration(file_name):
    """Return the duration reported by ffprobe for the given media file, as a float.

    Raises:
        subprocess.CalledProcessError: If ffprobe exits with a non-zero status.
    """
    command = [
        'ffprobe',
        '-i', file_name,
        '-show_entries', 'format=duration',
        '-v', 'quiet',
        '-of', 'default=noprint_wrappers=1:nokey=1',
    ]
    result = subprocess.run(command, capture_output=True, text=True, check=True)
    return float(result.stdout.strip())


# Characters that must be backslash-escaped inside ffmpeg metadata keys and values.
_FFMETADATA_ESCAPES = str.maketrans({
    '\\': '\\\\',
    '=': '\\=',
    ';': '\\;',
    '#': '\\#',
    '\n': '\\\n',
})


def _escape_ffmetadata(value):
    """Backslash-escape the characters that are special in an ffmpeg metadata file."""
    return str(value).translate(_FFMETADATA_ESCAPES)


def create_index_file(title, creator, chapter_mp3_files):
    """Write ``chapters.txt``, an ffmpeg metadata file with title, artist and chapter marks.

    Each chapter entry spans the duration of the corresponding audio file (as
    reported by probe_duration), in milliseconds, and chapters are laid out
    back to back starting at 0. Chapters are titled ``Chapter 0``,
    ``Chapter 1``, ... in list order.

    Args:
        title: Book title written to the ``title`` tag.
        creator: Text written to the ``artist`` tag.
        chapter_mp3_files: Paths of the chapter audio files, in playback order.
    """
    # The metadata format is UTF-8 text; do not depend on the platform's default encoding.
    with open("chapters.txt", "w", encoding="utf-8") as f:
        # Unescaped '=', ';', '#', '\' or newlines in the values would corrupt the file.
        f.write(f";FFMETADATA1\ntitle={_escape_ffmetadata(title)}\nartist={_escape_ffmetadata(creator)}\n\n")
        start = 0
        for i, c in enumerate(chapter_mp3_files):
            duration = probe_duration(c)
            end = start + int(duration * 1000)
            f.write(f"[CHAPTER]\nTIMEBASE=1/1000\nSTART={start}\nEND={end}\ntitle=Chapter {i}\n\n")
            start = end


def cli_main():
    """Parse the command line, optionally enable CUDA, and run the conversion.

    Prints the help text to stderr and exits with status 1 when invoked without
    any argument. The pipeline's language code is the first character of the
    chosen voice name.
    """
    voices_str = ', '.join(voices)
    # The example must only use options that the parser below defines; there is
    # no -l option, so showing one would make the documented example fail.
    epilog = ('example:\n' +
              '  audiblez book.epub -v af_sky\n\n' +
              'available voices:\n' +
              available_voices_str)
    default_voice = 'af_sky'
    parser = argparse.ArgumentParser(epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter)
    parser.add_argument('epub_file_path', help='Path to the epub file')
    parser.add_argument('-v', '--voice', default=default_voice, help=f'Choose narrating voice: {voices_str}')
    parser.add_argument('-p', '--pick', default=False, help='Interactively select which chapters to read in the audiobook', action='store_true')
    parser.add_argument('-s', '--speed', default=1.0, help='Set speed from 0.5 to 2.0', type=float)
    parser.add_argument('-c', '--cuda', default=False, help='Use GPU via Cuda in Torch if available', action='store_true')

    if len(sys.argv) == 1:
        parser.print_help(sys.stderr)
        sys.exit(1)
    args = parser.parse_args()

    if args.cuda:
        if torch.cuda.is_available():
            print('CUDA GPU available')
            torch.set_default_device('cuda')
        else:
            print('CUDA GPU not available. Defaulting to CPU')

    pipeline = KPipeline(lang_code=args.voice[0])  # a for american or b for british
    main(pipeline, args.epub_file_path, args.voice, args.pick, args.speed)


# Run the command-line interface only when this file is executed as a script.
if __name__ == '__main__':
    cli_main()
m4b 2025-01-14 17:45:04 +01:00			`#!/usr/bin/env python3`
fix 2025-01-14 22:57:31 +01:00			`# audiblez - A program to convert e-books into audiobooks using`
			`# Kokoro-82M model for high-quality text-to-speech synthesis.`
			`# by Claudio Santini 2025 - https://claudio.uk`
init 2025-01-14 15:35:10 +01:00			`import argparse`
m4b 2025-01-14 17:45:04 +01:00			`import sys`
init 2025-01-14 15:35:10 +01:00			`import time`
			`import shutil`
			`import subprocess`
fix: improve audio processing by handling large text chunks and ensuring valid audio generation 2025-01-31 00:41:52 +02:00			`import numpy as np`
test fix 2025-01-29 11:02:50 +01:00			`import soundfile`
init 2025-01-14 15:35:10 +01:00			`import ebooklib`
			`import warnings`
fixed chapters 2025-01-15 09:31:50 +01:00			`import re`
cuda 2025-01-29 14:45:06 +01:00			`import torch`
init 2025-01-14 15:35:10 +01:00			`from pathlib import Path`
			`from string import Formatter`
			`from bs4 import BeautifulSoup`
torch 2025-01-29 10:50:30 +01:00			`from kokoro import KPipeline`
init 2025-01-14 15:35:10 +01:00			`from ebooklib import epub`
m4b 2025-01-14 18:38:26 +01:00			`from pydub import AudioSegment`
manual pick 2025-01-15 19:12:48 +01:00			`from pick import pick`
Set the cover image 2025-01-22 22:17:02 +05:30			`from tempfile import NamedTemporaryFile`
init 2025-01-14 15:35:10 +01:00
voices, chunking etc 2025-01-31 12:13:55 +01:00			`from voices import voices, available_voices_str`

torch 2025-01-29 10:50:30 +01:00			`sample_rate = 24000`


			`def main(pipeline, file_path, voice, pick_manually, speed):`
m4b 2025-01-14 17:45:04 +01:00			`filename = Path(file_path).name`
cleanup 2025-01-23 21:44:26 +01:00			`warnings.simplefilter("ignore")`
			`book = epub.read_epub(file_path)`
fix 2025-01-29 15:09:29 +01:00			`meta_title = book.get_metadata('DC', 'title')`
			`title = meta_title[0][0] if meta_title else ''`
			`meta_creator = book.get_metadata('DC', 'creator')`
fix espeak-ng 2025-01-30 16:04:58 +01:00			`by_creator = 'by ' + meta_creator[0][0] if meta_creator else ''`
Set the cover image 2025-01-22 22:17:02 +05:30
			`cover_maybe = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_COVER]`
			`cover_image = cover_maybe[0].get_content() if cover_maybe else b""`
			`if cover_maybe:`
			`print(f'Found cover image {cover_maybe[0].file_name} in {cover_maybe[0].media_type} format')`

fix espeak-ng 2025-01-30 16:04:58 +01:00			`intro = f'{title} {by_creator}'`
init 2025-01-14 15:35:10 +01:00			`print(intro)`
manual pick 2025-01-15 19:12:48 +01:00			`print('Found Chapters:', [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT])`
			`if pick_manually:`
			`chapters = pick_chapters(book)`
			`else:`
			`chapters = find_chapters(book)`
cleanup 2025-01-23 21:44:26 +01:00			`print('Automatically selected chapters:', [c.get_name() for c in chapters])`
init 2025-01-14 15:35:10 +01:00			`texts = extract_texts(chapters)`
Set the cover image 2025-01-22 22:17:02 +05:30
init 2025-01-14 15:35:10 +01:00			`has_ffmpeg = shutil.which('ffmpeg') is not None`
m4b 2025-01-14 17:45:04 +01:00			`if not has_ffmpeg:`
			`print('\033[91m' + 'ffmpeg not found. Please install ffmpeg to create mp3 and m4b audiobook files.' + '\033[0m')`
Set the cover image 2025-01-22 22:17:02 +05:30
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`total_chars, processed_chars = sum(map(len, texts)), 0`
m4b 2025-01-14 17:45:04 +01:00			`print('Started at:', time.strftime('%H:%M:%S'))`
			`print(f'Total characters: {total_chars:,}')`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`print('Total words:', len(' '.join(texts).split()))`
fix: improve audio processing by handling large text chunks and ensuring valid audio generation 2025-01-31 00:41:52 +02:00			`chars_per_sec = 500 if torch.cuda.is_available() else 50`
fix 2025-01-29 16:16:05 +01:00			`print(f'Estimated time remaining (assuming {chars_per_sec} chars/sec): {strfdelta((total_chars - processed_chars) / chars_per_sec)}')`
init 2025-01-14 15:35:10 +01:00
m4b 2025-01-14 18:38:26 +01:00			`chapter_mp3_files = []`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`for i, text in enumerate(texts, start=1):`
m4b 2025-01-14 17:45:04 +01:00			`chapter_filename = filename.replace('.epub', f'_chapter_{i}.wav')`
m4b 2025-01-14 18:38:26 +01:00			`chapter_mp3_files.append(chapter_filename)`
cleanup 2025-01-14 18:41:15 +01:00			`if Path(chapter_filename).exists():`
init 2025-01-14 15:35:10 +01:00			`print(f'File for chapter {i} already exists. Skipping')`
			`continue`
fix 2025-01-23 21:59:20 +01:00			`if len(text.strip()) < 10:`
			`print(f'Skipping empty chapter {i}')`
			`chapter_mp3_files.remove(chapter_filename)`
			`continue`
init 2025-01-14 15:35:10 +01:00			`print(f'Reading chapter {i} ({len(text):,} characters)...')`
m4b 2025-01-14 17:45:04 +01:00			`if i == 1:`
			`text = intro + '.\n\n' + text`
init 2025-01-14 15:35:10 +01:00			`start_time = time.time()`
voices, chunking etc 2025-01-31 12:13:55 +01:00
			`audio_segments = gen_audio_segments(pipeline, text, voice, speed)`
			`if audio_segments:`
fix: improve audio processing by handling large text chunks and ensuring valid audio generation 2025-01-31 00:41:52 +02:00			`final_audio = np.concatenate(audio_segments)`
			`soundfile.write(chapter_filename, final_audio, sample_rate)`
			`end_time = time.time()`
			`delta_seconds = end_time - start_time`
			`chars_per_sec = len(text) / delta_seconds`
			`processed_chars += len(text)`
			`print(f'Estimated time remaining: {strfdelta((total_chars - processed_chars) / chars_per_sec)}')`
			`print('Chapter written to', chapter_filename)`
			`print(f'Chapter {i} read in {delta_seconds:.2f} seconds ({chars_per_sec:.0f} characters per second)')`
			`progress = processed_chars * 100 // total_chars`
			`print('Progress:', f'{progress}%\n')`
			`else:`
			`print(f'Warning: No audio generated for chapter {i}')`
			`chapter_mp3_files.remove(chapter_filename)`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30
m4b 2025-01-14 17:45:04 +01:00			`if has_ffmpeg:`
fix espeak-ng 2025-01-30 16:04:58 +01:00			`create_index_file(title, by_creator, chapter_mp3_files)`
broken 2025-01-30 09:24:21 +01:00			`create_m4b(chapter_mp3_files, filename, cover_image)`
init 2025-01-14 15:35:10 +01:00
voices, chunking etc 2025-01-31 12:13:55 +01:00
			`def gen_audio_segments(pipeline, text, voice, speed):`
			`audio_segments = []`
			`for gs, ps, audio in pipeline(text, voice=voice, speed=speed, split_pattern=r'\n+'):`
			`audio_segments.append(audio)`
			`return audio_segments`


init 2025-01-14 15:35:10 +01:00			`def extract_texts(chapters):`
			`texts = []`
			`for chapter in chapters:`
			`xml = chapter.get_body_content()`
			`soup = BeautifulSoup(xml, features='lxml')`
			`chapter_text = ''`
li 2025-01-27 14:37:31 +01:00			`html_content_tags = ['title', 'p', 'h1', 'h2', 'h3', 'h4', 'li']`
init 2025-01-14 15:35:10 +01:00			`for child in soup.find_all(html_content_tags):`
			`inner_text = child.text.strip() if child.text else ""`
			`if inner_text:`
			`chapter_text += inner_text + '\n'`
			`texts.append(chapter_text)`
			`return texts`


fixed chapters 2025-01-15 09:31:50 +01:00			`def is_chapter(c):`
			`name = c.get_name().lower()`
Minor refactor and simplify is_chapter function 2025-01-22 22:29:56 +05:30			`return bool(`
			`'chapter' in name.lower()`
			`or re.search(r'part\d{1,3}', name)`
			`or re.search(r'ch\d{1,3}', name)`
			`or re.search(r'chap\d{1,3}', name)`
			`)`
fixed chapters 2025-01-15 09:31:50 +01:00

manual pick 2025-01-15 19:12:48 +01:00			`def find_chapters(book, verbose=False):`
init 2025-01-14 15:35:10 +01:00			`chapters = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT and is_chapter(c)]`
			`if verbose:`
			`for item in book.get_items():`
			`if item.get_type() == ebooklib.ITEM_DOCUMENT:`
dracula fix 2025-01-15 11:00:59 +01:00			`print(f"'{item.get_name()}'" + ', #' + str(len(item.get_body_content())))`
			`if len(chapters) == 0:`
			`print('Not easy to find the chapters, defaulting to all available documents.')`
			`chapters = [c for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT]`
init 2025-01-14 15:35:10 +01:00			`return chapters`


manual pick 2025-01-15 19:12:48 +01:00			`def pick_chapters(book):`
fix 2025-01-16 15:24:32 +01:00			`all_chapters_names = [c.get_name() for c in book.get_items() if c.get_type() == ebooklib.ITEM_DOCUMENT]`
manual pick 2025-01-15 19:12:48 +01:00			`title = 'Select which chapters to read in the audiobook'`
			`selected_chapters_names = pick(all_chapters_names, title, multiselect=True, min_selection_count=1)`
			`selected_chapters_names = [c[0] for c in selected_chapters_names]`
			`selected_chapters = [c for c in book.get_items() if c.get_name() in selected_chapters_names]`
			`return selected_chapters`


init 2025-01-14 15:35:10 +01:00			`def strfdelta(tdelta, fmt='{D:02}d {H:02}h {M:02}m {S:02}s'):`
			`remainder = int(tdelta)`
			`f = Formatter()`
			`desired_fields = [field_tuple[1] for field_tuple in f.parse(fmt)]`
			`possible_fields = ('W', 'D', 'H', 'M', 'S')`
			`constants = {'W': 604800, 'D': 86400, 'H': 3600, 'M': 60, 'S': 1}`
			`values = {}`
			`for field in possible_fields:`
			`if field in desired_fields and field in constants:`
			`values[field], remainder = divmod(remainder, constants[field])`
			`return f.format(fmt, **values)`


broken 2025-01-30 09:24:21 +01:00			`def create_m4b(chapter_files, filename, cover_image):`
Set the cover image 2025-01-22 22:17:02 +05:30			`tmp_filename = filename.replace('.epub', '.tmp.mp4')`
m4b 2025-01-14 18:38:26 +01:00			`if not Path(tmp_filename).exists():`
			`combined_audio = AudioSegment.empty()`
Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`for wav_file in chapter_files:`
m4b 2025-01-14 18:38:26 +01:00			`audio = AudioSegment.from_wav(wav_file)`
			`combined_audio += audio`
cleanup 2025-01-14 18:41:15 +01:00			`print('Converting to Mp4...')`
m4b 2025-01-14 18:38:26 +01:00			`combined_audio.export(tmp_filename, format="mp4", codec="aac", bitrate="64k")`
			`final_filename = filename.replace('.epub', '.m4b')`
m4b 2025-01-14 17:45:04 +01:00			`print('Creating M4B file...')`
Set the cover image 2025-01-22 22:17:02 +05:30
			`if cover_image:`
			`cover_image_file = NamedTemporaryFile("wb")`
			`cover_image_file.write(cover_image)`
chapter markings and cover fix 2025-01-23 22:30:04 +01:00			`cover_image_args = ["-i", cover_image_file.name, "-map", "0:a", "-map", "2:v"]`
Set the cover image 2025-01-22 22:17:02 +05:30			`else:`
			`cover_image_args = []`

Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`proc = subprocess.run([`
cleanup 2025-01-23 21:44:26 +01:00			`'ffmpeg',`
			`'-i', f'{tmp_filename}',`
			`'-i', 'chapters.txt',`
chapter markings and cover fix 2025-01-23 22:30:04 +01:00			`*cover_image_args,`
fix 2025-01-23 22:14:50 +01:00			`'-map', '0',`
			`'-map_metadata', '1',`
cleanup 2025-01-23 21:44:26 +01:00			`'-c:a', 'copy',`
			`'-c:v', 'copy',`
Merge branch 'main' into feat/cover-image 2025-01-23 21:32:10 +01:00			`'-disposition:v', 'attached_pic',`
cleanup 2025-01-23 21:44:26 +01:00			`'-c', 'copy',`
Merge branch 'main' into main 2025-01-23 21:25:25 +01:00			`'-f', 'mp4',`
Add title and author metadata to .m4b file 2025-01-15 22:29:10 +01:00			`f'{final_filename}'`
			`])`
m4b 2025-01-14 18:38:26 +01:00			`Path(tmp_filename).unlink()`
			`if proc.returncode == 0:`
			`print(f'{final_filename} created. Enjoy your audiobook.')`
			`print('Feel free to delete the intermediary .wav chapter files, the .m4b is all you need.')`
init 2025-01-14 15:35:10 +01:00
cleanup 2025-01-23 21:44:26 +01:00
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`def probe_duration(file_name):`
			`args = ['ffprobe', '-i', file_name, '-show_entries', 'format=duration', '-v', 'quiet', '-of', 'default=noprint_wrappers=1:nokey=1']`
			`proc = subprocess.run(args, capture_output=True, text=True, check=True)`
			`return float(proc.stdout.strip())`

cleanup 2025-01-23 21:44:26 +01:00
broken 2025-01-30 09:24:21 +01:00			`def create_index_file(title, creator, chapter_mp3_files):`
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`with open("chapters.txt", "w") as f:`
			`f.write(f";FFMETADATA1\ntitle={title}\nartist={creator}\n\n")`
			`start = 0`
			`i = 0`
			`for c in chapter_mp3_files:`
broken 2025-01-30 09:24:21 +01:00			`duration = probe_duration(c)`
			`end = start + (int)(duration * 1000)`
Adds generation of chapter markings in the audiobook 2025-01-16 07:52:13 +01:00			`f.write(f"[CHAPTER]\nTIMEBASE=1/1000\nSTART={start}\nEND={end}\ntitle=Chapter {i}\n\n")`
			`i += 1`
			`start = end`

init 2025-01-14 15:35:10 +01:00
fix 2025-01-15 00:06:05 +01:00			`def cli_main():`
init 2025-01-14 15:35:10 +01:00			`voices_str = ', '.join(voices)`
voices, chunking etc 2025-01-31 12:13:55 +01:00			`epilog = ('example:\n' +`
			`' audiblez book.epub -l en-us -v af_sky\n\n' +`
			`'available voices:\n' +`
			`available_voices_str)`
			`default_voice = 'af_sky'`
init 2025-01-14 15:35:10 +01:00			`parser = argparse.ArgumentParser(epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter)`
			`parser.add_argument('epub_file_path', help='Path to the epub file')`
m4b 2025-01-14 17:45:04 +01:00			`parser.add_argument('-v', '--voice', default=default_voice, help=f'Choose narrating voice: {voices_str}')`
torch 2025-01-29 10:50:30 +01:00			`parser.add_argument('-p', '--pick', default=False, help=f'Interactively select which chapters to read in the audiobook', action='store_true')`
merge 2025-01-16 15:20:51 +01:00			`parser.add_argument('-s', '--speed', default=1.0, help=f'Set speed from 0.5 to 2.0', type=float)`
cuda 2025-01-31 12:27:11 +01:00			`parser.add_argument('-c', '--cuda', default=False, help=f'Use GPU via Cuda in Torch if available', action='store_true')`
cleanup 2025-01-23 21:44:26 +01:00
m4b 2025-01-14 17:45:04 +01:00			`if len(sys.argv) == 1:`
			`parser.print_help(sys.stderr)`
			`sys.exit(1)`
init 2025-01-14 15:35:10 +01:00			`args = parser.parse_args()`
cuda 2025-01-29 14:45:06 +01:00
broken 2025-01-30 09:24:21 +01:00			`if args.cuda:`
			`if torch.cuda.is_available():`
			`print('CUDA GPU available')`
			`torch.set_default_device('cuda')`
			`else:`
			`print('CUDA GPU not available. Defaulting to CPU')`
cuda 2025-01-29 14:45:06 +01:00
torch 2025-01-29 10:50:30 +01:00			`pipeline = KPipeline(lang_code=args.voice[0]) # a for american or b for british`
			`main(pipeline, args.epub_file_path, args.voice, args.pick, args.speed)`
fix 2025-01-15 00:06:05 +01:00

			`if __name__ == '__main__':`
			`cli_main()`