MBook/assembler.py at master · hebbihebb/MBook · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
import os
import re
import shutil
from pydub import AudioSegment
import subprocess
from typing import List, Dict, Optional


def check_ffmpeg_available():
    """
    Check if ffmpeg is installed and available in PATH.

    Raises:
        RuntimeError: If ffmpeg is not found
    """
    if not shutil.which("ffmpeg"):
        raise RuntimeError(
            "ffmpeg is not installed or not in PATH.\n"
            "Please install ffmpeg from: https://ffmpeg.org/download.html\n"
            "On Ubuntu/Debian: sudo apt-get install ffmpeg\n"
            "On macOS: brew install ffmpeg\n"
            "On Windows: Download from https://ffmpeg.org/download.html"
        )


def sanitize_metadata(value: str) -> str:
    """
    Sanitizes metadata values to prevent command injection in ffmpeg calls.

    Removes or escapes characters that could be used for command injection:
    - Newlines, carriage returns, tabs
    - Shell metacharacters: ; | & $ ` \ " ' < >
    - Control characters

    Args:
        value: The metadata value to sanitize

    Returns:
        Sanitized metadata value safe for ffmpeg
    """
    if not isinstance(value, str):
        value = str(value)

    # Remove control characters (0x00-0x1f, 0x7f-0x9f) and shell metacharacters
    # Single regex pass for O(n) performance instead of O(n*m) loop
    value = re.sub(r'[\x00-\x1f\x7f-\x9f;|&$`\\"\'<>]', '', value)

    # Limit length to prevent extremely long metadata
    max_length = 500
    if len(value) > max_length:
        value = value[:max_length]

    return value.strip()


def stitch_audio(audio_chunks: List[str], output_path: str = "temp_book.wav") -> str:
    """
    Stitches audio chunks with exactly 400ms of silence between them.

    Args:
        audio_chunks: List of paths to audio files.
        output_path: Path for the output WAV file.

    Returns:
        Path to the stitched audio file.
    """
    combined = AudioSegment.empty()
    silence_400ms = AudioSegment.silent(duration=400)

    for i, chunk in enumerate(audio_chunks):
        if isinstance(chunk, str):
            segment = AudioSegment.from_file(chunk)
        else:
            segment = chunk

        combined += segment

        # Add silence between chunks, but not after the last one
        if i < len(audio_chunks) - 1:
            combined += silence_400ms

    combined.export(output_path, format="wav")
    return output_path


def stitch_audio_with_chapter_tracking(
    audio_chunks: List[str],
    chunk_to_chapter: List[int],
    chapter_titles: List[str],
    output_path: str = "temp_book.wav"
) -> tuple[str, List[Dict]]:
    """
    Stitches audio chunks and tracks chapter boundaries.

    Args:
        audio_chunks: List of paths to audio files.
        chunk_to_chapter: List mapping each chunk index to its chapter index.
        chapter_titles: List of chapter titles.
        output_path: Path for the output WAV file.

    Returns:
        Tuple of (output_path, chapters_info) where chapters_info is a list of
        dicts with 'title', 'start_ms', 'end_ms'.
    """
    combined = AudioSegment.empty()
    silence_400ms = AudioSegment.silent(duration=400)

    # Track chapter boundaries
    chapter_starts = {}  # chapter_index -> start_ms
    current_position_ms = 0

    for i, chunk_path in enumerate(audio_chunks):
        chapter_idx = chunk_to_chapter[i]

        # Record start of chapter if this is the first chunk of a new chapter
        if chapter_idx not in chapter_starts:
            chapter_starts[chapter_idx] = current_position_ms

        # Load and append audio
        segment = AudioSegment.from_file(chunk_path)
        combined += segment
        current_position_ms += len(segment)

        # Add silence between chunks, but not after the last one
        if i < len(audio_chunks) - 1:
            combined += silence_400ms
            current_position_ms += 400

    # Export the combined audio
    combined.export(output_path, format="wav")

    # Build chapter info with end times
    total_duration_ms = current_position_ms
    chapter_indices = sorted(chapter_starts.keys())

    chapters_info = []
    for i, chapter_idx in enumerate(chapter_indices):
        start_ms = chapter_starts[chapter_idx]

        # End time is start of next chapter, or total duration for last chapter
        if i + 1 < len(chapter_indices):
            end_ms = chapter_starts[chapter_indices[i + 1]]
        else:
            end_ms = total_duration_ms

        title = chapter_titles[chapter_idx] if chapter_idx < len(chapter_titles) else f"Chapter {chapter_idx + 1}"

        chapters_info.append({
            'title': title,
            'start_ms': start_ms,
            'end_ms': end_ms
        })

    return output_path, chapters_info


def generate_chapter_metadata(chapters: List[Dict], output_path: str = "chapters.txt") -> str:
    """
    Generate FFMETADATA file for chapter markers.

    Args:
        chapters: List of dicts with 'title', 'start_ms', 'end_ms'.
        output_path: Path for the metadata file.

    Returns:
        Path to the metadata file.
    """
    with open(output_path, 'w', encoding='utf-8') as f:
        f.write(";FFMETADATA1\n\n")

        for ch in chapters:
            f.write("[CHAPTER]\n")
            f.write("TIMEBASE=1/1000\n")
            f.write(f"START={ch['start_ms']}\n")
            f.write(f"END={ch['end_ms']}\n")
            # Escape special characters in title
            title = ch['title'].replace('=', '\\=').replace(';', '\\;').replace('#', '\\#').replace('\\', '\\\\')
            f.write(f"title={title}\n\n")

    return output_path


def export_m4b(
    wav_path: str,
    output_m4b_path: str,
    metadata: Optional[Dict] = None,
    cover_art_path: Optional[str] = None,
    chapters_file: Optional[str] = None
) -> str:
    """
    Converts WAV to M4B with metadata and chapter markers using ffmpeg.

    Args:
        wav_path: Path to input WAV file.
        output_m4b_path: Path for output M4B file.
        metadata: Dict with 'title', 'author'.
        cover_art_path: Optional path to cover image.
        chapters_file: Optional path to FFMETADATA chapters file.

    Returns:
        Path to the M4B file.
    """
    # Check ffmpeg availability before proceeding
    check_ffmpeg_available()

    cmd = ["ffmpeg", "-y"]

    # Input files
    cmd.extend(["-i", wav_path])

    if chapters_file and os.path.exists(chapters_file):
        cmd.extend(["-i", chapters_file])

    if cover_art_path and os.path.exists(cover_art_path):
        cmd.extend(["-i", cover_art_path])

    # Map streams
    cmd.extend(["-map", "0:a"])  # Audio from first input

    if cover_art_path and os.path.exists(cover_art_path):
        # Map cover art as attached picture
        cover_input_idx = 2 if chapters_file else 1
        cmd.extend(["-map", f"{cover_input_idx}:v"])
        cmd.extend(["-c:v", "copy"])
        cmd.extend(["-disposition:v:0", "attached_pic"])

    # Import chapter metadata
    if chapters_file and os.path.exists(chapters_file):
        cmd.extend(["-map_metadata", "1"])

    # Audio codec settings (standard audiobook settings)
    cmd.extend(["-c:a", "aac", "-b:a", "64k"])

    # Book metadata (sanitized to prevent command injection)
    if metadata:
        if "title" in metadata:
            safe_title = sanitize_metadata(metadata['title'])
            cmd.extend(["-metadata", f"title={safe_title}"])
        if "author" in metadata:
            safe_author = sanitize_metadata(metadata['author'])
            cmd.extend(["-metadata", f"artist={safe_author}"])
            cmd.extend(["-metadata", f"album_artist={safe_author}"])
        # Mark as audiobook
        cmd.extend(["-metadata", "genre=Audiobook"])

    cmd.append(output_m4b_path)

    print(f"Running command: {' '.join(cmd)}")
    subprocess.run(cmd, check=True)

    return output_m4b_path


def create_audiobookshelf_folder(
    output_dir: str,
    author: str,
    title: str,
    m4b_path: str,
    cover_image_bytes: Optional[bytes] = None,
    cover_extension: str = ".jpg"
) -> str:
    """
    Create Audiobookshelf-compatible folder structure.

    Structure: {output_dir}/{author}/{title}/{title}.m4b

    Args:
        output_dir: Base output directory.
        author: Author name.
        title: Book title.
        m4b_path: Path to the M4B file to move/copy.
        cover_image_bytes: Optional cover image data.
        cover_extension: Extension for cover image (e.g., '.jpg', '.png').

    Returns:
        Path to the final M4B file location.
    """
    import shutil

    # Sanitize names for filesystem
    def sanitize_name(name: str) -> str:
        # Remove/replace problematic characters
        invalid_chars = '<>:"/\\|?*'
        for char in invalid_chars:
            name = name.replace(char, '_')
        return name.strip()

    safe_author = sanitize_name(author)
    safe_title = sanitize_name(title)

    # Create folder structure
    book_folder = os.path.join(output_dir, safe_author, safe_title)
    os.makedirs(book_folder, exist_ok=True)

    # Move/copy M4B file
    final_m4b_path = os.path.join(book_folder, f"{safe_title}.m4b")
    if m4b_path != final_m4b_path:
        shutil.move(m4b_path, final_m4b_path)

    # Save cover image if provided
    if cover_image_bytes:
        cover_path = os.path.join(book_folder, f"cover{cover_extension}")
        with open(cover_path, 'wb') as f:
            f.write(cover_image_bytes)

    return final_m4b_path