encoding-scripts/MkvOpusEnc.py

#!/usr/bin/env python3

"""
Processes or downmixes an MKV file's audio tracks sequentially using a specific toolchain.
This script is cross-platform and optimized for correctness and clean output.

This script intelligently handles audio streams in an MKV file one by one.
- AAC/Opus audio is remuxed.
- Multi-channel audio (DTS, AC3, etc.) can be re-encoded or optionally downmixed to stereo.
- All other streams and metadata (title, language, delay) are preserved.
"""

import argparse
import json
import shutil
import subprocess
import sys
import re # Import the regular expression module
import tempfile
from datetime import datetime
from pathlib import Path

class Tee:
    """A file-like object that writes to multiple files and handles terminal-specific output."""
    def __init__(self, *files):
        self.files = files
        # Identify which file objects are interactive terminals
        self.terminals = [f for f in files if hasattr(f, 'isatty') and f.isatty()]

    def write(self, obj):
        # For regular file writes (like logs), replace carriage returns with newlines
        # to ensure each progress update is on a new line in the log file.
        log_obj = obj.replace('\r', '\n').replace('\x1B[K', '')

        for f in self.files:
            if f in self.terminals:
                f.write(obj) # Write to terminal as-is
            else:
                # For log files, write the modified object.
                f.write(log_obj)
            f.flush()

    def flush(self):
        for f in self.files:
            f.flush()

def check_tools():
    """Checks if all required command-line tools are in the system's PATH."""
    required_tools = ["ffmpeg", "ffprobe", "mkvmerge", "opusenc", "mediainfo"]
    print("--- Prerequisite Check ---")
    all_found = True
    for tool in required_tools:
        if not shutil.which(tool):
            print(f"Error: Required tool '{tool}' not found.", file=sys.stderr)
            all_found = False
    if not all_found:
        sys.exit("Please install the missing tools and ensure they are in your system's PATH.")
    print("All required tools found.")

def run_cmd(args, capture_output=False, check=True):
    """Helper function to run a command and return its output."""
    process = subprocess.run(args, capture_output=capture_output, text=True, encoding='utf-8', check=check)
    return process.stdout

def convert_audio_track(stream_index, channels, temp_dir, source_file, should_downmix, bitrate_info):
    """Extracts, normalizes, and encodes a single audio track to Opus."""
    temp_extracted = temp_dir / f"track_{stream_index}_extracted.flac" # This will be the input for loudnorm pass 1
    temp_normalized = temp_dir / f"track_{stream_index}_normalized.flac"
    final_opus = temp_dir / f"track_{stream_index}_final.opus"

    # Step 1: Extract audio, with conditional downmixing
    print("    - Extracting to FLAC...")
    ffmpeg_args = ["ffmpeg", "-v", "quiet", "-stats", "-y", "-i", str(source_file), "-map", f"0:{stream_index}"]

    final_channels = channels
    if should_downmix and channels >= 6:
        if channels == 6:  # 5.1
            print("      (Downmixing 5.1 to Stereo with dialogue boost)")
            ffmpeg_args.extend(["-af", "pan=stereo|c0=c2+0.30*c0+0.30*c4|c1=c2+0.30*c1+0.30*c5"])
            final_channels = 2
        elif channels == 8:  # 7.1
            print("      (Downmixing 7.1 to Stereo with dialogue boost)")
            ffmpeg_args.extend(["-af", "pan=stereo|c0=c2+0.30*c0+0.30*c4+0.30*c6|c1=c2+0.30*c1+0.30*c5+0.30*c7"])
            final_channels = 2
        else:
            print(f"      ({channels}-channel source, downmixing to stereo using default -ac 2)")
            ffmpeg_args.extend(["-ac", "2"])
            final_channels = 2
    else:
        print(f"      (Preserving {channels}-channel layout)")

    ffmpeg_args.extend(["-c:a", "flac", str(temp_extracted)])
    run_cmd(ffmpeg_args)

    # Step 2: Normalize the track with ffmpeg (loudnorm 2-pass)
    print("    - Normalizing Audio Track with ffmpeg (loudnorm 2-pass)...")
    # First pass: Analyze the audio to get loudnorm stats
    # The stats are printed to stderr, so we must use subprocess.run directly to capture it.
    print("      - Pass 1: Analyzing...")

    cmd = [
        "ffmpeg", "-v", "error", "-stats", "-i", str(temp_extracted),
        "-af", "loudnorm=I=-18:LRA=7:tp=-1:print_format=json", "-f", "null", "-"
    ]

    # Use Popen to capture stderr in real-time and print it, while also buffering for JSON parsing.
    process = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True, encoding='utf-8')

    # Read stderr and print progress updates. The Tee class now handles '\r' correctly.
    stderr_output = ""
    with process.stderr as pipe:
        for line in iter(pipe.readline, ''):
            stderr_output += line # Buffer the full output for parsing
            # Print the line to stdout, clearing the line and using a carriage return.
            # This will be handled by the Tee class.
            sys.stdout.write(line.strip() + '\x1B[K\r')
        # After the loop, read any remaining data (the JSON block)
        stderr_output += pipe.read()

    process.wait() # Wait for the process to terminate
    if process.returncode != 0:
        raise subprocess.CalledProcessError(process.returncode, cmd, output=process.stdout.read(), stderr="".join(stderr_buffer))

    # Find the start of the JSON block in stderr and parse it.
    # This is more robust than slicing the last N lines.
    # We find the start and end of the JSON block to avoid parsing extra data.
    json_start_index = stderr_output.find('{')
    if json_start_index == -1:
        raise ValueError("Could not find start of JSON block in ffmpeg output for loudnorm analysis.")

    brace_level = 0
    json_end_index = -1
    for i, char in enumerate(stderr_output[json_start_index:]):
        if char == '{':
            brace_level += 1
        elif char == '}':
            brace_level -= 1
            if brace_level == 0:
                json_end_index = json_start_index + i + 1
                break

    stats = json.loads(stderr_output[json_start_index:json_end_index])

    # Second pass: Apply the normalization using the stats from the first pass. A final newline is needed.
    # A print() is needed to move to the next line after the progress bar.
    print("\n      - Pass 2: Applying normalization...")
    run_cmd([
        "ffmpeg", "-v", "quiet", "-stats", "-y", "-i", str(temp_extracted), "-af",
        f"loudnorm=I=-18:LRA=7:tp=-1:measured_i={stats['input_i']}:measured_lra={stats['input_lra']}:measured_tp={stats['input_tp']}:measured_thresh={stats['input_thresh']}:offset={stats['target_offset']}",
        "-c:a", "flac", str(temp_normalized)
    ])

    # Step 3: Encode to Opus with the correct bitrate
    bitrate = "192k"  # Fallback

    if final_channels == 1:
        bitrate = "64k"
    elif final_channels == 2:
        bitrate = "128k"
    elif final_channels == 6:
        bitrate = "256k"
    elif final_channels == 8:
        bitrate = "384k"

    print(f"    - Encoding to Opus at {bitrate}...")
    print(f"      Source: {bitrate_info} -> Destination: Opus {bitrate} ({final_channels} channels)")
    run_cmd(["opusenc", "--vbr", "--bitrate", bitrate, str(temp_normalized), str(final_opus)])

    return final_opus, final_channels, bitrate

def main():
    """Main script logic."""
    parser = argparse.ArgumentParser(description="Batch processes MKV file audio tracks to Opus.")
    parser.add_argument("--downmix", action="store_true", help="If present, multi-channel audio will be downmixed to stereo.")
    args = parser.parse_args()

    check_tools()

    # Define directory paths but don't create them yet
    DIR_COMPLETED = Path("completed")
    DIR_ORIGINAL = Path("original")
    DIR_LOGS = Path("conv_logs")
    current_dir = Path(".")

    # Check if there are any MKV files to process
    files_to_process = sorted(
        f for f in current_dir.glob("*.mkv")
        if not f.name.startswith("temp-output-")
    )

    if not files_to_process:
        print("No MKV files found to process. Exiting.")
        return  # Exit without creating directories

    # Create directories only when we actually have files to process
    DIR_COMPLETED.mkdir(exist_ok=True)
    DIR_ORIGINAL.mkdir(exist_ok=True)
    DIR_LOGS.mkdir(exist_ok=True)

    for file_path in files_to_process:
        # Setup logging
        log_file_path = DIR_LOGS / f"{file_path.name}.log"
        log_file = open(log_file_path, 'w', encoding='utf-8')
        original_stdout = sys.stdout
        original_stderr = sys.stderr
        sys.stdout = Tee(original_stdout, log_file)
        sys.stderr = Tee(original_stderr, log_file)

        try:
            print("-" * shutil.get_terminal_size(fallback=(80, 24)).columns)
            print(f"Starting processing for: {file_path.name}")
            print(f"Log file: {log_file_path}")
            start_time = datetime.now()

            intermediate_output_file = current_dir / f"temp-output-{file_path.name}"
            temp_dir = Path(tempfile.mkdtemp(prefix="mkvopusenc_"))
            print(f"Temporary directory for audio created at: {temp_dir}")

            # 3. --- Get Media Information ---
            print(f"Analyzing file: {file_path}")
            ffprobe_info_json = run_cmd(["ffprobe", "-v", "quiet", "-print_format", "json", "-show_streams", "-show_format", str(file_path)], capture_output=True)
            ffprobe_info = json.loads(ffprobe_info_json)

            mkvmerge_info_json = run_cmd(["mkvmerge", "-J", str(file_path)], capture_output=True)
            mkv_info = json.loads(mkvmerge_info_json)

            mediainfo_json_str = run_cmd(["mediainfo", "--Output=JSON", "-f", str(file_path)], capture_output=True)
            media_info = json.loads(mediainfo_json_str)

            # 4. --- Prepare for Final mkvmerge Command ---
            processed_audio_files = []
            tids_of_reencoded_tracks = []

            # 5. --- Process Each Audio Stream ---
            audio_streams = [s for s in ffprobe_info.get("streams", []) if s.get("codec_type") == "audio"]

            # Check if the file has any audio streams
            if not audio_streams:
                print(f"Warning: No audio streams found in '{file_path.name}'. Skipping file.")
                continue

            mkv_tracks_list = mkv_info.get("tracks", [])
            mkv_audio_tracks = [t for t in mkv_tracks_list if t.get("type") == "audio"]
            media_tracks_data = media_info.get("media", {}).get("track", [])
            mediainfo_audio_tracks = {int(t.get("StreamOrder", -1)): t for t in media_tracks_data if t.get("@type") == "Audio"}

            print("\n=== Audio Track Analysis ===")
            for audio_stream_idx, stream in enumerate(audio_streams):
                stream_index = stream["index"]
                codec = stream.get("codec_name")
                channels = stream.get("channels", 2)
                language = stream.get("tags", {}).get("language", "und")

                track_id = -1
                mkv_track = {}
                if audio_stream_idx < len(mkv_audio_tracks):
                    mkv_track = mkv_audio_tracks[audio_stream_idx]
                    track_id = mkv_track.get("id", -1)

                if track_id == -1:
                    print(f"  -> Warning: Could not map ffprobe audio stream index {stream_index} to an mkvmerge track ID. Skipping this track.")
                    continue

                track_title = mkv_track.get("properties", {}).get("track_name", "")

                track_delay = 0
                audio_track_info = mediainfo_audio_tracks.get(stream_index)

                # Get bitrate information from mediainfo
                bitrate = "Unknown"
                if audio_track_info:
                    if "BitRate" in audio_track_info:
                        try:
                            br_value = int(audio_track_info["BitRate"])
                            bitrate = f"{int(br_value/1000)}k"
                        except (ValueError, TypeError):
                            pass
                    elif "BitRate_Nominal" in audio_track_info:
                        try:
                            br_value = int(audio_track_info["BitRate_Nominal"])
                            bitrate = f"{int(br_value/1000)}k"
                        except (ValueError, TypeError):
                            pass

                delay_raw = audio_track_info.get("Video_Delay") if audio_track_info else None
                if delay_raw is not None:
                    try:
                        delay_val = float(delay_raw)
                        # If the value is a float < 1, it's seconds, so convert to ms.
                        if delay_val < 1 and delay_val > -1:
                            track_delay = int(round(delay_val * 1000))
                        else:
                            track_delay = int(round(delay_val))
                    except Exception:
                        track_delay = 0

                track_info = f"Audio Stream #{stream_index} (TID: {track_id}, Codec: {codec}, Bitrate: {bitrate}, Channels: {channels})"
                if track_title:
                    track_info += f", Title: '{track_title}'"
                if language != "und":
                    track_info += f", Language: {language}"
                if track_delay != 0:
                    track_info += f", Delay: {track_delay}ms"

                print(f"\nProcessing {track_info}")

                if codec in {"aac", "opus"}:
                    print(f"  -> Action: Remuxing track (keeping original {codec.upper()} {bitrate})")
                    # This track will be kept from the original file, so we don't need to add it to a special list.
                else:
                    bitrate_info = f"{codec.upper()} {bitrate}"
                    print(f"  -> Action: Re-encoding codec '{codec}' to Opus")
                    opus_file, final_channels, final_bitrate = convert_audio_track(
                        stream_index, channels, temp_dir, file_path, args.downmix, bitrate_info
                    )
                    processed_audio_files.append({
                        "Path": opus_file,
                        "Language": language,
                        "Title": track_title,
                        "Delay": track_delay
                    })
                    tids_of_reencoded_tracks.append(str(track_id))

            # 6. --- Construct and Execute Final mkvmerge Command ---
            print("\n=== Final MKV Creation ===")
            print("Assembling final mkvmerge command...")
            mkvmerge_args = ["mkvmerge", "-o", str(intermediate_output_file)]

            # If no audio was re-encoded, we are just doing a full remux of the original file.
            if not processed_audio_files:
                print("  -> All audio tracks are in the desired format. Performing a full remux.")
                mkvmerge_args.append(str(file_path))
            else:
                # If we re-encoded audio, copy everything from the source EXCEPT the original audio tracks that we replaced.
                mkvmerge_args.extend(["--audio-tracks", "!" + ",".join(tids_of_reencoded_tracks)])
                mkvmerge_args.append(str(file_path))

                # Add the newly encoded Opus audio files.
                for file_info in processed_audio_files:
                    mkvmerge_args.extend(["--language", f"0:{file_info['Language']}"])
                    if file_info['Title']:
                        mkvmerge_args.extend(["--track-name", f"0:{file_info['Title']}"])
                    if file_info['Delay'] != 0:
                        mkvmerge_args.extend(["--sync", f"0:{file_info['Delay']}"])
                    mkvmerge_args.append(str(file_info["Path"]))

            print(f"Executing mkvmerge...")
            run_cmd(mkvmerge_args)
            print("MKV creation complete")

            # Move files to their final destinations
            print("\n=== File Management ===")
            print(f"Moving processed file to: {DIR_COMPLETED / file_path.name}")
            shutil.move(str(intermediate_output_file), DIR_COMPLETED / file_path.name)
            print(f"Moving original file to: {DIR_ORIGINAL / file_path.name}")
            shutil.move(str(file_path), DIR_ORIGINAL / file_path.name)

            # Display total runtime
            runtime = datetime.now() - start_time
            runtime_str = str(runtime).split('.')[0]  # Remove milliseconds
            print(f"\nTotal processing time: {runtime_str}")

        except Exception as e:
            print(f"\nAn error occurred while processing '{file_path.name}': {e}", file=sys.stderr)
            if intermediate_output_file.exists():
                intermediate_output_file.unlink()
        finally:
            # 7. --- Cleanup ---
            print("\n=== Cleanup ===")
            print("Cleaning up temporary files...")
            if temp_dir.exists():
                shutil.rmtree(temp_dir)
                print("Temporary directory removed.")

            # Restore stdout/stderr and close log file
            sys.stdout = original_stdout
            sys.stderr = original_stderr
            log_file.close()

if __name__ == "__main__":
    main()