test/execute.py

#!/usr/bin/env python3
"""
Execute a pre-computed plan.

Takes a plan file (S-expression) and executes primitive operations,
storing artifacts by their content hash.

Usage:
    analyze.py recipe.sexp > analysis.sexp
    plan.py recipe.sexp --analysis analysis.sexp --sexp > plan.sexp
    execute.py plan.sexp --analysis analysis.sexp
"""

import json
import shutil
import subprocess
import sys
import tempfile
import importlib.util
from pathlib import Path
from typing import List

# Add artdag to path
sys.path.insert(0, str(Path(__file__).parent.parent / "artdag"))

from artdag.sexp import parse
from artdag.sexp.parser import Symbol, Keyword


def clean_nil_symbols(obj):
    """Recursively convert Symbol('nil') to None and filter out None values from dicts."""
    if isinstance(obj, Symbol):
        if obj.name == 'nil':
            return None
        return obj
    elif isinstance(obj, dict):
        result = {}
        for k, v in obj.items():
            cleaned = clean_nil_symbols(v)
            # Skip None values (they were nil)
            if cleaned is not None:
                result[k] = cleaned
        return result
    elif isinstance(obj, list):
        return [clean_nil_symbols(v) for v in obj]
    return obj


def parse_analysis_sexp(content: str) -> dict:
    """Parse analysis S-expression into dict."""
    sexp = parse(content)
    if isinstance(sexp, list) and len(sexp) == 1:
        sexp = sexp[0]

    if not isinstance(sexp, list) or not sexp:
        raise ValueError("Invalid analysis S-expression")

    # Should be (analysis (name ...) (name ...) ...)
    if not isinstance(sexp[0], Symbol) or sexp[0].name != "analysis":
        raise ValueError("Expected (analysis ...) S-expression")

    result = {}
    for item in sexp[1:]:
        if isinstance(item, list) and item and isinstance(item[0], Symbol):
            name = item[0].name
            data = {}

            i = 1
            while i < len(item):
                if isinstance(item[i], Keyword):
                    key = item[i].name.replace("-", "_")
                    i += 1
                    if i < len(item):
                        data[key] = item[i]
                        i += 1
                else:
                    i += 1

            result[name] = data

    return result


def sexp_to_plan(sexp) -> dict:
    """Convert a parsed S-expression plan to a dict."""
    if not isinstance(sexp, list) or not sexp:
        raise ValueError("Invalid plan S-expression")

    # Skip 'plan' symbol and name
    plan = {
        "steps": [],
        "analysis": {},
    }

    i = 0
    if isinstance(sexp[0], Symbol) and sexp[0].name == "plan":
        i = 1
        if i < len(sexp) and isinstance(sexp[i], str):
            plan["recipe_id"] = sexp[i]
            i += 1

    # Parse keywords and steps
    while i < len(sexp):
        item = sexp[i]

        if isinstance(item, Keyword):
            key = item.name.replace("-", "_")
            i += 1
            if i < len(sexp):
                value = sexp[i]
                if key == "encoding" and isinstance(value, list):
                    # Parse encoding dict from sexp
                    plan["encoding"] = sexp_to_dict(value)
                elif key == "output":
                    # Map :output to output_step_id
                    plan["output_step_id"] = value
                elif key == "id":
                    # Map :id to plan_id
                    plan["plan_id"] = value
                elif key == "recipe":
                    # Map :recipe to recipe_id
                    plan["recipe_id"] = value
                else:
                    plan[key] = value
                i += 1
        elif isinstance(item, list) and item and isinstance(item[0], Symbol):
            if item[0].name == "step":
                # Parse step
                step = parse_step_sexp(item)
                plan["steps"].append(step)
            elif item[0].name == "analysis":
                # Parse analysis data
                plan["analysis"] = parse_analysis_sexp(item)
            i += 1
        else:
            i += 1

    return plan


def parse_analysis_sexp(sexp) -> dict:
    """Parse analysis S-expression: (analysis (bass :times [...] :values [...]) ...)"""
    analysis = {}
    for item in sexp[1:]:  # Skip 'analysis' symbol
        if isinstance(item, list) and item and isinstance(item[0], Symbol):
            name = item[0].name
            data = {}
            j = 1
            while j < len(item):
                if isinstance(item[j], Keyword):
                    key = item[j].name
                    j += 1
                    if j < len(item):
                        data[key] = item[j]
                        j += 1
                else:
                    j += 1
            analysis[name] = data
    return analysis


def parse_bind_sexp(sexp) -> dict:
    """Parse a bind S-expression: (bind analysis-ref :range [min max] :offset 60 :transform sqrt)"""
    if not isinstance(sexp, list) or len(sexp) < 2:
        return None
    if not isinstance(sexp[0], Symbol) or sexp[0].name != "bind":
        return None

    bind = {
        "_bind": sexp[1] if isinstance(sexp[1], str) else sexp[1].name if isinstance(sexp[1], Symbol) else str(sexp[1]),
        "range_min": 0.0,
        "range_max": 1.0,
        "transform": None,
        "offset": 0.0,
    }

    i = 2
    while i < len(sexp):
        if isinstance(sexp[i], Keyword):
            kw = sexp[i].name
            if kw == "range":
                i += 1
                if i < len(sexp) and isinstance(sexp[i], list) and len(sexp[i]) >= 2:
                    bind["range_min"] = float(sexp[i][0])
                    bind["range_max"] = float(sexp[i][1])
            elif kw == "offset":
                i += 1
                if i < len(sexp):
                    bind["offset"] = float(sexp[i])
            elif kw == "transform":
                i += 1
                if i < len(sexp):
                    t = sexp[i]
                    if isinstance(t, Symbol):
                        bind["transform"] = t.name
                    elif isinstance(t, str):
                        bind["transform"] = t
        i += 1

    return bind


def sexp_to_dict(sexp) -> dict:
    """Convert S-expression key-value pairs to dict."""
    result = {}
    i = 0
    while i < len(sexp):
        if isinstance(sexp[i], Keyword):
            key = sexp[i].name.replace("-", "_")
            i += 1
            if i < len(sexp):
                value = sexp[i]
                # Check for bind expression and convert to dict format
                if isinstance(value, list) and value and isinstance(value[0], Symbol) and value[0].name == "bind":
                    value = parse_bind_sexp(value)
                result[key] = value
                i += 1
        else:
            i += 1
    return result


def parse_step_sexp(sexp) -> dict:
    """Parse a step S-expression.

    Supports two formats:
    1. (step "id" :cache-id "..." :type "SOURCE" :path "..." :inputs [...])
    2. (step "id" :cache-id "..." :level 1 (source :path "..." :inputs [...]))
    """
    step = {
        "inputs": [],
        "config": {},
    }

    i = 1  # Skip 'step' symbol
    if i < len(sexp) and isinstance(sexp[i], str):
        step["step_id"] = sexp[i]
        i += 1

    while i < len(sexp):
        item = sexp[i]

        if isinstance(item, Keyword):
            key = item.name.replace("-", "_")
            i += 1
            if i < len(sexp):
                value = sexp[i]
                if key == "type":
                    step["node_type"] = value if isinstance(value, str) else value.name
                elif key == "inputs":
                    step["inputs"] = value if isinstance(value, list) else [value]
                elif key in ("level", "cache", "cache_id"):
                    if key == "cache":
                        key = "cache_id"
                    step[key] = value
                else:
                    # Check for bind expression
                    if isinstance(value, list) and value and isinstance(value[0], Symbol) and value[0].name == "bind":
                        value = parse_bind_sexp(value)
                    # Config value
                    step["config"][key] = value
                i += 1
        elif isinstance(item, list) and item and isinstance(item[0], Symbol):
            # Nested node expression: (source :path "..." :inputs [...])
            node_type = item[0].name.upper()
            step["node_type"] = node_type

            # Parse node config
            j = 1
            while j < len(item):
                if isinstance(item[j], Keyword):
                    key = item[j].name.replace("-", "_")
                    j += 1
                    if j < len(item):
                        value = item[j]
                        if key == "inputs":
                            step["inputs"] = value if isinstance(value, list) else [value]
                        else:
                            # Check for bind expression
                            if isinstance(value, list) and value and isinstance(value[0], Symbol) and value[0].name == "bind":
                                value = parse_bind_sexp(value)
                            step["config"][key] = value
                        j += 1
                else:
                    j += 1
            i += 1
        else:
            i += 1

    return step


def parse_plan_input(content: str) -> dict:
    """Parse plan from JSON or S-expression string."""
    content = content.strip()
    if content.startswith("{"):
        return json.loads(content)
    elif content.startswith("("):
        sexp = parse(content)
        return sexp_to_plan(sexp[0] if isinstance(sexp, list) and len(sexp) == 1 else sexp)
    else:
        raise ValueError("Plan must be JSON (starting with '{') or S-expression (starting with '(')")


# Default encoding settings
DEFAULT_ENCODING = {
    "codec": "libx264",
    "preset": "fast",
    "crf": 18,
    "audio_codec": "aac",
    "fps": 30,
}


def get_encoding(recipe_encoding: dict, step_config: dict) -> dict:
    """Merge encoding settings: defaults < recipe < step overrides."""
    encoding = {**DEFAULT_ENCODING}
    encoding.update(recipe_encoding)
    if "encoding" in step_config:
        encoding.update(step_config["encoding"])
    return encoding


class SexpEffectModule:
    """Wrapper for S-expression effects to provide process_frame interface."""

    def __init__(self, effect_path: Path):
        from sexp_effects import get_interpreter
        self.interp = get_interpreter()
        self.interp.load_effect(str(effect_path))
        self.effect_name = effect_path.stem

    def process_frame(self, frame, params, state):
        return self.interp.run_effect(self.effect_name, frame, params, state or {})


def load_effect(effect_path: Path):
    """Load an effect module from a local path (.py or .sexp)."""
    if effect_path.suffix == ".sexp":
        return SexpEffectModule(effect_path)

    spec = importlib.util.spec_from_file_location("effect", effect_path)
    module = importlib.util.module_from_spec(spec)
    spec.loader.exec_module(module)
    return module


def interpolate_analysis(times: list, values: list, t: float) -> float:
    """Interpolate analysis value at time t."""
    if not times or not values:
        return 0.0
    if t <= times[0]:
        return values[0]
    if t >= times[-1]:
        return values[-1]

    # Binary search for surrounding times
    lo, hi = 0, len(times) - 1
    while lo < hi - 1:
        mid = (lo + hi) // 2
        if times[mid] <= t:
            lo = mid
        else:
            hi = mid

    # Linear interpolation
    t0, t1 = times[lo], times[hi]
    v0, v1 = values[lo], values[hi]
    if t1 == t0:
        return v0
    alpha = (t - t0) / (t1 - t0)
    return v0 + alpha * (v1 - v0)


def apply_transform(value: float, transform: str) -> float:
    """Apply a transform function to a value (0-1 range)."""
    if transform is None:
        return value
    if transform == "sqrt":
        return value ** 0.5
    elif transform == "pow2":
        return value ** 2
    elif transform == "pow3":
        return value ** 3
    elif transform == "log":
        # Logarithmic scale: log(1 + 9*x) / log(10) maps 0-1 to 0-1 with log curve
        import math
        return math.log(1 + 9 * value) / math.log(10) if value > 0 else 0
    elif transform == "exp":
        # Exponential scale: (10^x - 1) / 9 maps 0-1 to 0-1 with exp curve
        return (10 ** value - 1) / 9
    elif transform == "inv":
        return 1 - value
    else:
        return value


def resolve_params(params: dict, frame_time: float, analysis_data: dict) -> dict:
    """Resolve any binding params using analysis data at frame_time."""
    resolved = {}
    for key, value in params.items():
        if isinstance(value, dict) and ("_bind" in value or "_binding" in value):
            # This is a binding - resolve it
            # Support both old format (_bind) and new format (_binding)
            if "_bind" in value:
                # Old format: {"_bind": "ref", "range_min": 0, "range_max": 1}
                ref = value["_bind"]
                range_min = value.get("range_min", 0.0)
                range_max = value.get("range_max", 1.0)
            else:
                # New format from compiler: {"_binding": True, "source": "node_id", "feature": "values", "range": [min, max]}
                ref = value.get("source", "")
                range_val = value.get("range", [0.0, 1.0])
                range_min = range_val[0] if isinstance(range_val, list) else 0.0
                range_max = range_val[1] if isinstance(range_val, list) and len(range_val) > 1 else 1.0

            transform = value.get("transform")
            bind_offset = value.get("offset", 0.0)

            # Look up analysis track
            track = analysis_data.get(ref, {})
            times = track.get("times", [])
            values = track.get("values", [])

            # Interpolate raw value (0-1) - add binding offset to frame_time
            lookup_time = frame_time + bind_offset
            raw = interpolate_analysis(times, values, lookup_time)

            # Apply transform to raw value (before range scaling)
            transformed = apply_transform(raw, transform)

            # Map to output range
            resolved[key] = range_min + transformed * (range_max - range_min)
        else:
            resolved[key] = value
    return resolved


def run_effect(effect_module, input_path: Path, output_path: Path, params: dict, encoding: dict, analysis_data: dict = None, time_offset: float = 0.0, max_duration: float = None):
    """Run an effect on a video file.

    Args:
        time_offset: Time offset in seconds for resolving bindings (e.g., segment start time in audio)
        max_duration: Maximum duration in seconds to process (stops after this many seconds of frames)
    """
    import numpy as np

    # Clean nil Symbols from params
    params = clean_nil_symbols(params)

    # Get video info
    probe_cmd = [
        "ffprobe", "-v", "quiet", "-print_format", "json",
        "-show_streams", str(input_path)
    ]
    probe_result = subprocess.run(probe_cmd, capture_output=True, text=True)
    probe_data = json.loads(probe_result.stdout)

    # Find video stream
    video_stream = None
    for stream in probe_data.get("streams", []):
        if stream.get("codec_type") == "video":
            video_stream = stream
            break

    if not video_stream:
        raise ValueError("No video stream found")

    in_width = int(video_stream["width"])
    in_height = int(video_stream["height"])

    # Get framerate
    fps_str = video_stream.get("r_frame_rate", "30/1")
    if "/" in fps_str:
        num, den = fps_str.split("/")
        fps = float(num) / float(den)
    else:
        fps = float(fps_str)

    # Read frames with ffmpeg
    read_cmd = [
        "ffmpeg", "-i", str(input_path),
        "-f", "rawvideo", "-pix_fmt", "rgb24", "-"
    ]
    read_proc = subprocess.Popen(read_cmd, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL)

    # Check if we have any bindings that need per-frame resolution
    has_bindings = any(isinstance(v, dict) and ("_bind" in v or "_binding" in v) for v in params.values())
    analysis_data = analysis_data or {}

    # Debug: print bindings and analysis info once
    if has_bindings:
        print(f"    BINDINGS DEBUG: time_offset={time_offset:.2f}", file=sys.stderr)
        for k, v in params.items():
            if isinstance(v, dict) and ("_bind" in v or "_binding" in v):
                ref = v.get("_bind") or v.get("source")
                bind_offset = float(v.get("offset", 0.0))
                track = analysis_data.get(ref, {})
                times = track.get("times", [])
                values = track.get("values", [])
                if times and values:
                    # Find first non-zero value
                    first_nonzero_idx = next((i for i, v in enumerate(values) if v > 0.01), -1)
                    first_nonzero_time = times[first_nonzero_idx] if first_nonzero_idx >= 0 else -1
                    print(f"      param {k}: ref='{ref}' bind_offset={bind_offset} time_range=[{min(times):.2f}, {max(times):.2f}]", file=sys.stderr)
                    print(f"        first_nonzero at t={first_nonzero_time:.2f} max_value={max(values):.4f}", file=sys.stderr)
                else:
                    raise ValueError(f"Binding for param '{k}' references '{ref}' but no analysis data found. Available: {list(analysis_data.keys())}")

    # Process first frame to detect output dimensions
    in_frame_size = in_width * in_height * 3
    frame_data = read_proc.stdout.read(in_frame_size)
    if len(frame_data) < in_frame_size:
        read_proc.stdout.close()
        read_proc.wait()
        raise ValueError("No frames in input video")

    frame = np.frombuffer(frame_data, dtype=np.uint8).reshape((in_height, in_width, 3))

    # Resolve params for first frame
    if has_bindings:
        frame_params = resolve_params(params, time_offset, analysis_data)
    else:
        frame_params = params

    state = None
    processed, state = effect_module.process_frame(frame, frame_params, state)

    # Get output dimensions from processed frame
    out_height, out_width = processed.shape[:2]
    if out_width != in_width or out_height != in_height:
        print(f"    Effect resizes: {in_width}x{in_height} -> {out_width}x{out_height}", file=sys.stderr)

    # Now start write process with correct output dimensions
    write_cmd = [
        "ffmpeg", "-y",
        "-f", "rawvideo", "-pix_fmt", "rgb24",
        "-s", f"{out_width}x{out_height}", "-r", str(encoding.get("fps", 30)),
        "-i", "-",
        "-i", str(input_path),  # For audio
        "-map", "0:v", "-map", "1:a?",
        "-c:v", encoding["codec"], "-preset", encoding["preset"], "-crf", str(encoding["crf"]),
        "-pix_fmt", "yuv420p",
        "-c:a", encoding["audio_codec"],
        str(output_path)
    ]
    write_proc = subprocess.Popen(write_cmd, stdin=subprocess.PIPE, stderr=subprocess.DEVNULL)

    # Write first processed frame
    write_proc.stdin.write(processed.tobytes())
    frame_count = 1

    # Calculate max frames if duration limit specified
    max_frames = None
    if max_duration:
        max_frames = int(max_duration * fps)

    # Process remaining frames
    while True:
        # Stop if we've reached the frame limit
        if max_frames and frame_count >= max_frames:
            break

        frame_data = read_proc.stdout.read(in_frame_size)
        if len(frame_data) < in_frame_size:
            break

        frame = np.frombuffer(frame_data, dtype=np.uint8).reshape((in_height, in_width, 3))

        # Resolve params for this frame
        if has_bindings:
            frame_time = time_offset + frame_count / fps
            frame_params = resolve_params(params, frame_time, analysis_data)
        else:
            frame_params = params

        processed, state = effect_module.process_frame(frame, frame_params, state)
        write_proc.stdin.write(processed.tobytes())
        frame_count += 1

        if frame_count % 30 == 0:
            print(f"    Processed {frame_count} frames...", end="\r", file=sys.stderr)

    read_proc.stdout.close()
    write_proc.stdin.close()
    read_proc.wait()
    write_proc.wait()

    print(f"    Processed {frame_count} frames total", file=sys.stderr)


def run_multi_effect(effect_module, input_paths: List[Path], output_path: Path, params: dict, encoding: dict, analysis_data: dict = None, time_offset: float = 0.0, max_duration: float = None):
    """Run a multi-input effect on multiple video files.

    Args:
        time_offset: Time offset in seconds for resolving bindings (e.g., segment start time in audio)
        max_duration: Maximum duration in seconds to process (stops after this many seconds of frames)
    """
    import numpy as np

    # Clean nil Symbols from params
    params = clean_nil_symbols(params)

    if len(input_paths) < 2:
        raise ValueError("Multi-input effect requires at least 2 inputs")

    # Get video info for each input (preserve original dimensions)
    input_infos = []
    for input_path in input_paths:
        probe_cmd = [
            "ffprobe", "-v", "quiet", "-print_format", "json",
            "-show_streams", str(input_path)
        ]
        probe_result = subprocess.run(probe_cmd, capture_output=True, text=True)
        probe_data = json.loads(probe_result.stdout)

        video_stream = None
        for stream in probe_data.get("streams", []):
            if stream.get("codec_type") == "video":
                video_stream = stream
                break

        if not video_stream:
            raise ValueError(f"No video stream found in {input_path}")

        w = int(video_stream["width"])
        h = int(video_stream["height"])
        input_infos.append({"width": w, "height": h, "path": input_path})
        print(f"    Input: {input_path.name} ({w}x{h})", file=sys.stderr)

    # Get framerate from first input
    probe_cmd = [
        "ffprobe", "-v", "quiet", "-print_format", "json",
        "-show_streams", str(input_paths[0])
    ]
    probe_result = subprocess.run(probe_cmd, capture_output=True, text=True)
    probe_data = json.loads(probe_result.stdout)
    video_stream = next(s for s in probe_data.get("streams", []) if s.get("codec_type") == "video")
    fps_str = video_stream.get("r_frame_rate", "30/1")
    if "/" in fps_str:
        num, den = fps_str.split("/")
        fps = float(num) / float(den)
    else:
        fps = float(fps_str)

    # Open read processes for all inputs - preserve original dimensions
    read_procs = []
    for info in input_infos:
        read_cmd = [
            "ffmpeg", "-i", str(info["path"]),
            "-f", "rawvideo", "-pix_fmt", "rgb24",
            "-"  # Don't scale - keep original dimensions
        ]
        proc = subprocess.Popen(read_cmd, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL)
        read_procs.append(proc)

    analysis_data = analysis_data or {}
    state = None

    # Process first frame to detect output dimensions
    frames = []
    for i, (proc, info) in enumerate(zip(read_procs, input_infos)):
        frame_size = info["width"] * info["height"] * 3
        frame_data = proc.stdout.read(frame_size)
        if len(frame_data) < frame_size:
            # Cleanup
            for p in read_procs:
                p.stdout.close()
                p.wait()
            raise ValueError(f"No frames in input {i}")
        frame = np.frombuffer(frame_data, dtype=np.uint8).reshape((info["height"], info["width"], 3))
        frames.append(frame)

    # Check if we have any bindings that need per-frame resolution
    has_bindings = any(isinstance(v, dict) and ("_bind" in v or "_binding" in v) for v in params.values())

    # Resolve params for first frame
    if has_bindings:
        frame_params = resolve_params(params, time_offset, analysis_data)
    else:
        frame_params = params

    processed, state = effect_module.process_frame(frames, frame_params, state)
    out_height, out_width = processed.shape[:2]
    print(f"    Output dimensions: {out_width}x{out_height}", file=sys.stderr)

    # Now start write process with correct output dimensions
    write_cmd = [
        "ffmpeg", "-y",
        "-f", "rawvideo", "-pix_fmt", "rgb24",
        "-s", f"{out_width}x{out_height}", "-r", str(encoding.get("fps", 30)),
        "-i", "-",
        "-i", str(input_paths[0]),  # For audio from first input
        "-map", "0:v", "-map", "1:a?",
        "-c:v", encoding["codec"], "-preset", encoding["preset"], "-crf", str(encoding["crf"]),
        "-pix_fmt", "yuv420p",
        "-c:a", encoding["audio_codec"],
        str(output_path)
    ]
    write_proc = subprocess.Popen(write_cmd, stdin=subprocess.PIPE, stderr=subprocess.DEVNULL)

    # Write first processed frame
    write_proc.stdin.write(processed.tobytes())
    frame_count = 1

    # Calculate max frames if duration limit specified
    max_frames = None
    if max_duration:
        max_frames = int(max_duration * fps)

    # Process remaining frames
    while True:
        # Stop if we've reached the frame limit
        if max_frames and frame_count >= max_frames:
            break

        # Read frame from each input (each may have different dimensions)
        frames = []
        all_valid = True
        for i, (proc, info) in enumerate(zip(read_procs, input_infos)):
            frame_size = info["width"] * info["height"] * 3
            frame_data = proc.stdout.read(frame_size)
            if len(frame_data) < frame_size:
                all_valid = False
                break
            frame = np.frombuffer(frame_data, dtype=np.uint8).reshape((info["height"], info["width"], 3))
            frames.append(frame)

        if not all_valid:
            break

        # Resolve params for this frame
        if has_bindings:
            frame_time = time_offset + frame_count / fps
            frame_params = resolve_params(params, frame_time, analysis_data)
        else:
            frame_params = params

        # Pass list of frames to effect
        processed, state = effect_module.process_frame(frames, frame_params, state)
        write_proc.stdin.write(processed.tobytes())
        frame_count += 1

        if frame_count % 30 == 0:
            print(f"    Processed {frame_count} frames...", end="\r", file=sys.stderr)

    # Cleanup
    for proc in read_procs:
        proc.stdout.close()
        proc.wait()
    write_proc.stdin.close()
    write_proc.wait()

    print(f"    Processed {frame_count} frames total", file=sys.stderr)


def get_video_dimensions(file_path: Path) -> tuple:
    """Get video dimensions using ffprobe."""
    cmd = [
        "ffprobe", "-v", "quiet", "-print_format", "json",
        "-show_streams", str(file_path)
    ]
    result = subprocess.run(cmd, capture_output=True, text=True)
    data = json.loads(result.stdout)

    for stream in data.get("streams", []):
        if stream.get("codec_type") == "video":
            return int(stream["width"]), int(stream["height"])

    return None, None


def normalize_video(
    input_path: Path,
    output_path: Path,
    target_width: int,
    target_height: int,
    resize_mode: str,
    priority: str = None,
    pad_color: str = "black",
    crop_gravity: str = "center",
    encoding: dict = None,
) -> Path:
    """
    Normalize video to target dimensions.

    resize_mode:
        - stretch: force to exact size (distorts)
        - crop: scale to fill, crop overflow
        - fit: scale to fit, pad remainder
        - cover: scale to cover, crop minimally

    priority: width | height (which dimension to match exactly for fit/crop)
    """
    enc = encoding or {}
    src_width, src_height = get_video_dimensions(input_path)

    if src_width is None:
        # Can't determine dimensions, just copy
        shutil.copy(input_path, output_path)
        return output_path

    # Already correct size?
    if src_width == target_width and src_height == target_height:
        shutil.copy(input_path, output_path)
        return output_path

    src_aspect = src_width / src_height
    target_aspect = target_width / target_height

    if resize_mode == "stretch":
        # Force exact size
        vf = f"scale={target_width}:{target_height}"

    elif resize_mode == "fit":
        # Scale to fit within bounds, pad remainder
        if priority == "width":
            # Match width exactly, pad height
            vf = f"scale={target_width}:-1,pad={target_width}:{target_height}:(ow-iw)/2:(oh-ih)/2:{pad_color}"
        elif priority == "height":
            # Match height exactly, pad width
            vf = f"scale=-1:{target_height},pad={target_width}:{target_height}:(ow-iw)/2:(oh-ih)/2:{pad_color}"
        else:
            # Auto: fit within bounds (may pad both)
            if src_aspect > target_aspect:
                # Source is wider, fit to width
                vf = f"scale={target_width}:-1,pad={target_width}:{target_height}:(ow-iw)/2:(oh-ih)/2:{pad_color}"
            else:
                # Source is taller, fit to height
                vf = f"scale=-1:{target_height},pad={target_width}:{target_height}:(ow-iw)/2:(oh-ih)/2:{pad_color}"

    elif resize_mode == "crop":
        # Scale to fill, crop overflow
        if priority == "width":
            # Match width, crop height
            vf = f"scale={target_width}:-1,crop={target_width}:{target_height}"
        elif priority == "height":
            # Match height, crop width
            vf = f"scale=-1:{target_height},crop={target_width}:{target_height}"
        else:
            # Auto: fill bounds, crop minimally
            if src_aspect > target_aspect:
                # Source is wider, match height and crop width
                vf = f"scale=-1:{target_height},crop={target_width}:{target_height}"
            else:
                # Source is taller, match width and crop height
                vf = f"scale={target_width}:-1,crop={target_width}:{target_height}"

    elif resize_mode == "cover":
        # Scale to cover target, crop to exact size
        if src_aspect > target_aspect:
            vf = f"scale=-1:{target_height},crop={target_width}:{target_height}"
        else:
            vf = f"scale={target_width}:-1,crop={target_width}:{target_height}"

    else:
        # Unknown mode, just copy
        shutil.copy(input_path, output_path)
        return output_path

    cmd = [
        "ffmpeg", "-y", "-i", str(input_path),
        "-vf", vf,
        "-r", str(enc.get("fps", 30)),  # Normalize framerate for concat compatibility
        "-c:v", enc.get("codec", "libx264"),
        "-preset", enc.get("preset", "fast"),
        "-crf", str(enc.get("crf", 18)),
        "-pix_fmt", "yuv420p",  # Normalize pixel format for concat compatibility
        "-c:a", enc.get("audio_codec", "aac"),
        str(output_path)
    ]
    subprocess.run(cmd, check=True, capture_output=True)
    return output_path


def tree_concat(files: list, work_dir: Path, prefix: str = "concat") -> Path:
    """Concatenate files using a binary tree approach."""
    if len(files) == 1:
        return files[0]

    level = 0
    current_files = list(files)
    print(f"  Tree concat: {len(current_files)} files", file=sys.stderr)
    for i, f in enumerate(current_files):
        print(f"    [{i}] {f}", file=sys.stderr)

    while len(current_files) > 1:
        next_files = []
        pairs = (len(current_files) + 1) // 2
        print(f"    Level {level}: {len(current_files)} -> {pairs} pairs", file=sys.stderr)

        for i in range(0, len(current_files), 2):
            if i + 1 < len(current_files):
                concat_file = work_dir / f"{prefix}_L{level}_{i}.txt"
                output_file = work_dir / f"{prefix}_L{level}_{i}.mp4"

                with open(concat_file, "w") as f:
                    f.write(f"file '{current_files[i]}'\n")
                    f.write(f"file '{current_files[i+1]}'\n")

                cmd = ["ffmpeg", "-y", "-f", "concat", "-safe", "0",
                       "-i", str(concat_file), "-c", "copy", str(output_file)]
                subprocess.run(cmd, capture_output=True)
                next_files.append(output_file)
            else:
                next_files.append(current_files[i])

        current_files = next_files
        level += 1

    return current_files[0]


def execute_plan(plan_path: Path = None, output_path: Path = None, recipe_dir: Path = None, plan_data: dict = None, external_analysis: dict = None):
    """Execute a plan file (S-expression) or plan dict."""

    # Load plan from file, stdin, or dict
    if plan_data:
        plan = plan_data
    elif plan_path and str(plan_path) != "-":
        content = plan_path.read_text()
        plan = parse_plan_input(content)
    else:
        # Read from stdin
        content = sys.stdin.read()
        plan = parse_plan_input(content)

    print(f"Executing plan: {plan['plan_id'][:16]}...", file=sys.stderr)
    print(f"Recipe: {plan['recipe_id']}", file=sys.stderr)
    print(f"Steps: {len(plan['steps'])}", file=sys.stderr)

    recipe_encoding = plan.get("encoding", {})

    # Use external analysis if provided, otherwise fall back to plan's embedded analysis
    analysis_data = external_analysis or plan.get("analysis", {})
    if recipe_dir is None:
        recipe_dir = plan_path.parent if plan_path else Path(".")

    if analysis_data:
        print(f"Analysis tracks: {list(analysis_data.keys())}", file=sys.stderr)

    # Execute steps
    results = {}  # step_id -> output_path
    work_dir = Path(tempfile.mkdtemp(prefix="artdag_exec_"))

    # Sort steps: SOURCE first, then by level, but ANALYZE before COMPOUND/EFFECT at any level
    # This ensures analysis data is available for binding resolution
    steps = plan["steps"]
    def step_sort_key(s):
        node_type = s.get("node_type") or "UNKNOWN"
        # Handle node_type being a Symbol
        if hasattr(node_type, 'name'):
            node_type = node_type.name
        level = s.get("level", 0)
        # Ensure level is an int (could be Symbol or None)
        if not isinstance(level, int):
            level = 0
        # Priority: SOURCE=0, SEGMENT=1, ANALYZE=2, others=3
        if node_type == "SOURCE":
            type_priority = 0
        elif node_type == "SEGMENT":
            type_priority = 1
        elif node_type == "ANALYZE":
            type_priority = 2
        else:
            type_priority = 3
        return (type_priority, level)
    ordered_steps = sorted(steps, key=step_sort_key)

    try:
        for step in ordered_steps:
            step_id = step["step_id"]
            node_type = step["node_type"]
            config = step["config"]
            inputs = step.get("inputs", [])

            print(f"\n[{step.get('level', 0)}] {node_type}: {step_id[:16]}...", file=sys.stderr)

            if node_type == "SOURCE":
                if "path" in config:
                    src_path = (recipe_dir / config["path"]).resolve()
                    if not src_path.exists():
                        raise FileNotFoundError(f"Source not found: {src_path}")
                    results[step_id] = src_path
                    print(f"  -> {src_path}", file=sys.stderr)

            elif node_type == "SEGMENT":
                input_path = results[inputs[0]]
                start = config.get("start", 0)
                duration = config.get("duration")
                end = config.get("end")

                is_audio = str(input_path).lower().endswith(
                    ('.mp3', '.wav', '.flac', '.aac', '.ogg', '.m4a'))
                enc = get_encoding(recipe_encoding, config)

                if is_audio:
                    output_file = work_dir / f"segment_{step_id}.m4a"
                    cmd = ["ffmpeg", "-y", "-i", str(input_path)]
                    if start:
                        cmd.extend(["-ss", str(start)])
                    if duration:
                        cmd.extend(["-t", str(duration)])
                    cmd.extend(["-c:a", enc["audio_codec"], str(output_file)])
                else:
                    output_file = work_dir / f"segment_{step_id}.mp4"
                    cmd = ["ffmpeg", "-y", "-i", str(input_path)]
                    if start:
                        cmd.extend(["-ss", str(start)])
                    if duration:
                        cmd.extend(["-t", str(duration)])
                    elif end:
                        cmd.extend(["-t", str(end - start)])
                    cmd.extend(["-r", str(enc["fps"]),  # Normalize frame rate
                               "-c:v", enc["codec"], "-preset", enc["preset"],
                               "-crf", str(enc["crf"]), "-c:a", enc["audio_codec"],
                               str(output_file)])

                result = subprocess.run(cmd, capture_output=True, text=True)

                # Check if segment has video content, if not try with looping
                needs_loop = False
                if not is_audio and result.returncode == 0:
                    probe_cmd = ["ffprobe", "-v", "quiet", "-print_format", "json",
                                 "-show_streams", str(output_file)]
                    probe_result = subprocess.run(probe_cmd, capture_output=True, text=True)
                    probe_data = json.loads(probe_result.stdout)
                    has_video = any(s.get("codec_type") == "video" for s in probe_data.get("streams", []))
                    if not has_video:
                        needs_loop = True

                if needs_loop or result.returncode != 0:
                    # Get source duration and loop the input
                    probe_cmd = ["ffprobe", "-v", "quiet", "-print_format", "json",
                                 "-show_format", str(input_path)]
                    probe_result = subprocess.run(probe_cmd, capture_output=True, text=True)
                    probe_data = json.loads(probe_result.stdout)
                    src_duration = float(probe_data.get("format", {}).get("duration", 0))

                    if src_duration > 0:
                        # Wrap start time to source duration
                        wrapped_start = start % src_duration if start else 0
                        seg_duration = duration if duration else (end - start if end else None)

                        print(f"    Wrapping segment: {start:.2f}s -> {wrapped_start:.2f}s (source={src_duration:.2f}s)", file=sys.stderr)

                        # Use stream_loop for seamless looping if segment spans wrap point
                        if wrapped_start + (seg_duration or 0) > src_duration:
                            # Need to loop - use concat filter
                            cmd = ["ffmpeg", "-y", "-stream_loop", "-1", "-i", str(input_path)]
                            cmd.extend(["-ss", str(wrapped_start)])
                            if seg_duration:
                                cmd.extend(["-t", str(seg_duration)])
                            cmd.extend(["-r", str(enc["fps"]),
                                       "-c:v", enc["codec"], "-preset", enc["preset"],
                                       "-crf", str(enc["crf"]), "-c:a", enc["audio_codec"],
                                       str(output_file)])
                        else:
                            cmd = ["ffmpeg", "-y", "-i", str(input_path)]
                            cmd.extend(["-ss", str(wrapped_start)])
                            if seg_duration:
                                cmd.extend(["-t", str(seg_duration)])
                            cmd.extend(["-r", str(enc["fps"]),
                                       "-c:v", enc["codec"], "-preset", enc["preset"],
                                       "-crf", str(enc["crf"]), "-c:a", enc["audio_codec"],
                                       str(output_file)])

                        subprocess.run(cmd, check=True, capture_output=True)
                    else:
                        raise ValueError(f"Cannot determine source duration for looping")

                results[step_id] = output_file
                print(f"  -> {output_file}", file=sys.stderr)

            elif node_type == "EFFECT":
                effect_name = config.get("effect", "unknown")
                effect_path = config.get("effect_path")
                is_multi_input = config.get("multi_input", False)

                output_file = work_dir / f"effect_{step_id}.mp4"
                enc = get_encoding(recipe_encoding, config)

                if effect_path:
                    full_path = recipe_dir / effect_path
                    effect_module = load_effect(full_path)
                    params = {k: v for k, v in config.items()
                              if k not in ("effect", "effect_path", "cid", "encoding", "multi_input")}
                    print(f"  Effect: {effect_name}", file=sys.stderr)

                    # Get timing offset and duration for bindings
                    effect_time_offset = config.get("start", config.get("segment_start", 0))
                    effect_duration = config.get("duration")

                    if is_multi_input and len(inputs) > 1:
                        # Multi-input effect (blend, layer, etc.)
                        input_paths = [results[inp] for inp in inputs]
                        run_multi_effect(effect_module, input_paths, output_file, params, enc, analysis_data, time_offset=effect_time_offset, max_duration=effect_duration)
                    else:
                        # Single-input effect
                        input_path = results[inputs[0]]
                        run_effect(effect_module, input_path, output_file, params, enc, analysis_data, time_offset=effect_time_offset, max_duration=effect_duration)
                else:
                    input_path = results[inputs[0]]
                    shutil.copy(input_path, output_file)

                results[step_id] = output_file
                print(f"  -> {output_file}", file=sys.stderr)

            elif node_type == "SEQUENCE":
                if len(inputs) < 2:
                    results[step_id] = results[inputs[0]]
                    continue

                input_files = [results[inp] for inp in inputs]
                enc = get_encoding(recipe_encoding, config)

                # Check for normalization config
                resize_mode = config.get("resize_mode")
                if resize_mode:
                    # Determine target dimensions
                    target_width = config.get("target_width") or enc.get("width")
                    target_height = config.get("target_height") or enc.get("height")

                    # If no explicit target, use first input's dimensions
                    if not target_width or not target_height:
                        first_w, first_h = get_video_dimensions(input_files[0])
                        target_width = target_width or first_w
                        target_height = target_height or first_h

                    if target_width and target_height:
                        print(f"  Normalizing {len(input_files)} inputs to {target_width}x{target_height} ({resize_mode})", file=sys.stderr)
                        normalized_files = []
                        for i, inp_file in enumerate(input_files):
                            norm_file = work_dir / f"norm_{step_id[:8]}_{i:04d}.mp4"
                            normalize_video(
                                inp_file, norm_file,
                                target_width, target_height,
                                resize_mode,
                                priority=config.get("priority"),
                                pad_color=config.get("pad_color", "black"),
                                crop_gravity=config.get("crop_gravity", "center"),
                                encoding=enc,
                            )
                            normalized_files.append(norm_file)
                        input_files = normalized_files

                # Use tree concat for efficiency
                output_file = tree_concat(input_files, work_dir, f"seq_{step_id[:8]}")
                results[step_id] = output_file
                print(f"  -> {output_file}", file=sys.stderr)

            elif node_type == "MUX":
                video_path = results[inputs[0]]
                audio_path = results[inputs[1]]
                enc = get_encoding(recipe_encoding, config)

                output_file = work_dir / f"mux_{step_id}.mp4"
                cmd = ["ffmpeg", "-y",
                       "-i", str(video_path), "-i", str(audio_path),
                       "-map", "0:v", "-map", "1:a",
                       "-c:v", enc["codec"], "-preset", enc["preset"],
                       "-crf", str(enc["crf"]), "-c:a", enc["audio_codec"],
                       "-shortest", str(output_file)]

                subprocess.run(cmd, check=True, capture_output=True)
                results[step_id] = output_file
                print(f"  -> {output_file}", file=sys.stderr)

            elif node_type == "ANALYZE":
                output_file = work_dir / f"analysis_{step_id}.json"

                if "analysis_results" in config:
                    # Analysis was done during planning
                    with open(output_file, "w") as f:
                        json.dump(config["analysis_results"], f)
                    analysis_data[step_id] = config["analysis_results"]
                    print(f"  -> {output_file} (from plan)", file=sys.stderr)
                else:
                    # Run analyzer now
                    analyzer_path = config.get("analyzer_path")
                    if analyzer_path:
                        analyzer_path = (recipe_dir / analyzer_path).resolve()
                        input_path = results[inputs[0]]

                        # Load and run analyzer
                        import importlib.util
                        spec = importlib.util.spec_from_file_location("analyzer", analyzer_path)
                        analyzer_module = importlib.util.module_from_spec(spec)
                        spec.loader.exec_module(analyzer_module)

                        # Run analysis
                        analyzer_params = {k: v for k, v in config.items()
                                         if k not in ("analyzer", "analyzer_path", "cid")}
                        analysis_result = analyzer_module.analyze(input_path, analyzer_params)

                        # Save and store results
                        with open(output_file, "w") as f:
                            json.dump(analysis_result, f)
                        analysis_data[step_id] = analysis_result
                        print(f"  -> {output_file} (ran analyzer: {len(analysis_result.get('times', []))} pts)", file=sys.stderr)
                    else:
                        print(f"  -> no analyzer path!", file=sys.stderr)

                results[step_id] = output_file

            elif node_type == "COMPOUND":
                # Collapsed effect chains - compile to single FFmpeg command with sendcmd
                filter_chain_raw = config.get("filter_chain", [])
                if not filter_chain_raw:
                    raise ValueError("COMPOUND step has empty filter_chain")

                # Convert filter_chain items from S-expression lists to dicts
                # and clean nil Symbols from configs
                filter_chain = []
                for item in filter_chain_raw:
                    if isinstance(item, dict):
                        # Clean nil Symbols from the config
                        cleaned_item = clean_nil_symbols(item)
                        filter_chain.append(cleaned_item)
                    elif isinstance(item, list) and item:
                        item_dict = sexp_to_dict(item)
                        ftype = item_dict.get("type", "UNKNOWN")
                        if isinstance(ftype, Symbol):
                            ftype = ftype.name
                        fconfig_raw = item_dict.get("config", {})
                        if isinstance(fconfig_raw, list):
                            fconfig = sexp_to_dict(fconfig_raw)
                        elif isinstance(fconfig_raw, dict):
                            fconfig = fconfig_raw
                        else:
                            fconfig = {}
                        # Clean nil Symbols from config
                        fconfig = clean_nil_symbols(fconfig)
                        filter_chain.append({"type": ftype, "config": fconfig})
                    else:
                        filter_chain.append({"type": "UNKNOWN", "config": {}})

                input_path = results[inputs[0]]
                # Debug: verify input exists and has content
                if not input_path.exists():
                    raise ValueError(f"COMPOUND input does not exist: {input_path}")
                if input_path.stat().st_size == 0:
                    raise ValueError(f"COMPOUND input is empty: {input_path}")
                print(f"  COMPOUND input: {input_path} ({input_path.stat().st_size} bytes)", file=sys.stderr)
                enc = get_encoding(recipe_encoding, config)
                output_file = work_dir / f"compound_{step_id}.mp4"

                # Extract segment timing and effects
                segment_start = 0
                segment_duration = None
                effects = []

                for filter_item in filter_chain:
                    filter_type = filter_item.get("type", "")
                    filter_config = filter_item.get("config", {})

                    if filter_type == "SEGMENT":
                        segment_start = filter_config.get("start", 0)
                        segment_duration = filter_config.get("duration")
                        if not segment_duration and filter_config.get("end"):
                            segment_duration = filter_config["end"] - segment_start
                    elif filter_type == "EFFECT":
                        effects.append(filter_config)

                # Try to compile effects to FFmpeg filters
                from artdag.sexp.ffmpeg_compiler import FFmpegCompiler, generate_sendcmd_filter
                compiler = FFmpegCompiler()

                # Check if any effect has bindings - these need Python path for per-frame resolution
                def has_bindings(effect_config):
                    for k, v in effect_config.items():
                        if isinstance(v, dict) and ("_bind" in v or "_binding" in v):
                            return True
                    return False

                any_has_bindings = any(has_bindings(e) for e in effects)

                # Check if all effects have FFmpeg mappings
                all_have_mappings = all(
                    compiler.get_mapping(e.get("effect", "")) is not None
                    for e in effects
                )

                # Use FFmpeg only for static effects (no bindings)
                # Effects with bindings use Python path for proper per-frame binding resolution
                if all_have_mappings and effects and not any_has_bindings:
                    # Compile to FFmpeg with sendcmd for dynamic params
                    ffmpeg_filters, sendcmd_path = generate_sendcmd_filter(
                        effects,
                        analysis_data,
                        segment_start,
                        segment_duration or 1.0,
                    )

                    # Build FFmpeg command
                    cmd = ["ffmpeg", "-y", "-i", str(input_path)]
                    if segment_start:
                        cmd.extend(["-ss", str(segment_start)])
                    if segment_duration:
                        cmd.extend(["-t", str(segment_duration)])

                    if ffmpeg_filters:
                        cmd.extend(["-vf", ffmpeg_filters])

                    cmd.extend(["-r", str(enc.get("fps", 30)),
                               "-c:v", enc["codec"], "-preset", enc["preset"],
                               "-crf", str(enc["crf"]), "-pix_fmt", "yuv420p",
                               "-c:a", enc["audio_codec"],
                               str(output_file)])

                    effect_names = [e.get("effect", "?") for e in effects]
                    print(f"  COMPOUND (FFmpeg): {', '.join(effect_names)}", file=sys.stderr)
                    print(f"    filters: {ffmpeg_filters[:80]}{'...' if len(ffmpeg_filters) > 80 else ''}", file=sys.stderr)

                    result = subprocess.run(cmd, capture_output=True, text=True)
                    if result.returncode != 0:
                        print(f"    FFmpeg error: {result.stderr[:200]}", file=sys.stderr)
                        raise RuntimeError(f"FFmpeg failed: {result.stderr}")

                    # Clean up sendcmd file
                    if sendcmd_path and sendcmd_path.exists():
                        sendcmd_path.unlink()
                else:
                    # Fall back to sequential processing for effects without FFmpeg mappings
                    current_input = input_path

                    # First handle segment
                    for filter_item in filter_chain:
                        if filter_item.get("type") == "SEGMENT":
                            filter_config = filter_item.get("config", {})
                            start = filter_config.get("start", 0)
                            duration = filter_config.get("duration")

                            if start or duration:
                                seg_output = work_dir / f"compound_{step_id}_seg.mp4"
                                cmd = ["ffmpeg", "-y", "-i", str(current_input)]
                                if start:
                                    cmd.extend(["-ss", str(start)])
                                if duration:
                                    cmd.extend(["-t", str(duration)])
                                cmd.extend(["-r", str(enc.get("fps", 30)),
                                           "-c:v", enc["codec"], "-preset", enc["preset"],
                                           "-crf", str(enc["crf"]), "-pix_fmt", "yuv420p",
                                           "-c:a", enc["audio_codec"],
                                           str(seg_output)])
                                print(f"  Extracting segment: start={start}, duration={duration}", file=sys.stderr)
                                result = subprocess.run(cmd, capture_output=True, text=True)
                                if result.returncode != 0:
                                    print(f"  FFmpeg segment error: {result.stderr}", file=sys.stderr)
                                    raise ValueError(f"FFmpeg segment extraction failed: {result.stderr}")
                                if not seg_output.exists() or seg_output.stat().st_size == 0:
                                    raise ValueError(f"Segment output invalid: {seg_output}")
                                print(f"  Segment output: {seg_output.stat().st_size} bytes", file=sys.stderr)
                                current_input = seg_output
                            break

                    # Then handle effects sequentially
                    for i, effect_config in enumerate(effects):
                        effect_name = effect_config.get("effect", "unknown")
                        effect_path = effect_config.get("effect_path")

                        # Try to resolve effect path
                        if not effect_path:
                            for effects_dir in ["effects", "sexp_effects/effects"]:
                                for ext in [".py", ".sexp"]:
                                    candidate = recipe_dir / effects_dir / f"{effect_name}{ext}"
                                    if candidate.exists():
                                        effect_path = str(candidate.relative_to(recipe_dir))
                                        break
                                if effect_path:
                                    break

                        is_last = (i == len(effects) - 1)
                        effect_output = output_file if is_last else work_dir / f"compound_{step_id}_fx_{i:02d}.mp4"

                        if effect_path:
                            full_path = recipe_dir / effect_path
                            effect_module = load_effect(full_path)
                            params = {k: v for k, v in effect_config.items()
                                      if k not in ("effect", "effect_path", "cid", "encoding", "type")}
                            print(f"  COMPOUND [{i+1}/{len(effects)}]: {effect_name} (Python)", file=sys.stderr)
                            # Debug: check input file
                            if not current_input.exists():
                                raise ValueError(f"Input file does not exist: {current_input}")
                            input_size = current_input.stat().st_size
                            print(f"    Input: {current_input.name} ({input_size} bytes)", file=sys.stderr)
                            if input_size == 0:
                                raise ValueError(f"Input file is empty: {current_input}")
                            run_effect(effect_module, current_input, effect_output, params, enc, analysis_data, time_offset=segment_start, max_duration=segment_duration)
                        else:
                            raise ValueError(f"COMPOUND EFFECT '{effect_name}' has no effect_path or FFmpeg mapping")

                        current_input = effect_output

                results[step_id] = output_file
                print(f"  -> {output_file}", file=sys.stderr)

            else:
                raise ValueError(f"Unknown node type: {node_type}")

        # Get final output
        final_output = results[plan["output_step_id"]]
        print(f"\n--- Output ---", file=sys.stderr)
        print(f"Final: {final_output}", file=sys.stderr)

        if output_path:
            # Handle stdout specially - remux to streamable format
            if str(output_path) in ("/dev/stdout", "-"):
                # MP4 isn't streamable, use matroska which is
                cmd = [
                    "ffmpeg", "-y", "-i", str(final_output),
                    "-c", "copy", "-f", "matroska", "pipe:1"
                ]
                subprocess.run(cmd, stdout=sys.stdout.buffer, stderr=subprocess.DEVNULL)
                return output_path
            else:
                shutil.copy(final_output, output_path)
                print(f"Copied to: {output_path}", file=sys.stderr)
                # Print path to stdout for piping
                print(output_path)
                return output_path
        else:
            out = recipe_dir / f"{plan['recipe_id']}-output.mp4"
            shutil.copy(final_output, out)
            print(f"Copied to: {out}", file=sys.stderr)
            # Print path to stdout for piping
            print(out)
            return out

    finally:
        print(f"Debug: temp files in {work_dir}", file=sys.stderr)


if __name__ == "__main__":
    import argparse

    parser = argparse.ArgumentParser(description="Execute a plan")
    parser.add_argument("plan", nargs="?", default="-", help="Plan file (- for stdin)")
    parser.add_argument("-o", "--output", type=Path, help="Output file")
    parser.add_argument("-d", "--dir", type=Path, default=Path("."), help="Recipe directory for resolving paths")
    parser.add_argument("-a", "--analysis", type=Path, help="Analysis file (.sexp)")

    args = parser.parse_args()

    plan_path = None if args.plan == "-" else Path(args.plan)
    if plan_path and not plan_path.exists():
        print(f"Plan not found: {plan_path}")
        sys.exit(1)

    # Load external analysis if provided
    external_analysis = None
    if args.analysis:
        if not args.analysis.exists():
            print(f"Analysis file not found: {args.analysis}")
            sys.exit(1)
        external_analysis = parse_analysis_sexp(args.analysis.read_text())

    execute_plan(plan_path, args.output, args.dir, external_analysis=external_analysis)