buzzer_2/firmware/fs/build_lfs_audio.py

#!/usr/bin/env python3
import argparse
import shutil
import subprocess
import tempfile
from pathlib import Path

import soundfile as sf
import yaml
from intelhex import IntelHex
from kokoro import KPipeline
from littlefs import LittleFS

# Default for --sample-rate; handed to ffmpeg as the output rate (-ar).
DEFAULT_SAMPLE_RATE = 16000
# Voice name passed to the Kokoro pipeline for every system prompt.
DEFAULT_VOICE = "af_bella"
# Defaults for --block-size / --block-count of the generated LittleFS image
# (4096 * 2048 = 8 MiB of image buffer).
DEFAULT_BLOCK_SIZE = 4096
DEFAULT_BLOCK_COUNT = 2048
# ffmpeg audio filters; export_raw_pcm() joins them with commas and passes the
# result as a single -af argument, so they are applied in this order.
DEFAULT_FILTERS = [
    "highpass=f=120",
    "lowpass=f=6000",
    "acompressor=threshold=-18dB:ratio=3:attack=5:release=80",
    "loudnorm=I=-16:TP=-1.0",
]

# Built-in system prompts, used when no --sys-yaml file is given.
# "id" becomes the output file name in the sys directory; "text" is the
# sentence that gets synthesized.
DEFAULT_SYS_PROMPTS = [
    {"id": "404", "text": "No sound sample was found on the device."},
    {"id": "update", "text": "Firmware updated. Awaiting confirmation."},
    {"id": "confirm", "text": "State confirmed."},
]


def run_ffmpeg(cmd: list[str]) -> None:
    """Run an external command (normally ffmpeg) and fail loudly on error.

    stdout is discarded. stderr is captured instead of being thrown away, so
    that when the command exits non-zero its diagnostics are echoed to this
    process's stderr and are also available on the raised exception as
    ``exc.stderr``.

    Args:
        cmd: Full argument vector, executable first. Run without a shell.

    Raises:
        subprocess.CalledProcessError: The command exited with a non-zero
            status.
        OSError: The executable could not be started (e.g. it is not
            installed).
    """
    import sys  # local import: only used on the failure path

    try:
        subprocess.run(
            cmd,
            check=True,
            stdout=subprocess.DEVNULL,
            stderr=subprocess.PIPE,
            text=True,
            errors="replace",  # never let odd bytes in tool output mask the real error
        )
    except subprocess.CalledProcessError as exc:
        if exc.stderr:
            sys.stderr.write(exc.stderr)
        raise


def export_raw_pcm(input_path: Path, output_path: Path, sample_rate: int, filters: list[str]) -> None:
    """Convert an audio file to headerless mono 16-bit little-endian PCM.

    The parent directory of ``output_path`` is created if needed and an
    existing output file is overwritten (``-y``).

    Args:
        input_path: Audio file that ffmpeg should read.
        output_path: Destination for the raw PCM data.
        sample_rate: Output sample rate, passed to ffmpeg via ``-ar``.
        filters: ffmpeg audio filters, applied in order. May be empty, in
            which case no ``-af`` option is passed at all.

    Raises:
        subprocess.CalledProcessError: ffmpeg exited with a non-zero status.
    """
    output_path.parent.mkdir(parents=True, exist_ok=True)

    cmd = ["ffmpeg", "-y", "-i", str(input_path)]
    if filters:
        # Only add -af when there is something to apply, so ffmpeg is never
        # handed an empty filtergraph string.
        cmd += ["-af", ",".join(filters)]
    cmd += [
        "-ar",
        str(sample_rate),
        "-ac",
        "1",
        "-f",
        "s16le",
        "-acodec",
        "pcm_s16le",
        str(output_path),
    ]
    run_ffmpeg(cmd)


def load_sys_prompts(yaml_path: Path | None) -> list[dict]:
    """Load the system prompts to synthesize.

    Two YAML layouts are accepted: a top-level list of ``{id, text}`` mappings,
    or a mapping whose ``assets`` key holds such a list. Entries that are not
    mappings, or that lack a non-empty ``id`` or ``text``, are skipped.

    Args:
        yaml_path: YAML file to read, or ``None`` to use the built-in defaults.

    Returns:
        A new list of ``{"id": str, "text": str}`` dicts. It may be empty when
        the YAML file contains no usable entries.
    """
    if yaml_path is None:
        # Hand out copies so callers cannot mutate the module-level defaults.
        return [dict(prompt) for prompt in DEFAULT_SYS_PROMPTS]

    with open(yaml_path, "r", encoding="utf-8") as f:
        data = yaml.safe_load(f) or []

    if isinstance(data, dict):
        # "assets:" with no value parses as None, hence the `or []`.
        items = data.get("assets") or []
    else:
        items = data
    if not isinstance(items, list):
        items = []

    prompts: list[dict] = []
    for item in items:
        if not isinstance(item, dict):
            continue
        asset_id, text = item.get("id"), item.get("text")
        if asset_id is None or text is None:
            continue
        # YAML turns unquoted scalars such as `id: 404` into ints; the id is
        # later used as a file name, so normalise both fields to str here.
        asset_id, text = str(asset_id), str(text)
        if asset_id and text:
            prompts.append({"id": asset_id, "text": text})

    return prompts


def build_sys_tts(prompts: list[dict], out_sys_dir: Path, sample_rate: int) -> int:
    """Synthesize every prompt with Kokoro and store it as raw PCM.

    Each prompt is rendered to a temporary WAV file, which is then converted
    by ``export_raw_pcm`` (using ``DEFAULT_FILTERS``) into
    ``out_sys_dir / <id>``.

    Args:
        prompts: Dicts with an ``"id"`` (output file name) and a ``"text"``
            (sentence to speak).
        out_sys_dir: Directory that receives one PCM file per prompt.
        sample_rate: Sample rate of the final PCM files.

    Returns:
        Number of prompts that were generated.

    Raises:
        RuntimeError: The TTS pipeline produced no audio for a prompt.
    """
    # Rate at which the pipeline output is written to the intermediate WAV
    # (Kokoro's documented output rate; ffmpeg resamples to `sample_rate`).
    tts_sample_rate = 24000

    pipeline = KPipeline(lang_code="a")
    generated = 0

    with tempfile.TemporaryDirectory(prefix="tts_tmp_") as tmp_dir_name:
        tmp_dir = Path(tmp_dir_name)

        for prompt in prompts:
            # ids may arrive as non-str (e.g. an unquoted YAML number).
            asset_id = str(prompt["id"])
            text = prompt["text"]

            tmp_wav = tmp_dir / f"{asset_id}.wav"
            chunks_written = 0
            # The pipeline is a generator and may yield more than one audio
            # chunk for a single text; append all of them so longer prompts
            # are not cut off after the first chunk.
            with sf.SoundFile(tmp_wav, mode="w", samplerate=tts_sample_rate, channels=1) as wav:
                for _, _, audio in pipeline(text, voice=DEFAULT_VOICE, speed=1.0):
                    if audio is None:  # defensive: skip results without audio
                        continue
                    wav.write(audio)
                    chunks_written += 1

            if chunks_written == 0:
                raise RuntimeError(f"TTS produced no audio for prompt {asset_id!r}")

            out_file = out_sys_dir / asset_id
            export_raw_pcm(tmp_wav, out_file, sample_rate=sample_rate, filters=DEFAULT_FILTERS)
            generated += 1

    return generated


def import_wavs_to_a(wav_dir: Path | None, out_a_dir: Path, sample_rate: int) -> int:
    if wav_dir is None:
        return 0
    if not wav_dir.exists() or not wav_dir.is_dir():
        raise FileNotFoundError(f"WAV directory not found: {wav_dir}")

    count = 0
    for wav_file in sorted(wav_dir.glob("*.wav")):
        out_file = out_a_dir / wav_file.stem
        export_raw_pcm(wav_file, out_file, sample_rate=sample_rate, filters=DEFAULT_FILTERS)
        count += 1

    return count


def add_files_recursive(fs: LittleFS, local_path: Path, lfs_path: str = "/") -> None:
    """Mirror a local directory tree into a LittleFS instance.

    Entries are visited in sorted order. Regular files are copied byte for
    byte, directories are created and descended into, and anything else is
    ignored. Nothing happens when ``local_path`` does not exist.

    Args:
        fs: Filesystem object to write into.
        local_path: Local directory whose contents are copied.
        lfs_path: Directory inside the filesystem that receives the contents.
    """
    if not local_path.exists():
        return

    parent = lfs_path.rstrip("/")
    for entry in sorted(local_path.iterdir()):
        # Join with a single slash; collapse a doubled one if lfs_path had it.
        destination = f"{parent}/{entry.name}".replace("//", "/")

        if entry.is_file():
            with open(entry, "rb") as src, fs.open(destination, "wb") as dst:
                dst.write(src.read())
            continue

        if entry.is_dir():
            fs.mkdir(destination)
            add_files_recursive(fs, entry, destination)


def build_littlefs_hex(source_folder: Path, output_hex: Path, block_size: int, block_count: int, start_addr: int) -> None:
    """Pack a directory into a LittleFS image and write it as Intel HEX.

    The contents of ``source_folder`` become the root of the filesystem. Only
    blocks that contain at least one byte other than 0xFF are emitted, each at
    ``start_addr`` plus its offset within the image. The parent directory of
    ``output_hex`` is created if it does not exist.

    Args:
        source_folder: Local directory whose contents fill the filesystem.
        output_hex: Path of the HEX file to write.
        block_size: LittleFS block size in bytes.
        block_count: Number of blocks in the image.
        start_addr: Address that the first byte of the image maps to.
    """
    fs = LittleFS(
        block_size=block_size,
        block_count=block_count,
        read_size=256,
        prog_size=256,
        lookahead_size=512,
        cache_size=4096,
    )

    add_files_recursive(fs, source_folder)

    ih = IntelHex()
    lfs_buffer = fs.context.buffer

    for idx in range(block_count):
        offset = idx * block_size
        block_data = bytes(lfs_buffer[offset : offset + block_size])
        # Skip blocks that are entirely 0xFF (presumably untouched/erased
        # flash). bytes.count() does the scan in C instead of looping over
        # every byte of the image in Python.
        if block_data.count(0xFF) != len(block_data):
            ih.frombytes(block_data, offset=start_addr + offset)

    # --output-hex may point into a directory that does not exist yet.
    output_hex.parent.mkdir(parents=True, exist_ok=True)
    ih.tofile(str(output_hex), format="hex")


def parse_args() -> argparse.Namespace:
    """Parse the command-line options of the build script.

    ``--start-addr`` accepts any integer literal understood by ``int(x, 0)``
    (for example ``0x12000000``). ``--output-hex`` defaults to
    ``lfs_external_flash.hex`` next to this file.

    Returns:
        The parsed arguments.
    """
    summary = (
        "Generate Bella-only TTS in /lfs/sys, optionally import WAVs into /lfs/a, "
        "then create LittleFS HEX."
    )
    default_hex = Path(__file__).resolve().parent / "lfs_external_flash.hex"

    cli = argparse.ArgumentParser(description=summary)
    add = cli.add_argument

    add("--wav-dir", default=None, help="Optional directory with WAV files for /lfs/a")
    add("--sys-yaml", default=None, help="Optional YAML with system prompts (id/text)")

    # Plain integer options that only differ in flag name and default.
    integer_options = (
        ("--sample-rate", DEFAULT_SAMPLE_RATE),
        ("--block-size", DEFAULT_BLOCK_SIZE),
        ("--block-count", DEFAULT_BLOCK_COUNT),
    )
    for flag, fallback in integer_options:
        add(flag, type=int, default=fallback)

    add("--start-addr", type=lambda raw: int(raw, 0), default=0x12000000)
    add("--output-hex", default=str(default_hex), help="Output path for generated HEX")
    add("--keep-staging", action="store_true", help="Keep temporary staging directory for inspection")

    return cli.parse_args()


def main() -> None:
    """Build the audio assets and the LittleFS HEX image.

    Steps: wipe and recreate the staging directory next to this file,
    synthesize the system prompts into ``lfs/sys``, convert optional WAV files
    into ``lfs/a``, then pack the staging directory into the output HEX file.
    The staging directory is removed afterwards, also when a step fails,
    unless ``--keep-staging`` was given.

    Raises:
        RuntimeError: No system prompts are available.
    """
    args = parse_args()

    fs_dir = Path(__file__).resolve().parent
    output_hex = Path(args.output_hex).resolve()
    wav_dir = Path(args.wav_dir).resolve() if args.wav_dir else None
    sys_yaml = Path(args.sys_yaml).resolve() if args.sys_yaml else None

    # Start from a clean slate in case an earlier run left files behind.
    staging_root = fs_dir / ".tmp_lfs_build"
    if staging_root.exists():
        shutil.rmtree(staging_root)

    try:
        out_sys = staging_root / "lfs" / "sys"
        out_a = staging_root / "lfs" / "a"
        out_sys.mkdir(parents=True, exist_ok=True)
        out_a.mkdir(parents=True, exist_ok=True)

        prompts = load_sys_prompts(sys_yaml)
        if not prompts:
            raise RuntimeError("No system prompts available. Provide --sys-yaml or use defaults.")

        tts_count = build_sys_tts(prompts, out_sys, args.sample_rate)
        wav_count = import_wavs_to_a(wav_dir, out_a, args.sample_rate)

        # NOTE(review): the image root is staging_root, so inside the
        # filesystem the files live under /lfs/sys and /lfs/a. Confirm this
        # matches the paths the firmware opens relative to its mount point.
        build_littlefs_hex(
            source_folder=staging_root,
            output_hex=output_hex,
            block_size=args.block_size,
            block_count=args.block_count,
            start_addr=args.start_addr,
        )

        print(f"Done. TTS assets: {tts_count}, WAV imports: {wav_count}, HEX: {output_hex}")
    finally:
        # Clean up on failure as well, so a broken run leaves nothing behind.
        if not args.keep_staging and staging_root.exists():
            shutil.rmtree(staging_root)


# Run the build only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()