#!/usr/bin/env python3 """ extract-palette.py — Build-time 5-color palette sidecar for photography. Walks content/photography/**/*.{jpg,jpeg,png} and writes a {photo}.palette.yaml sidecar alongside each image, containing five hex colors derived from the photograph via colorthief's k-means-like quantisation. The sidecar is consumed by photographyCtx in Hakyll and rendered as the thin
strip beneath each photo. Frontmatter `palette:` always wins. Authors can override the auto extraction for artistic reasons (e.g. exposing brand-aligned tones that aren't statistically dominant in the pixels). The sidecar is the fallback so authors don't need to write hex codes by hand. Staleness check: skips an image whose sidecar mtime > image mtime. Called by `make build` when .venv exists. Per-image failures are logged and the rest of the walk continues; the build never fails on a palette extraction error. """ from __future__ import annotations import argparse import sys from pathlib import Path from typing import Any import yaml from colorthief import ColorThief REPO_ROOT = Path(__file__).parent.parent CONTENT_DIR = REPO_ROOT / "content" / "photography" IMAGE_EXTS = {".jpg", ".jpeg", ".png"} # Number of swatches in the rendered strip. Five matches the existing # `photo-palette` CSS in static/css/photography.css, which sets # `display: flex; height: 0.75rem;` and divides the bar evenly. Bumping # this requires a CSS revisit — the bar reads as a unified strip up to # about 7 swatches; beyond that the bands become too narrow to perceive. N_SWATCHES = 5 # colorthief's quality knob: lower = better palette but slower. The # default of 10 is a reasonable trade-off; 1 is exhaustive. QUALITY = 10 def _hex(rgb: tuple[int, int, int]) -> str: return "#{:02x}{:02x}{:02x}".format(*rgb) def _sidecar_path(image: Path) -> Path: return image.with_suffix(image.suffix + ".palette.yaml") def _is_stale(image: Path, sidecar: Path) -> bool: if not sidecar.exists(): return True return image.stat().st_mtime > sidecar.stat().st_mtime def _atomic_write_yaml(path: Path, data: dict[str, Any]) -> None: tmp = path.with_suffix(path.suffix + ".tmp") with tmp.open("w", encoding="utf-8") as f: yaml.safe_dump(data, f, sort_keys=False, allow_unicode=True) tmp.replace(path) def _extract_palette(image: Path) -> list[str]: """Return up to N_SWATCHES hex colors, in colorthief's dominance order.""" ct = ColorThief(str(image)) palette = ct.get_palette(color_count=N_SWATCHES, quality=QUALITY) # colorthief sometimes returns one fewer entry than requested for # very low-color images; just take what we got. return [_hex(rgb) for rgb in palette[:N_SWATCHES]] def _process_one(image: Path, counters: dict[str, int]) -> None: """Extract a palette for one image, updating counters.""" if image.name.startswith(".") or image.name.endswith(".tmp"): return sidecar = _sidecar_path(image) if not _is_stale(image, sidecar): counters["skipped"] += 1 return try: palette = _extract_palette(image) except Exception as e: # noqa: BLE001 — keep walking print(f"extract-palette: {image}: {e}", file=sys.stderr) counters["failed"] += 1 return _atomic_write_yaml(sidecar, {"palette": palette}) counters["written"] += 1 def main() -> int: parser = argparse.ArgumentParser( description="Write 5-color palette sidecars for photography images.", ) parser.add_argument( "--file", type=Path, help="Process a single image instead of walking content/photography/. " "Used by tools/import-photo.sh to avoid a full re-walk per import.", ) args = parser.parse_args() counters = {"written": 0, "skipped": 0, "failed": 0} if args.file is not None: if not args.file.exists(): print(f"extract-palette: --file {args.file} does not exist", file=sys.stderr) return 1 if args.file.suffix.lower() not in IMAGE_EXTS: print( f"extract-palette: --file {args.file}: unsupported extension" f" (expected one of {sorted(IMAGE_EXTS)})", file=sys.stderr, ) return 1 _process_one(args.file, counters) else: if not CONTENT_DIR.exists(): print( f"extract-palette: {CONTENT_DIR} does not exist — skipping.", file=sys.stderr, ) return 0 for image in sorted(CONTENT_DIR.rglob("*")): if image.suffix.lower() not in IMAGE_EXTS: continue _process_one(image, counters) print( f"extract-palette: {counters['written']} written, " f"{counters['skipped']} skipped, {counters['failed']} failed", file=sys.stderr, ) return 0 if __name__ == "__main__": sys.exit(main())