#!/usr/bin/env python3 """Two-checkerboard camera-room calibration for WiFi pose training (ADR-152 S2.1.3). Aligns the ADR-079 ground-truth camera and the ESP32 WiFi transceivers in one shared 3D room frame -- the PerceptAlign (arXiv 2601.12252) defense against "coordinate overfitting", where CSI-to-camera-coordinate regression memorizes the deployment layout and collapses cross-layout. Procedure (<5 minutes): 1. Print a checkerboard (default 9x6 inner corners, 25 mm squares). 2. Tape one board flat on the ORIGIN WALL, tape-measure its top-left inner corner position in room coordinates (+x along wall, +y into room, +z up). 3. Lay the second board flat on the FLOOR, measure its near-left inner corner. 4. With the collection camera in its final position, photograph each board. 5. Run this script; tape-measure each ESP32 node position when prompted (or pass --geometry nodes.json). Output: a calibration bundle JSON consumed by scripts/collect-ground-truth.py --calibration Usage: python scripts/calibrate-camera-room.py \\ --wall-image photos/wall.jpg --wall-origin 0.50,0.0,1.60 \\ --floor-image photos/floor.jpg --floor-origin 1.00,1.00,0.0 \\ --calib-images "photos/intrinsics/*.jpg" \\ --geometry config/transceivers.json \\ --output data/calibration/camera-room.json """ from __future__ import annotations import argparse import glob import json import sys from datetime import datetime from pathlib import Path import cv2 import numpy as np sys.path.insert(0, str(Path(__file__).resolve().parent)) import calibration_lib as cal # noqa: E402 INTRINSICS_CACHE = Path("data") / ".cache" / "camera_intrinsics.json" def parse_vec3(text: str) -> np.ndarray: parts = [float(p) for p in text.replace(",", " ").split()] if len(parts) != 3: raise argparse.ArgumentTypeError(f"Expected 3 comma-separated numbers, got {text!r}") return np.array(parts, dtype=np.float64) def detect_corners(image_path: Path, cols: int, rows: int) -> tuple[np.ndarray, tuple[int, int]]: image = cv2.imread(str(image_path)) if image is None: print(f"ERROR: Cannot read image {image_path}", file=sys.stderr) sys.exit(1) corners = cal.find_board_corners(image, cols, rows) if corners is None: print( f"ERROR: No {cols}x{rows} checkerboard found in {image_path}. " "Check lighting, focus, and the --board-cols/--board-rows flags.", file=sys.stderr, ) sys.exit(1) h, w = image.shape[:2] return corners, (w, h) def resolve_intrinsics(args, repo_root: Path, board_args: tuple[int, int, float]) -> dict: """Pre-computed file > cached > computed from --calib-images > last-resort 2-view estimate from the wall+floor photos themselves.""" cols, rows, square_m = board_args if args.intrinsics: print(f"Intrinsics: loading {args.intrinsics}") return cal.load_intrinsics(Path(args.intrinsics)) cache_path = repo_root / INTRINSICS_CACHE if cache_path.exists() and not args.recalibrate_intrinsics: print(f"Intrinsics: using cached {cache_path} (pass --recalibrate-intrinsics to redo)") intr = cal.load_intrinsics(cache_path) intr["source"] = "cached" return intr if args.calib_images: paths = sorted(glob.glob(args.calib_images)) if len(paths) < 3: print( f"ERROR: --calib-images matched only {len(paths)} file(s); " "need >= 3 checkerboard views for stable intrinsics.", file=sys.stderr, ) sys.exit(1) corner_sets, image_size = [], None for p in paths: corners, size = detect_corners(Path(p), cols, rows) if image_size is None: image_size = size elif size != image_size: print(f"ERROR: {p} has size {size}, expected {image_size}.", file=sys.stderr) sys.exit(1) corner_sets.append(corners) print(f" corners found: {p}") intr = cal.compute_intrinsics(corner_sets, image_size, cols, rows, square_m) print(f"Intrinsics: computed from {len(paths)} views, " f"reprojection RMS {intr['reprojection_error_px']:.3f} px") cal.save_bundle(intr, cache_path) # plain JSON write; reused on next run print(f" cached to {cache_path}") return intr # Last resort: 2-view calibration from the extrinsic photos. Workable but # weak -- warn loudly and recommend a proper multi-view pass. print( "WARNING: no --intrinsics / cache / --calib-images; estimating intrinsics " "from the wall+floor photos alone (2 views, low quality). Prefer " "--calib-images with 5-10 varied board views.", file=sys.stderr, ) corner_sets, image_size = [], None for p in (args.wall_image, args.floor_image): corners, size = detect_corners(Path(p), cols, rows) image_size = image_size or size corner_sets.append(corners) intr = cal.compute_intrinsics(corner_sets, image_size, cols, rows, square_m) intr["source"] = "two-view-fallback" return intr def prompt_transceiver_geometry() -> dict: """Tape-measure entry of ESP32 node positions in room coordinates.""" print() print("Transceiver geometry -- enter one node per line:") print(" [yaw_deg] (meters, room frame; blank line to finish)") print(" example: esp32-s3-a 0.10 2.40 1.10 180") nodes = [] while True: try: line = input("node> ").strip() except EOFError: break if not line: break parts = line.split() if len(parts) not in (4, 5): print(" expected: [yaw_deg]", file=sys.stderr) continue try: node = {"id": parts[0], "position_m": [float(parts[1]), float(parts[2]), float(parts[3])]} if len(parts) == 5: node["antenna_yaw_deg"] = float(parts[4]) except ValueError: print(" positions must be numeric", file=sys.stderr) continue nodes.append(node) if not nodes: print("WARNING: no transceiver nodes entered; bundle will carry empty geometry.", file=sys.stderr) return {"nodes": nodes, "units": "meters", "source": "tape-measure-prompt"} def load_geometry_file(path: Path) -> dict: with open(path, "r", encoding="utf-8") as f: data = json.load(f) nodes = data.get("nodes", data if isinstance(data, list) else None) if nodes is None: raise ValueError(f"{path}: expected {{'nodes': [...]}} or a top-level list") for node in nodes: if "id" not in node or "position_m" not in node: raise ValueError(f"{path}: each node needs 'id' and 'position_m' [x,y,z]") return {"nodes": nodes, "units": "meters", "source": "file"} def main(): parser = argparse.ArgumentParser( description="Two-checkerboard camera-room calibration (ADR-152 S2.1.3 / ADR-079)." ) parser.add_argument("--wall-image", required=True, help="Photo of the checkerboard on the origin wall") parser.add_argument("--floor-image", required=True, help="Photo of the checkerboard on the floor (camera NOT moved)") parser.add_argument("--wall-origin", type=parse_vec3, default="0.5,0.0,1.6", help="Room xyz (m) of the wall board's first inner corner " "(default: 0.5,0.0,1.6)") parser.add_argument("--floor-origin", type=parse_vec3, default="1.0,1.0,0.0", help="Room xyz (m) of the floor board's first inner corner " "(default: 1.0,1.0,0.0)") parser.add_argument("--wall-axes", default="+x,-z", help="Wall board column,row directions in room frame (default: +x,-z)") parser.add_argument("--floor-axes", default="+x,+y", help="Floor board column,row directions in room frame (default: +x,+y)") parser.add_argument("--board-cols", type=int, default=cal.DEFAULT_BOARD_COLS, help=f"Inner corners per row (default: {cal.DEFAULT_BOARD_COLS})") parser.add_argument("--board-rows", type=int, default=cal.DEFAULT_BOARD_ROWS, help=f"Inner corners per column (default: {cal.DEFAULT_BOARD_ROWS})") parser.add_argument("--square-size-mm", type=float, default=cal.DEFAULT_SQUARE_SIZE_MM, help=f"Checkerboard square size in mm (default: {cal.DEFAULT_SQUARE_SIZE_MM})") parser.add_argument("--intrinsics", help="Pre-computed intrinsics JSON (skips computation)") parser.add_argument("--calib-images", help="Glob of >=3 checkerboard photos for intrinsics computation") parser.add_argument("--recalibrate-intrinsics", action="store_true", help="Ignore the cached intrinsics and recompute") parser.add_argument("--geometry", help="Transceiver geometry JSON ({nodes:[{id,position_m,[antenna_yaw_deg]}]}); " "omit to be prompted for tape-measure entry") parser.add_argument("--output", default=None, help="Bundle output path (default: data/calibration/camera-room-.json)") args = parser.parse_args() if isinstance(args.wall_origin, str): args.wall_origin = parse_vec3(args.wall_origin) if isinstance(args.floor_origin, str): args.floor_origin = parse_vec3(args.floor_origin) repo_root = Path(__file__).resolve().parent.parent cols, rows = args.board_cols, args.board_rows square_m = args.square_size_mm / 1000.0 # --- Intrinsics --- intrinsics = resolve_intrinsics(args, repo_root, (cols, rows, square_m)) camera_matrix = np.asarray(intrinsics["camera_matrix"], dtype=np.float64) dist_coeffs = np.asarray(intrinsics["dist_coeffs"], dtype=np.float64) # --- Corner detection on the two placed boards --- wall_corners, wall_size = detect_corners(Path(args.wall_image), cols, rows) floor_corners, floor_size = detect_corners(Path(args.floor_image), cols, rows) if wall_size != floor_size: print(f"ERROR: wall image {wall_size} and floor image {floor_size} differ in size; " "both must come from the fixed collection camera.", file=sys.stderr) sys.exit(1) print(f"Corners detected: wall + floor boards ({cols}x{rows}, {args.square_size_mm} mm)") # Re-scale intrinsics if they were computed at a different resolution # than the extrinsic photos (the bundle always stores K at wall_size). intr_size = tuple(intrinsics["image_size"]) if intr_size != wall_size: sx, sy = wall_size[0] / intr_size[0], wall_size[1] / intr_size[1] camera_matrix[0, 0] *= sx camera_matrix[0, 2] *= sx camera_matrix[1, 1] *= sy camera_matrix[1, 2] *= sy print(f" intrinsics scaled {intr_size} -> {wall_size}") intrinsics = {**intrinsics, "camera_matrix": camera_matrix.tolist(), "image_size": list(wall_size)} # --- Room-frame corner positions from the measured placements --- wall_u, wall_v = (cal.parse_axis(t) for t in args.wall_axes.split(",")) floor_u, floor_v = (cal.parse_axis(t) for t in args.floor_axes.split(",")) wall_room = cal.board_room_points(cols, rows, square_m, args.wall_origin, wall_u, wall_v) floor_room = cal.board_room_points(cols, rows, square_m, args.floor_origin, floor_u, floor_v) # --- Extrinsics: joint two-board solve (resolves per-board corner-order # ambiguity -- a single planar board is centrosymmetric; the pair is not) --- extrinsics = cal.solve_two_board_extrinsics( wall_room, wall_corners, floor_room, floor_corners, camera_matrix, dist_coeffs ) wall_rmse = extrinsics["per_board"]["wall"]["rmse_px"] floor_rmse = extrinsics["per_board"]["floor"]["rmse_px"] print(f" joint solve: RMSE {extrinsics['rmse_px']:.3f} px " f"(wall {wall_rmse:.3f} / floor {floor_rmse:.3f})") print(f" camera at room {np.round(extrinsics['translation_m'], 3).tolist()} m") if max(wall_rmse, floor_rmse) > 3.0: print( "WARNING: high per-board reprojection error -- re-check the measured " "board origins/axes and that the camera did not move between photos.", file=sys.stderr, ) # --- Transceiver geometry --- if args.geometry: geometry = load_geometry_file(Path(args.geometry)) print(f"Transceiver geometry: {len(geometry['nodes'])} node(s) from {args.geometry}") else: geometry = prompt_transceiver_geometry() # --- Bundle --- bundle = cal.make_bundle( camera_intrinsics=intrinsics, camera_to_room_extrinsics=extrinsics, checkerboard_spec={"cols": cols, "rows": rows, "square_size_mm": args.square_size_mm}, transceiver_geometry=geometry, ) if args.output: out_path = Path(args.output) else: ts = datetime.now().strftime("%Y%m%d_%H%M%S") out_path = repo_root / "data" / "calibration" / f"camera-room-{ts}.json" cal.save_bundle(bundle, out_path) print() print("=== Calibration bundle written ===") print(f" path: {out_path}") print(f" calibration_id: {cal.calibration_id(bundle)}") print(f" next: python scripts/collect-ground-truth.py --calibration {out_path}") if __name__ == "__main__": main()