@DMontgomery40
Created March 13, 2026 09:27
Frontend review loop skill bundle
interface:
  display_name: "Frontend Code Review"
  short_description: "Catch UI bugs, races, and weak frontend tests"
  default_prompt: "Use $frontend-code-review to review the frontend diff for concrete UI correctness issues, state or async races, interaction bugs, accessibility regressions, and fake or weak tests."

Browser And Runtime Proof

Netlify / Remote Truth Rule

If the repo contains netlify.toml and the changed behavior depends on Netlify Functions, redirects, auth/cookies, serverless env, deployed routing, or other platform wiring, localhost is not sufficient proof by default.

  • Require at least one deployed preview or production URL verification path when available.
  • Localhost remains acceptable for pure client-rendering, static UI, or isolated component checks that do not depend on Netlify runtime behavior.
  • If a deployed URL is required but not discoverable from the repo or environment, say that local verification is incomplete rather than over-claiming confidence.
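The rule above can be sketched as a small decision helper. This is a minimal TypeScript sketch, not part of the skill's tooling: `ChangeTraits` is a hypothetical summary of the diff supplied by the reviewer, and only the `netlify.toml` check mirrors real repo state.

```typescript
import * as fs from "node:fs";
import * as path from "node:path";

// Hypothetical summary of what the changed behavior depends on.
type ChangeTraits = {
  platformWiring: boolean; // functions, redirects, auth/cookies, serverless env, deployed routing
};

// Localhost is insufficient proof only when the repo is Netlify-backed AND the
// change touches platform wiring; pure client rendering stays local-verifiable.
function requiresDeployedProof(repoRoot: string, traits: ChangeTraits): boolean {
  const hasNetlify = fs.existsSync(path.join(repoRoot, "netlify.toml"));
  return hasNetlify && traits.platformWiring;
}
```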

Browser / Tool Surface Matrix

  • Repo Playwright CLI: default when the repo already has Playwright config or scripts and the goal is durable regression coverage that should live in the repo or CI.
  • Codex native Playwright MCP: default for quick reproduction, DOM inspection, screenshots, and one-off browser smoke checks during investigation.
  • Playwright via Codemode MCP / code execution: use when the browser flow needs programmable orchestration, loops, or combined automation across multiple tool surfaces.
  • Playwright CLI via Codemode: use when the repo's own Playwright command is still the source of truth, but execution is being orchestrated from a Codemode workflow.
  • macOS automation via Codemode: use only for OS-level gaps that Playwright cannot honestly cover, such as native file pickers, permission dialogs, downloads, app switching, or browser profile handling.
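The matrix above can be restated as a selection function. This is an illustrative sketch only: `FlowNeeds` is a hypothetical summary of the verification task, not a real API of any of the tools named.

```typescript
// Hypothetical flags describing what the browser flow needs.
type FlowNeeds = {
  osLevel: boolean;           // native dialogs, downloads, app switching
  programmable: boolean;      // loops or multi-tool orchestration
  durableRegression: boolean; // coverage that should live in repo/CI
};

// Most specialized need wins; quick one-off repro is the fallthrough default.
function pickBrowserSurface(needs: FlowNeeds): string {
  if (needs.osLevel) return "macOS automation via Codemode";
  if (needs.programmable) return "Playwright via Codemode MCP";
  if (needs.durableRegression) return "repo Playwright CLI";
  return "Codex native Playwright MCP";
}
```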

Verification Ordering

Use the lightest honest proof surface first:

  1. local smoke for quick reproduction or static UI validation
  2. repo-native regression command for durable coverage
  3. deployed preview or production verification when platform/runtime behavior matters

Do not sign off on a platform-bound UI or function bug with only component tests or localhost smoke if the real risk lives at the deployed edge.
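The ordering can be sketched as a fallthrough ladder. The flags here are assumptions about the change being reviewed, not values derived from any real tooling:

```typescript
// Build the proof ladder for a change: lightest honest surface first,
// heavier surfaces appended only when the change actually needs them.
function proofLadder(change: { staticUiOnly: boolean; hasRepoSuite: boolean; platformBound: boolean }): string[] {
  const steps = ["local smoke"];
  if (change.hasRepoSuite) steps.push("repo-native regression command");
  if (change.platformBound && !change.staticUiOnly) steps.push("deployed preview or production verification");
  return steps;
}
```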

Test Expansion And Verification

Generalized Test Requirement

When you fix a frontend bug you found during review, the default expectation is bug repro test + category test, not either/or.

  • Start with the nearest existing behavioral suite and extend it before creating a one-off new file.
  • Prefer broader coverage shapes such as invariant, matrix, state-transition, property, idempotency, contract, or multi-case interaction tests when they fit the stack.
  • If the repo is thin on tests, add the smallest honest test in the repo's existing stack rather than introducing a large new framework.
  • A narrow regression-only test is incomplete when the real failure was about sorting, filtering, pagination, loading state, retries, optimistic updates, cache invalidation, or keyboard and focus state.

Test Placement Heuristic

  • Extend existing shared suites first, especially list/table, form, state, routing, store, or query-behavior suites that already cover nearby interactions.
  • For React or Vite UI logic, prefer existing Vitest, Testing Library, or state/render suites first.
  • For browser flow regressions, prefer the repo's existing Playwright suite first.
  • For Streamlit or dev-tool state bugs, prefer pytest or the existing app-level harness first.
  • Avoid tests that only pin a selector, one literal string, or one callback fire when the real risk is sorting, pagination, retries, loading states, cache invalidation, or state transitions.
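As a contrast to selector-pinning, here is a sketch of the kind of behavior worth asserting across transitions. The pagination helper is hypothetical; the point is that its test should cover the clamping states, not one literal page number:

```typescript
// Hypothetical zero-based pagination helper under review.
function nextPage(current: number, pageCount: number): number {
  // Clamp to the last valid page; an empty result set stays on page 0.
  return Math.min(current + 1, Math.max(pageCount - 1, 0));
}
```

A weak test would assert only `nextPage(0, 3) === 1`; the state-transition shape also checks the last-page clamp and the empty-set case.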

Turn-End Verification Gate

For mutating review turns, broader test coverage and verification are part of completion.

  • Before ending the turn, run the narrowest changed-surface tests plus the repo's standard verify, build, or quality-gate command if one exists.
  • If the closest repo AGENTS.md or CLAUDE.md requires a full suite, obey the repo rule instead of this default.
  • Do not treat a fix as done if it only added a hyper-specific regression test where broader category coverage was realistically possible.
  • For review-only turns, still run the narrowest non-mutating validation that proves the finding when feasible.
  • If verification could not be completed, say exactly what was blocked and what remains unverified.
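The gate can be sketched as a lookup over `package.json` scripts. This mirrors the probe script's verify-key list below, but `npm` as the runner is an assumption, not a repo fact:

```typescript
// Derive turn-end commands from a package.json "scripts" map: the changed-surface
// test command first, then any standard verify/build/quality-gate scripts.
function turnEndGate(scripts: Record<string, string>): string[] {
  const gate: string[] = [];
  if (scripts["test"]) gate.push("npm test");
  for (const key of ["verify", "build", "lint", "check"]) {
    if (scripts[key]) gate.push(`npm run ${key}`);
  }
  return gate;
}
```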
#!/usr/bin/env python3
from __future__ import annotations

import argparse
import json
import subprocess
import sys
from pathlib import Path

TEST_HINTS = (
    ".test.",
    ".spec.",
    "_test.py",
    "test_",
)
VERIFY_SCRIPT_KEYS = ("verify", "build", "lint", "check")
TEST_SCRIPT_KEYS = ("test", "test:e2e", "test:unit", "test:ui", "test:fullstack", "test:mocked")


def run(cmd: list[str], cwd: Path) -> str:
    try:
        return subprocess.check_output(cmd, cwd=str(cwd), stderr=subprocess.DEVNULL, text=True).strip()
    except Exception:
        return ""


def git_root(path: Path) -> Path:
    root = run(["git", "rev-parse", "--show-toplevel"], path)
    return Path(root) if root else path


def load_package_json(path: Path) -> dict:
    try:
        return json.loads(path.read_text())
    except Exception:
        return {}


def tracked_tests(repo_root: Path) -> list[str]:
    output = run(["git", "ls-files"], repo_root)
    if not output:
        return []
    files = output.splitlines()
    return [f for f in files if any(hint in f for hint in TEST_HINTS) or "/tests/" in f or f.startswith("tests/")]


def gather_commands(pkg_path: Path, label: str) -> tuple[list[str], list[str]]:
    data = load_package_json(pkg_path)
    scripts = data.get("scripts", {})
    test_cmds = []
    verify_cmds = []
    for key, value in scripts.items():
        rendered = f"{label}: {key} -> {value}"
        if key in TEST_SCRIPT_KEYS or "test" in key:
            test_cmds.append(rendered)
        elif any(token in key for token in VERIFY_SCRIPT_KEYS):
            verify_cmds.append(rendered)
    return test_cmds, verify_cmds


def pyproject_markers(path: Path) -> list[str]:
    if not path.exists():
        return []
    text = path.read_text(errors="ignore")
    markers = []
    for token in ("pytest", "streamlit", "playwright", "vitest"):
        if token in text:
            markers.append(token)
    return markers


def main() -> int:
    parser = argparse.ArgumentParser(description="Inspect repo review/test surfaces quickly.")
    parser.add_argument("repo", nargs="?", default=".", help="Repo path to inspect")
    parser.add_argument("--json", action="store_true", help="Emit JSON instead of markdown")
    args = parser.parse_args()
    start = Path(args.repo).expanduser().resolve()
    repo_root = git_root(start)
    package_candidates = [
        repo_root / "package.json",
        repo_root / "frontend" / "package.json",
        repo_root / "web" / "package.json",
        repo_root / "apps" / "web" / "package.json",
    ]
    package_candidates = [p for p in package_candidates if p.exists()]
    test_commands: list[str] = []
    verify_commands: list[str] = []
    deps: set[str] = set()
    for pkg in package_candidates:
        label = str(pkg.relative_to(repo_root))
        data = load_package_json(pkg)
        deps.update(data.get("dependencies", {}).keys())
        deps.update(data.get("devDependencies", {}).keys())
        tests, verify = gather_commands(pkg, label)
        test_commands.extend(tests)
        verify_commands.extend(verify)
    pyproject = repo_root / "pyproject.toml"
    pytest_ini = repo_root / "pytest.ini"
    py_markers = pyproject_markers(pyproject)
    if pytest_ini.exists() and "pytest" not in py_markers:
        py_markers.append("pytest")
    has_netlify = (repo_root / "netlify.toml").exists() or (repo_root / "netlify" / "functions").exists()
    has_playwright = (
        any((repo_root / name).exists() for name in ("playwright.config.ts", "playwright.config.js", "playwright.config.mjs"))
        or "@playwright/test" in deps
        or "playwright" in py_markers
    )
    has_vitest = any((repo_root / name).exists() for name in ("vitest.config.ts", "vitest.config.js", "vitest.config.mjs")) or "vitest" in deps
    has_jest = any((repo_root / name).exists() for name in ("jest.config.ts", "jest.config.js", "jest.config.mjs")) or "jest" in deps
    has_pytest = "pytest" in py_markers
    has_streamlit = "streamlit" in py_markers
    tracked = tracked_tests(repo_root)
    detected_surfaces = []
    if has_playwright:
        detected_surfaces.append("playwright")
    if has_vitest:
        detected_surfaces.append("vitest")
    if has_jest:
        detected_surfaces.append("jest")
    if has_pytest:
        detected_surfaces.append("pytest")
    if has_streamlit:
        detected_surfaces.append("streamlit")
    notes = []
    if has_netlify:
        notes.append("Netlify markers detected; deployed preview/prod proof may be required for functions, redirects, auth, or cookie behavior.")
    if has_playwright:
        notes.append("Repo Playwright CLI is available for durable browser regression coverage.")
    if not tracked:
        notes.append("Little or no tracked test coverage detected; prefer the thinnest honest addition in the repo's existing stack.")
    if not detected_surfaces:
        notes.append("No obvious automated test harness detected from common manifests/configs.")
    result = {
        "repo_root": str(repo_root),
        "has_netlify": has_netlify,
        "detected_test_surfaces": detected_surfaces,
        "test_commands": test_commands,
        "verify_commands": verify_commands,
        "tracked_test_file_count": len(tracked),
        "tracked_test_examples": tracked[:12],
        "notes": notes,
    }
    if args.json:
        print(json.dumps(result, indent=2))
        return 0
    print(f"Repo root: {result['repo_root']}")
    print(f"Netlify: {'yes' if has_netlify else 'no'}")
    print(f"Detected test surfaces: {', '.join(detected_surfaces) if detected_surfaces else 'none-obvious'}")
    print(f"Tracked test files: {len(tracked)}")
    if tracked:
        print("Tracked test examples:")
        for item in tracked[:12]:
            print(f"- {item}")
    if test_commands:
        print("Test commands:")
        for item in test_commands:
            print(f"- {item}")
    if verify_commands:
        print("Verify/build commands:")
        for item in verify_commands:
            print(f"- {item}")
    if notes:
        print("Notes:")
        for item in notes:
            print(f"- {item}")
    return 0


if __name__ == "__main__":
    sys.exit(main())
#!/usr/bin/env bash
set -euo pipefail

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
SKILL_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
SKILL_NAME="$(basename "$SKILL_DIR")"
CODEX_DIR="${CODEX_SKILL_DIR:-$HOME/.codex/skills/$SKILL_NAME}"
CLAUDE_DIR="${CLAUDE_SKILL_DIR:-$HOME/.claude/skills/$SKILL_NAME}"

usage() {
  cat <<EOF
Sync shared review skill files between Codex and Claude skill folders.

Usage:
  sync_codex_claude.sh [auto|codex-to-claude|claude-to-codex|status]

Environment overrides:
  CODEX_SKILL_DIR   default: ~/.codex/skills/$SKILL_NAME
  CLAUDE_SKILL_DIR  default: ~/.claude/skills/$SKILL_NAME
EOF
}

mtime() {
  local path="$1"
  if stat -f "%m" "$path" >/dev/null 2>&1; then
    stat -f "%m" "$path"  # BSD/macOS stat
  else
    stat -c "%Y" "$path"  # GNU stat
  fi
}

latest_mtime() {
  local dir="$1"
  local latest=0
  while IFS= read -r -d '' file; do
    local file_mtime
    file_mtime="$(mtime "$file")"
    if (( file_mtime > latest )); then
      latest="$file_mtime"
    fi
  done < <(find "$dir" -type f ! -path "*/agents/*" ! -name ".DS_Store" -print0)
  echo "$latest"
}

sync_one_way() {
  local src="$1"
  local dst="$2"
  mkdir -p "$dst"
  rsync -a --exclude "agents/" --exclude ".DS_Store" "$src/" "$dst/"
}

mode="${1:-auto}"
case "$mode" in
  auto|codex-to-claude|claude-to-codex|status) ;;
  -h|--help|help)
    usage
    exit 0
    ;;
  *)
    usage >&2
    exit 1
    ;;
esac

mkdir -p "$CODEX_DIR" "$CLAUDE_DIR"
codex_latest="$(latest_mtime "$CODEX_DIR")"
claude_latest="$(latest_mtime "$CLAUDE_DIR")"

if [[ "$mode" == "status" ]]; then
  echo "Codex latest mtime: $codex_latest"
  echo "Claude latest mtime: $claude_latest"
  if (( codex_latest == claude_latest )); then
    echo "Status: likely in sync"
  elif (( codex_latest > claude_latest )); then
    echo "Status: Codex appears newer"
  else
    echo "Status: Claude appears newer"
  fi
  exit 0
fi

if [[ "$mode" == "auto" ]]; then
  if (( codex_latest == claude_latest )); then
    echo "No sync needed: mtimes match."
    exit 0
  elif (( codex_latest > claude_latest )); then
    mode="codex-to-claude"
  else
    mode="claude-to-codex"
  fi
fi

if [[ "$mode" == "codex-to-claude" ]]; then
  sync_one_way "$CODEX_DIR" "$CLAUDE_DIR"
  echo "Synced Codex -> Claude for $SKILL_NAME"
else
  sync_one_way "$CLAUDE_DIR" "$CODEX_DIR"
  echo "Synced Claude -> Codex for $SKILL_NAME"
fi
---
name: frontend-code-review
description: Use when the user wants a frontend-focused, bug-first review of UI code or tests, especially in TypeScript or JavaScript React and Vite apps, with light Streamlit coverage. Focus on concrete correctness issues in rendering, state, interactions, async flows, accessibility, visual behavior, and fake or weak frontend tests.
---

Frontend Code Review

When To Use

Use this skill when the user asks for any of these:

  • a frontend-specific or UI-focused code review
  • a deep review of React, TypeScript, JavaScript, or Vite client code
  • a bug hunt in components, hooks, stores, routes, forms, tables, or interaction flows
  • a review of frontend tests for fake coverage, broken async assertions, or weak browser realism
  • a review of Streamlit UI code used for internal tools or dev dashboards

Do not use this for visual polish alone, backend-only review, or generic architecture discussion.

Outcome

Produce a findings-first review of user-visible correctness, state flow, and interaction behavior.

If you fix findings in-turn, leave behind honest verification and broader coverage for the bug family rather than a single selector-level regression.

Review Target

Default to the most relevant bounded change surface first:

  1. active PR diff, if one exists
  2. current branch diff against the remote default branch
  3. current worktree changes
  4. repo-wide review only when the user explicitly asks for that, or when the changed diff is too small to explain the real UI risk

If the diff is tiny but touches a shared component, hook, store, query layer, router boundary, or table/form primitive used widely across the app, widen the review to that subsystem and its adjacent tests. State that assumption.

Workflow

  1. Inspect the review surface before reading code. Check branch, base branch, diff stats, changed files, route boundaries, shared components, hooks, stores, tests, and browser automation coverage. If the repo shape is unclear, run scripts/review_surface_probe.py <repo-root> first.

  2. Read the highest-risk user flows first. Prioritize tables and lists, sorting and filtering, forms, buttons, dialogs, navigation, auth-gated UI, optimistic updates, file uploads, drag-and-drop, and loading or error states.

  3. Trace the data lifecycle end to end. Follow data from input or URL state to fetch, transform, cache, render, user action, mutation, invalidation, refetch, and visible UI outcome.

  4. Keep going past 3 findings. Continue reviewing until additional passes stop producing concrete new bugs or regressions.

  5. Confirm findings from code and honest runtime behavior. Prefer bugs you can trace through the implementation and realistic UI proof.

  6. Review the tests as part of the implementation. Missing coverage is a finding when a risky interaction, async boundary, or error state is untested.

  7. If you fix a finding in-turn, leave broader behavior coverage behind. The default is bug repro test + category test, extending the nearest shared suite first.

  8. Run turn-end verification before you stop. Use the narrowest changed-surface tests plus the repo's standard verify/build gate when one exists.

What To Look For

  • lists and tables that sort, filter, search, paginate, or populate incorrectly
  • buttons and forms that double-submit, stay disabled, lose state, or report false success
  • stale closures, missing cleanup, or out-of-order async updates
  • optimistic UI or cache invalidation paths that leave visible state wrong
  • loading, error, empty, permission, or offline states that the UI handles badly
  • keyboard, focus, or accessibility regressions that break the main flow
  • browser or layout regressions that only show up in real interaction
  • tests that pass while the real UI is broken because they assert implementation trivia
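The out-of-order async item above is worth a concrete sketch. This is an illustrative pattern, not code from any reviewed app: without the request-id guard, a slow earlier response overwrites a newer one and the list shows stale results.

```typescript
// Search store guarding against out-of-order responses. "makeSearch" and its
// shape are hypothetical; only the guard pattern itself is the point.
function makeSearch(fetcher: (q: string) => Promise<string[]>) {
  let latest = 0;
  let results: string[] = [];
  return {
    async search(q: string): Promise<void> {
      const id = ++latest;
      const rows = await fetcher(q);
      if (id === latest) {
        results = rows; // only the newest in-flight request may land
      }
    },
    get results(): string[] {
      return results;
    },
  };
}
```

Deleting the `id === latest` check is exactly the bug class a weak selector-pinning test will miss, because any single-request test still passes.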

Output Format

Findings first, ordered by severity.

For each finding:

  • start with a severity tag like [P1]
  • name the concrete user-visible problem
  • explain the trigger, impact, and why it happens
  • cite exact file and line references

After findings, include:

  • any fake or weak frontend tests you fixed immediately, with a short note on what changed
  • brief open questions or assumptions
  • a short note on residual risks or UI paths you were unable to verify

If there are no findings, say "No findings." explicitly, then mention any residual risk areas you were unable to exercise.

Severity

  • P1: likely to break a core user workflow, hide or corrupt visible state, create a serious accessibility or security issue, or invalidate a critical frontend feature
  • P2: important correctness, async, interaction, layout, or browser-behavior problem with a realistic failure mode
  • P3: lower-severity correctness issue, sharp edge, or meaningful test gap

References

Load these when needed:

  • references/test-expansion-and-verification.md: use for generalized frontend coverage, suite placement, and turn-end verification expectations.
  • references/browser-and-runtime-proof.md: use when Netlify-backed behavior, deployed truth, browser selection, or macOS automation choices matter.

Operating Rules

  • Prefer concrete UI bugs, regressions, and missing behavior coverage over style commentary.
  • Do not pad the review with weak or duplicate findings just to make it longer.
  • Do not hide additional findings because an internal tool would have stopped at 3.
  • For fake or checkbox tests, prefer fixing them in the same turn over merely filing them as findings.
  • Repo-local instructions override this skill when they are stricter.