Priority aging in xenia-cpu/scheduler.rs:pick_runnable
(effective_priority = base + age_bonus(now_round - last_run_round),
capped at +31, AGING_ROUNDS_PER_BONUS=1). Strict-priority scheduling was
parking priority=0 threads behind the CPU-bound priority=15 audio mixer
(sub_824D1328 guest spinwait at PC=0x824d1404 on CPU5). Aging
eventually picks the starved thread, breaking the producer-consumer
cycle that has caused the 5-tid wedge at PC=0x824ac578 since AUDIT-049 (10 May).
Cascade observed: tid=13 clean exit; events 121K -> 13M (107x); last
host_ns 767ms -> 51,011ms (66x); 8 new threads spawn; VdSwap 1 -> 2.
Complete two-day iterate sequence (2026-05-27 -> 2026-05-28):
- 2.F: VdSwap drain timeout 900ms -> 1ms (xenia-gpu/handle.rs); 876x
perf win on VdSwap kernel callback
- 2.H: vA0000000 physical heap bucket added (state.rs, exports.rs);
ctx_ptrs now in 0xA0000000-0xBFFFFFFF range matching canary
- 2.L: Phase-A diff harness categorized [return_value mismatch],
[status mismatch], [args_resolved.path mismatch] tags
(tools/diff-events/diff_events.py); closes reading-error #41
(silent test-harness state leak invalidating trace diffs)
- 2.M: always-on exit-thread-state.json sibling to Phase-A JSONL
(event_log.rs + xenia-app/main.rs); closes reading-error #42
(Phase-A blind to blocked-forever waits)
- 2.Q: signal.match kernel instrumentation in NtSetEvent /
NtReleaseSemaphore / KeSetEvent / KeReleaseSemaphore
(exports.rs); emits target_handle + waiter_count + waiter_tids
- 2.T: wake.requested kernel instrumentation in wake_eligible_waiters
(exports.rs); emits target_tid + transition + new_state
- 2.V: scheduler priority aging (xenia-cpu/scheduler.rs) [keystone]
Plus accumulated WIP from earlier May (contention_manifest,
phase_b_snapshot, xam/xaudio enhancements, analysis db, xex loader,
xenia-app main loop, etc.). Audit-runs/ artifacts remain untracked
per project convention.
Tests: 300 xenia-cpu / 227 xenia-kernel / 5 xenia-app / 19 xenia-path
/ 30+ smaller suites -- all PASS, 0 regressions. Determinism preserved
(2x cold runs bit-identical at 13,003,881 events post-2.V).
Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
546 lines
21 KiB
Python
546 lines
21 KiB
Python
#!/usr/bin/env python3
|
||
"""Phase B state-snapshot diff tool.
|
||
|
||
Reads two snapshot directories (one per engine, `<dir>/canary/` and
|
||
`<dir>/ours/`) emitted by `phase_b_snapshot` at the moment immediately
|
||
before the first guest PPC instruction of the XEX entry_point. Produces
|
||
a markdown report (`report.md`) plus a machine-readable JSON sibling
|
||
(`report.json`) classifying every observable divergence.
|
||
|
||
Field-comparison rules + classification table:
|
||
audit-runs/phase-b-state-equivalence/README.md
|
||
Both engines' emitter source + this tool read the same rules.
|
||
|
||
Usage:
|
||
diff_state.py --canary <dir>/canary --ours <dir>/ours [--out report.md] [--xex-json <xex.json>]
|
||
diff_state.py --canary <a> --ours <b> --validate-identical
|
||
|
||
Exit codes:
|
||
0 — no divergence (or `--validate-identical` succeeded)
|
||
1 — divergences found
|
||
2 — STOP triggered (image_loaded_sha256 / xex_entry_point / iso_sha256
|
||
mismatch — interpretation of downstream files is not valid)
|
||
"""
|
||
|
||
from __future__ import annotations

import argparse
import hashlib
import json
import re
import sys
from pathlib import Path
from typing import Any
|
||
|
||
# Value emitted under the "schema_version" key of report.json.
SCHEMA_VERSION = 1

# ---------- field-comparison rules (declared up front) ----------

# Top-level keys that are never compared, whatever the snapshot file.
SKIP_TOP_FIELDS = {"deterministic_skip", "engine", "schema_version"}

# Additional skips, per snapshot file. An entry is a dotted, JSON-pointer-like
# path ("a.b.c"); it is matched against top-level keys as well as against
# fields of array-of-object members (those keyed by `handle_semantic_id`
# and similar).
SKIP_BY_FILE: dict[str, set[str]] = {
    "cpu_state.json": {"hw_id"},
    "memory.json": set(),
    "kernel.json": {"exports_registered_count", "raw_handle_id"},
    "vfs.json": set(),
    "config.json": {
        "cvars.phase_b_snapshot_dir",
        "cli_argv",
        "wall_clock_iso8601",
        "host_ns_at_snapshot",
        "iso_path",
        "build_id",
    },
}
|
||
|
||
# Arrays named here are unordered collections: their members are paired up by
# the given key instead of by position. Every other array (`regions`,
# `probes`, `gpr`, ...) is a sequence and is compared index by index.
SET_FIELDS: dict[str, dict[str, str]] = {
    # snapshot file -> {array field: member key used to pair entries}
    "kernel.json": {"objects": "handle_semantic_id", "handle_name_table": "name"},
    "vfs.json": {"cache_root_listing": "relpath"},
    "memory.json": {"heaps": "base"},
}
|
||
|
||
# (file, path) pairs whose mismatch is classified as a δ-content STOP.
# `image_loaded_sha256` is deliberately absent: the raw hash differs whenever
# the two engines patch imports differently, so it is only reported. The
# semantic STOP key for the image is `image_canonical_sha256`, which
# check_invariants() derives from image.bin + xex.json.
STOP_FIELDS = {
    ("config.json", "iso_sha256"),
    ("config.json", "xex_entry_point"),
}
|
||
|
||
|
||
# ---------- divergence record ----------
|
||
|
||
class Divergence:
    """A single difference found between the canary and ours snapshots.

    Attributes mirror the constructor arguments: the snapshot `file`, the
    dotted `path` inside it, the divergence `kind`, the two observed values
    (`canary`, `ours`) and the classification label `klass`.
    """

    __slots__ = ("file", "path", "kind", "canary", "ours", "klass")

    def __init__(self, file: str, path: str, kind: str, canary: Any, ours: Any, klass: str):
        self.file, self.path, self.kind = file, path, kind
        self.canary, self.ours = canary, ours
        self.klass = klass

    def to_dict(self) -> dict:
        """Return the record as a plain dict; `klass` is exported as "class"."""
        record = {
            name: getattr(self, name)
            for name in ("file", "path", "kind", "canary", "ours")
        }
        record["class"] = self.klass
        return record
|
||
|
||
|
||
# ---------- classification ----------
|
||
|
||
def classify(file: str, path: str, kind: str, canary: Any, ours: Any) -> str:
    """Map one divergence to its class label.

    Rules are evaluated top to bottom and the first match wins; anything
    that matches no rule is "gamma-kernel-content".

    Args:
        file: Snapshot file name the divergence was found in.
        path: Dotted path of the diverging field. Array members appear with
            a concrete selector, e.g. ``heaps[base=4096].name`` or
            ``gpr[3]``.
        kind: Divergence kind produced by the walker.
        canary: Canary-side value (accepted for interface symmetry; not
            consulted by any rule).
        ours: Ours-side value (likewise not consulted).

    Returns:
        The class label string.
    """
    if (file, path) in STOP_FIELDS:
        return "delta-content-STOP"
    if kind in ("set-size-mismatch", "missing-field", "extra-field", "seq-length"):
        return "sigma-structural"
    if path.endswith((".sha256", "_sha256")):
        return "delta-content"
    if path.startswith("objects[") and ".details." in path:
        return "gamma-kernel-content"
    if file == "vfs.json" and path.startswith("cache_root_listing"):
        return "kappa-cache"
    # The heap rule is written against the selector-free form ("heaps[]"),
    # but incoming paths carry a concrete selector ("heaps[base=...]"), so
    # the selector has to be blanked before comparing. Without this the rule
    # can never match.
    generic_path = re.sub(r"\[[^\]]*\]", "[]", path)
    if generic_path in ("heaps[].base", "heaps[].name"):
        return "epsilon-host-allocator"
    if path in ("host_ns_at_snapshot", "wall_clock_iso8601"):
        return "tau-host-timing"
    return "gamma-kernel-content"
|
||
|
||
|
||
# ---------- generic walker ----------
|
||
|
||
def collect_skip_set(file: str, doc: dict) -> set[str]:
    """Build the set of field paths to ignore for one snapshot document.

    Combines the global top-level skips, the per-file skips for `file`, and
    any string entries the document itself lists under "deterministic_skip"
    (non-list values and non-string entries are ignored). A fresh set is
    returned; the module-level tables are not modified.
    """
    skipped = SKIP_TOP_FIELDS | SKIP_BY_FILE.get(file, set())
    declared = doc.get("deterministic_skip")
    if isinstance(declared, list):
        skipped.update(entry for entry in declared if isinstance(entry, str))
    return skipped
|
||
|
||
|
||
def is_skipped(file: str, path: str, skip: set[str]) -> bool:
    """Return True when `path` is covered by an entry of `skip`.

    A path is skipped if any of these is in `skip`:
      * the path exactly as given;
      * the path with every array selector blanked, so the rule
        "objects[].raw_handle_id" covers "objects[3].raw_handle_id" and
        "objects[handle_semantic_id=x].raw_handle_id";
      * its last segment alone (leaf match, e.g. "raw_handle_id" anywhere).

    Args:
        file: Snapshot file name (accepted for interface symmetry; unused).
        path: Dotted field path, possibly containing "[...]" selectors.
        skip: Skip rules to test against.
    """
    if path in skip:
        return True
    # Blank the selectors BEFORE splitting on ".": keyed selectors embed
    # arbitrary values (e.g. "[relpath=a/b.bin]") whose dots would otherwise
    # be mistaken for path separators and corrupt the normalised form.
    flattened = re.sub(r"\[[^\]]*\]", "[]", path)
    segments = [
        seg.split("[", 1)[0] + "[]" if "[" in seg else seg
        for seg in flattened.split(".")
    ]
    return ".".join(segments) in skip or segments[-1] in skip
|
||
|
||
|
||
def diff_value(
    file: str,
    path: str,
    a: Any,
    b: Any,
    out: list[Divergence],
    skip: set[str],
    set_keys: dict[str, str] | None = None,
) -> None:
    """Recursively compare `a` (canary) against `b` (ours).

    Every difference is appended to `out` as a classified Divergence;
    nothing is returned.

    Args:
        file: Snapshot file name, used for skip rules and classification.
        path: Dotted path of the value being compared ("" for the root).
        a: Canary-side value.
        b: Ours-side value.
        out: Accumulator receiving the divergences.
        skip: Skip rules; a skipped path is not compared or descended into.
        set_keys: Maps an array field name to the member key used to pair
            its entries. Arrays not listed are compared positionally.
    """
    if is_skipped(file, path, skip):
        return
    # Exact type comparison on purpose: 1 vs 1.0 or True vs 1 is reported as
    # a type mismatch instead of being compared by value.
    if type(a) is not type(b):
        _record_divergence(out, file, path, "type-mismatch", a, b)
        return
    if isinstance(a, dict):
        _diff_mapping(file, path, a, b, out, skip, set_keys)
    elif isinstance(a, list):
        # Field name = last dotted segment with any "[...]" suffix removed.
        last_seg = path.rsplit(".", 1)[-1] if path else ""
        member_key = (set_keys or {}).get(last_seg.split("[", 1)[0])
        if member_key is not None:
            _diff_keyed_members(file, path, a, b, out, skip, set_keys, member_key)
        else:
            _diff_sequence(file, path, a, b, out, skip, set_keys)
    elif a != b:
        _record_divergence(out, file, path, "value", a, b)


def _record_divergence(out, file, path, kind, canary, ours):
    """Append one Divergence to `out`, classified from its own fields."""
    out.append(Divergence(file, path, kind, canary, ours,
                          classify(file, path, kind, canary, ours)))


def _diff_mapping(file, path, a, b, out, skip, set_keys):
    """Compare two dicts: report one-sided keys, then recurse into shared keys."""
    a_keys = set(a)
    b_keys = set(b)
    one_sided = (
        (sorted(a_keys - b_keys), "missing-field", a),
        (sorted(b_keys - a_keys), "extra-field", b),
    )
    for keys, kind, source in one_sided:
        for k in keys:
            sub = f"{path}.{k}" if path else k
            if is_skipped(file, sub, skip):
                continue
            if kind == "missing-field":
                _record_divergence(out, file, sub, kind, source[k], None)
            else:
                _record_divergence(out, file, sub, kind, None, source[k])
    for k in sorted(a_keys & b_keys):
        sub = f"{path}.{k}" if path else k
        diff_value(file, sub, a[k], b[k], out, skip, set_keys)


def _diff_keyed_members(file, path, a, b, out, skip, set_keys, key):
    """Compare two arrays as unordered collections paired by `key`.

    Members that are not dicts are ignored, and when several members share a
    key value only the last one is compared. The arrays are intentionally
    not sorted first: pairing is done by dict lookup, and sorting raw key
    values raises TypeError as soon as they are of mixed types or absent.
    """
    a_by = {x.get(key): x for x in a if isinstance(x, dict)}
    b_by = {x.get(key): x for x in b if isinstance(x, dict)}
    a_keys = set(a_by)
    b_keys = set(b_by)
    # key=str gives a deterministic order even for mixed-type key values.
    for m in sorted(a_keys - b_keys, key=str):
        _record_divergence(out, file, f"{path}[{key}={m}]",
                           "missing-from-ours", m, None)
    for e in sorted(b_keys - a_keys, key=str):
        _record_divergence(out, file, f"{path}[{key}={e}]",
                           "extra-in-ours", None, e)
    for ck in sorted(a_keys & b_keys, key=str):
        diff_value(file, f"{path}[{key}={ck}]", a_by[ck], b_by[ck],
                   out, skip, set_keys)


def _diff_sequence(file, path, a, b, out, skip, set_keys):
    """Compare two arrays index by index, reporting a length mismatch once."""
    if len(a) != len(b):
        _record_divergence(out, file, path, "seq-length", len(a), len(b))
    # zip() stops at the shorter array, i.e. only the common prefix is compared.
    for i, (left, right) in enumerate(zip(a, b)):
        diff_value(file, f"{path}[{i}]", left, right, out, skip, set_keys)
|
||
|
||
|
||
# ---------- file-level orchestration ----------
|
||
|
||
def load_json(p: Path) -> dict:
    """Read the UTF-8 encoded file at `p` and return the parsed JSON."""
    return json.loads(p.read_text(encoding="utf-8"))
|
||
|
||
|
||
def diff_directory(canary_dir: Path, ours_dir: Path) -> tuple[list[Divergence], dict]:
    """Diff the five snapshot files of two snapshot directories.

    Args:
        canary_dir: Directory holding the canary snapshot.
        ours_dir: Directory holding our engine's snapshot.

    Returns:
        ``(divergences, file_status)``. `file_status` maps each file name to
        "missing-in-canary", "missing-in-ours", "identical" or "diverged".
        "identical" means either that both manifests agree on a hash that
        was verified against the bytes on disk, or that the deep diff
        recorded nothing for the file once the skip rules were applied.
    """
    files = ["cpu_state.json", "memory.json", "kernel.json", "vfs.json", "config.json"]
    divergences: list[Divergence] = []
    canary_manifest = canary_dir / "manifest.json"
    ours_manifest = ours_dir / "manifest.json"
    manifest_canary = load_json(canary_manifest) if canary_manifest.exists() else {}
    manifest_ours = load_json(ours_manifest) if ours_manifest.exists() else {}
    file_status = {}
    for name in files:
        cp = canary_dir / name
        op = ours_dir / name
        if not cp.exists():
            divergences.append(Divergence(name, "<file>", "missing-file",
                                          "absent", "present", "sigma-structural"))
            file_status[name] = "missing-in-canary"
            continue
        if not op.exists():
            divergences.append(Divergence(name, "<file>", "missing-file",
                                          "present", "absent", "sigma-structural"))
            file_status[name] = "missing-in-ours"
            continue
        # Anything recorded past this point belongs to `name`; the final
        # status is derived from whether this count grows.
        recorded_before = len(divergences)
        ch = manifest_canary.get("files", {}).get(name)
        oh = manifest_ours.get("files", {}).get(name)
        if ch is not None and ch == oh:
            # Verify the manifest hashes against the actual file contents
            # before trusting them — a tampered file with an intact manifest
            # would otherwise be silently masked.
            ch_actual = hashlib.sha256(cp.read_bytes()).hexdigest()
            oh_actual = hashlib.sha256(op.read_bytes()).hexdigest()
            if ch_actual == ch and oh_actual == oh:
                file_status[name] = "identical"
                continue
            # Manifest claim does not match disk — fall through to the full
            # diff and surface the mismatch as a structural divergence.
            if ch_actual != ch:
                divergences.append(Divergence(
                    name, "<manifest>", "manifest-hash-mismatch", ch, ch_actual,
                    "sigma-structural"))
            if oh_actual != oh:
                divergences.append(Divergence(
                    name, "<manifest>", "manifest-hash-mismatch", oh, oh_actual,
                    "sigma-structural"))
        a = load_json(cp)
        b = load_json(op)
        skip = collect_skip_set(name, a) | collect_skip_set(name, b)
        diff_value(name, "", a, b, divergences, skip,
                   set_keys=SET_FIELDS.get(name))
        # Only call the file diverged when something was actually recorded;
        # files that differ solely in skipped fields are reported identical.
        file_status[name] = (
            "diverged" if len(divergences) > recorded_before else "identical"
        )
    return divergences, file_status
|
||
|
||
|
||
# ---------- invariants ----------
|
||
|
||
def _canonicalize_image(image: bytes, xex_meta: dict, image_base: int) -> bytes:
    """Return a copy of `image` with every XEX import slot filled with 0xCD.

    Import patches are legitimate engine-specific runtime overlays, so they
    would break a naive byte-equality check even when both engines decoded
    the XEX identically. Slot width depends on the import's record type:
    record_type 0 (variable slot) covers 4 bytes, record_type 1 (thunk)
    covers 16 bytes; other record types are left alone. A slot that does not
    lie entirely inside the image is skipped.
    """
    masked = bytearray(image)
    for library in xex_meta.get("import_libraries", []):
        for entry in library.get("imports", []):
            address = entry["address"]
            record_type = entry["record_type"]
            if record_type == 0:
                width = 4
            elif record_type == 1:
                width = 16
            else:
                continue
            # Guest virtual addresses -> offsets into the image buffer.
            lo = address - image_base
            hi = address + width - image_base
            if lo < 0 or hi > len(masked):
                continue
            masked[lo:hi] = b"\xCD" * (hi - lo)
    return bytes(masked)
|
||
|
||
|
||
def check_invariants(
    canary_dir: Path, ours_dir: Path, xex_json: Path | None = None
) -> tuple[list[tuple[str, str, str, bool]], bool]:
    """Evaluate the hard-gate invariants for a pair of snapshots.

    Args:
        canary_dir: Directory holding the canary snapshot.
        ours_dir: Directory holding our engine's snapshot.
        xex_json: Optional path to xex.json (import table + image base).

    Returns:
        ``(rows, stop)`` where each row is ``(name, canary_val, ours_val,
        ok)`` and `stop` is True iff any STOP-class invariant failed. If
        config.json or cpu_state.json is missing on either side, a single
        failing ``file_present:<path>`` row is returned with ``stop=True``.

    STOP-class invariants: `xex_entry_point` equal on both sides,
    `cpu_state.pc` equal to the entry point on each side, `iso_sha256` equal
    on both sides, and the image-load hash.

    When `xex_json` is provided AND both snapshots contain `image.bin`, the
    image-load invariant is computed over a canonicalized buffer (XEX import
    slots masked). This relaxes the raw-bytes check to the only meaningful
    semantic one — both engines decoded the XEX identically — and avoids
    tripping on legitimate runtime import patches (canary's 0xDEADC0DE vs
    ours's 0x00000000 sentinels). Otherwise the raw `image_loaded_sha256`
    is the STOP key.
    """
    try:
        c_cfg = load_json(canary_dir / "config.json")
        o_cfg = load_json(ours_dir / "config.json")
        c_cpu = load_json(canary_dir / "cpu_state.json")
        o_cpu = load_json(ours_dir / "cpu_state.json")
    except FileNotFoundError as e:
        return [(f"file_present:{e.filename}", "", "", False)], True

    rows = []
    stop = False

    c_entry = c_cfg.get("xex_entry_point")
    o_entry = o_cfg.get("xex_entry_point")
    entry_ok = c_entry == o_entry
    rows.append(("xex_entry_point", str(c_entry), str(o_entry), entry_ok))
    if not entry_ok:
        stop = True

    c_pc = c_cpu.get("pc")
    o_pc = o_cpu.get("pc")
    pc_match = c_pc == c_entry and o_pc == o_entry
    rows.append((
        "cpu_state.pc == xex_entry_point",
        f"{c_pc} == {c_entry}",
        f"{o_pc} == {o_entry}",
        pc_match,
    ))
    if not pc_match:
        stop = True

    # iso_sha256 is a declared STOP field: if the engines booted different
    # media, no downstream comparison is interpretable.
    c_iso = c_cfg.get("iso_sha256")
    o_iso = o_cfg.get("iso_sha256")
    iso_ok = c_iso == o_iso
    rows.append(("iso_sha256", c_iso or "", o_iso or "", iso_ok))
    if not iso_ok:
        stop = True

    c_img = c_cfg.get("image_loaded_sha256")
    o_img = o_cfg.get("image_loaded_sha256")
    # Raw hash — informational. A mismatch is expected when the engines
    # patch imports differently, so by itself this row does not STOP.
    rows.append((
        "image_loaded_sha256 (raw)",
        c_img or "",
        o_img or "",
        c_img == o_img,
    ))

    # Canonical hash — the real equivalence check. It needs image.bin from
    # both engines (--phase-b-dump-section-content) AND a caller-supplied
    # xex.json carrying the import table.
    c_img_bin = canary_dir / "image.bin"
    o_img_bin = ours_dir / "image.bin"
    canonical_available = (
        xex_json is not None
        and c_img_bin.exists()
        and o_img_bin.exists()
    )
    if canonical_available:
        # Same UTF-8 loader as every other JSON input of this tool.
        xex_meta = load_json(Path(xex_json))
        image_base = xex_meta.get("image_base", 0x82000000)
        c_canon = _canonicalize_image(c_img_bin.read_bytes(), xex_meta, image_base)
        o_canon = _canonicalize_image(o_img_bin.read_bytes(), xex_meta, image_base)
        c_canon_h = hashlib.sha256(c_canon).hexdigest()
        o_canon_h = hashlib.sha256(o_canon).hexdigest()
        canon_ok = c_canon_h == o_canon_h
        rows.append((
            "image_canonical_sha256",
            c_canon_h,
            o_canon_h,
            canon_ok,
        ))
        if not canon_ok:
            stop = True
    elif c_img != o_img:
        # No canonicalization possible — fall back to the raw hash as the
        # STOP key, preserving the original Phase B semantics.
        stop = True
    return rows, stop
|
||
|
||
|
||
# ---------- report writing ----------
|
||
|
||
def write_report(out_path: Path, canary_dir: Path, ours_dir: Path,
                 divergences: list[Divergence], file_status: dict,
                 invariants: list, stop: bool):
    """Render the markdown report and write it to `out_path` as UTF-8.

    Layout: header, invariants table, an optional STOP banner, a per-file
    summary with divergence counts by class, one section per non-empty
    class (at most 200 entries each, with an overflow note), and the
    Phase C handoff paragraph.
    """
    # (class label, section title) in report order; the same order is used
    # for the per-file count column.
    sections = [
        ("sigma-structural", "σ-structural divergences (priority 1)"),
        ("delta-content-STOP", "δ-content STOP divergences"),
        ("delta-content", "δ-content divergences (priority 2)"),
        ("gamma-kernel-content", "γ-kernel-content divergences (priority 2)"),
        ("kappa-cache", "κ-cache divergences (re-run after pre-clean)"),
        ("epsilon-host-allocator", "ε-host-allocator (informational)"),
        ("tau-host-timing", "τ-host-timing (informational)"),
    ]

    md = [
        "# Phase B snapshot diff",
        "",
        f"- canary snapshot: `{canary_dir}`",
        f"- ours snapshot: `{ours_dir}`",
        "",
        "## Invariants (HARD GATE)",
        "",
        "| invariant | canary | ours | ok? |",
        "|---|---|---|---|",
    ]
    md.extend(
        f"| {name} | `{cval}` | `{oval}` | {'PASS' if ok else 'FAIL'} |"
        for name, cval, oval, ok in invariants
    )
    md.append("")
    if stop:
        md.append("> **STOP**: a primary equivalence invariant failed. "
                  "Downstream divergences are not interpretable until this is "
                  "resolved. Re-run with `--phase-b-dump-section-content` on both "
                  "engines and binary-diff the regions to localize.")
        md.append("")

    # Count divergences per (file, class) for the summary table.
    tally: dict[tuple[str, str], int] = {}
    for div in divergences:
        cell = (div.file, div.klass)
        tally[cell] = tally.get(cell, 0) + 1

    md += [
        "## File-level summary",
        "",
        "| file | status | divergence count by class |",
        "|---|---|---|",
    ]
    for fname, status in file_status.items():
        cells = [
            f"{klass}={tally[(fname, klass)]}"
            for klass, _title in sections
            if tally.get((fname, klass), 0)
        ]
        md.append(f"| {fname} | {status} | {' '.join(cells) if cells else '—'} |")
    md.append("")

    # Per-class sections.
    grouped: dict[str, list[Divergence]] = {}
    for div in divergences:
        grouped.setdefault(div.klass, []).append(div)
    for klass, title in sections:
        members = grouped.get(klass, [])
        if not members:
            continue
        md += [f"## {title}", ""]
        md.extend(
            f"- **{d.file}** `{d.path}`: kind=`{d.kind}` "
            f"canary=`{d.canary!r}` ours=`{d.ours!r}`"
            for d in members[:200]  # cap each section
        )
        if len(members) > 200:
            md.append(f"- _… {len(members) - 200} more in this class (see report.json)_")
        md.append("")

    md += [
        "## Phase C handoff",
        "",
        "Suggested attack order: σ first (structural), then γ ranked by "
        "object type (Thread > Event > Semaphore > Mutex > Timer > File > "
        "Other), then δ. ε and τ are catalog-only.",
    ]
    out_path.write_text("\n".join(md), encoding="utf-8")
|
||
|
||
|
||
def write_report_json(out_path: Path, divergences: list[Divergence],
                      file_status: dict, invariants: list, stop: bool):
    """Write the machine-readable report to `out_path` as UTF-8 JSON.

    The document carries the schema version, the invariant rows, the STOP
    flag, the per-file status map and every divergence record. Output is
    indented by two spaces with keys sorted.
    """
    invariant_rows = []
    for name, canary_val, ours_val, passed in invariants:
        invariant_rows.append(
            {"name": name, "canary": canary_val, "ours": ours_val, "ok": passed}
        )
    payload = {
        "schema_version": SCHEMA_VERSION,
        "invariants": invariant_rows,
        "stop": stop,
        "file_status": file_status,
        "divergences": [record.to_dict() for record in divergences],
    }
    serialized = json.dumps(payload, indent=2, sort_keys=True)
    out_path.write_text(serialized, encoding="utf-8")
|
||
|
||
|
||
# ---------- CLI ----------
|
||
|
||
def main():
    """Command-line entry point; always terminates through sys.exit().

    Exit status: 0 when nothing diverges (or `--validate-identical`
    succeeds), 1 when divergences are found, 2 when a snapshot directory is
    missing or a STOP invariant failed.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("--canary", required=True)
    parser.add_argument("--ours", required=True)
    parser.add_argument("--out", default=None)
    parser.add_argument("--xex-json", default=None,
                        help="optional xex.json metadata for canonical image-load "
                             "invariant (requires image.bin in both snapshot dirs)")
    parser.add_argument("--validate-identical", action="store_true")
    args = parser.parse_args()

    canary_dir = Path(args.canary)
    ours_dir = Path(args.ours)
    if not (canary_dir.is_dir() and ours_dir.is_dir()):
        print(f"both snapshot dirs must exist: {canary_dir} {ours_dir}", file=sys.stderr)
        sys.exit(2)

    xex_json = Path(args.xex_json) if args.xex_json else None
    invariants, stop = check_invariants(canary_dir, ours_dir, xex_json)
    divergences, file_status = diff_directory(canary_dir, ours_dir)

    if args.validate_identical:
        # Pass/fail only: no report files are written in this mode.
        clean = not divergences and all(ok for _, _, _, ok in invariants)
        if not clean:
            print("validate-identical: differences found", file=sys.stderr)
            sys.exit(1)
        print("validate-identical: OK")
        sys.exit(0)

    # Default report location sits next to the canary snapshot directory;
    # the JSON sibling shares the markdown file's stem.
    out_md = Path(args.out) if args.out else (canary_dir.parent / "report.md")
    out_json = out_md.with_suffix(".json")
    write_report(out_md, canary_dir, ours_dir, divergences, file_status,
                 invariants, stop)
    write_report_json(out_json, divergences, file_status, invariants, stop)
    print(f"wrote {out_md} ({len(divergences)} divergences)")
    print(f"wrote {out_json}")

    # STOP outranks ordinary divergences.
    sys.exit(2 if stop else 1 if divergences else 0)
|
||
|
||
|
||
# Run the CLI only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()
|