From 5c2bc61fd63ea1fb0f3cd7eaedbcaea4c8ef1f1c Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 6 May 2026 02:42:25 +0000
Subject: [PATCH 1/2] Add self-test harness, integration tests, SLA budgets,
 and pipeline contracts

Agent-Logs-Url: https://github.com/DaScient-Intelligence/Plan-Examiner/sessions/594db8e5-858f-4cf8-ba13-0eb0a71df477

Co-authored-by: DaScient <25983786+DaScient@users.noreply.github.com>
---
 .../data/fixtures/selftest/clean-office.dxf   | 110 ++++++++
 assets/data/fixtures/selftest/expected.json   |  86 ++++++
 .../selftest/non-compliant-assembly.dxf       |  86 ++++++
 .../fixtures/selftest/sparse-warehouse.dxf    |  26 ++
 assets/js/agent/pipeline.js                   | 127 ++++++++-
 assets/js/agent/self-test.js                  | 258 ++++++++++++++++++
 tests/integration.pipeline.test.js            | 111 ++++++++
 tests/rules.schema.test.js                    |  25 ++
 8 files changed, 823 insertions(+), 6 deletions(-)
 create mode 100644 assets/data/fixtures/selftest/clean-office.dxf
 create mode 100644 assets/data/fixtures/selftest/expected.json
 create mode 100644 assets/data/fixtures/selftest/non-compliant-assembly.dxf
 create mode 100644 assets/data/fixtures/selftest/sparse-warehouse.dxf
 create mode 100644 assets/js/agent/self-test.js
 create mode 100644 tests/integration.pipeline.test.js
 create mode 100644 tests/rules.schema.test.js

diff --git a/assets/data/fixtures/selftest/clean-office.dxf b/assets/data/fixtures/selftest/clean-office.dxf
new file mode 100644
index 0000000..45b1502
--- /dev/null
+++ b/assets/data/fixtures/selftest/clean-office.dxf
@@ -0,0 +1,110 @@
+  0
+SECTION
+  2
+ENTITIES
+  0
+TEXT
+  8
+A-TITLE
+  1
+PROJECT: SAMPLE OFFICE BUILDING
+  0
+TEXT
+  8
+A-TITLE
+  1
+GROSS FLOOR AREA: 12000 sq ft
+  0
+TEXT
+  8
+A-EGRESS
+  1
+OCCUPANT LOAD: 80
+  0
+TEXT
+  8
+A-EGRESS
+  1
+NUMBER OF STORIES: 2
+  0
+TEXT
+  8
+A-EGRESS
+  1
+BUILDING HEIGHT: 24 ft
+  0
+TEXT
+  8
+A-CORR
+  1
+CORRIDOR WIDTH: 48 in
+  0
+TEXT
+  8
+A-DOOR
+  1
+DOOR CLEAR WIDTH: 36 in
+  0
+TEXT
+  8
+A-STAIR
+  1
+STAIR TREAD: 11 in
+  0
+TEXT
+  8
+A-STAIR
+  1
+STAIR RISER: 7 in
+  0
+TEXT
+  8
+A-STAIR
+  1
+STAIR WIDTH: 44 in
+  0
+TEXT
+  8
+A-FIRE
+  1
+FIRE SPRINKLER NFPA 13 SYSTEM PROVIDED
+  0
+TEXT
+  8
+A-FIRE
+  1
+FIRE ALARM NFPA 72 PROVIDED
+  0
+TEXT
+  8
+A-FIRE
+  1
+EXIT SIGN AT EACH DOOR
+  0
+TEXT
+  8
+A-FIRE
+  1
+EMERGENCY LIGHTING WITH BATTERY BACKUP
+  0
+TEXT
+  8
+A-PARK
+  1
+TOTAL PARKING: 40
+  0
+TEXT
+  8
+A-PARK
+  1
+ACCESSIBLE PARKING: 2
+  0
+TEXT
+  8
+A-OCC
+  1
+OCCUPANCY GROUP: B
+  0
+ENDSEC
+  0
+EOF
diff --git a/assets/data/fixtures/selftest/expected.json b/assets/data/fixtures/selftest/expected.json
new file mode 100644
index 0000000..91cae31
--- /dev/null
+++ b/assets/data/fixtures/selftest/expected.json
@@ -0,0 +1,86 @@
+{
+  "$comment": "Golden expectations for Plan-Examiner self-test fixtures. Each entry's flagged_ids must be a SUBSET of actual FLAGGED finding ids; counts/score use inclusive [min,max] bands tolerant of rule-pack growth. min_facts is a lower bound on extracted fact keys (excluding internal _ keys and form-injected metadata).",
+  "version": "1.0.0",
+  "generated_against": {
+    "engine_version": "2.0.0",
+    "rules_index_version": "3.0.0",
+    "date": "2026-05-06"
+  },
+  "fixtures": [
+    {
+      "id": "clean-office",
+      "file": "clean-office.dxf",
+      "label": "Compliant 2-story office (Use Group B)",
+      "form_data": { "buildingType": "Commercial", "buildingCode": "2024 IBC", "city": "Test", "state": "CA", "country": "US" },
+      "expected": {
+        "source": "dxf",
+        "use_group": "B",
+        "min_facts": 12,
+        "required_fact_keys": [
+          "grossArea", "occupantLoad", "stories", "buildingHeightFt",
+          "corridorWidthInches", "doorWidthInches", "stairTreadDepthIn",
+          "stairRiserHeightIn", "stairWidthInches",
+          "totalParkingSpaces", "accessibleParkingSpaces", "occupancyGroup"
+        ],
+        "required_bool_flags": {
+          "hasSprinklers": true,
+          "hasFireAlarm": true,
+          "hasExitSigns": true,
+          "hasEmergencyLighting": true
+        },
+        "must_flag_ids": [],
+        "must_not_flag_ids": ["IBC-1011.5", "IBC-1010.1", "ADA-404.2.3"],
+        "counts": {
+          "FLAGGED": { "min": 0, "max": 1 },
+          "REVIEW":  { "min": 30, "max": 200 },
+          "PASS":    { "min": 8,  "max": 200 }
+        },
+        "score_band": { "min": 60, "max": 100 }
+      }
+    },
+    {
+      "id": "non-compliant-assembly",
+      "file": "non-compliant-assembly.dxf",
+      "label": "Assembly hall with substandard egress (Use Group A)",
+      "form_data": { "buildingType": "Commercial", "buildingCode": "2024 IBC", "city": "Test", "state": "NY", "country": "US" },
+      "expected": {
+        "source": "dxf",
+        "use_group": "A",
+        "min_facts": 10,
+        "required_fact_keys": [
+          "grossArea", "occupantLoad", "corridorWidthInches",
+          "doorWidthInches", "stairTreadDepthIn", "stairRiserHeightIn",
+          "occupancyGroup"
+        ],
+        "must_flag_ids": ["IBC-1011.5", "IBC-1010.1", "ADA-404.2.3"],
+        "must_not_flag_ids": [],
+        "counts": {
+          "FLAGGED": { "min": 3,  "max": 50 },
+          "REVIEW":  { "min": 20, "max": 200 },
+          "PASS":    { "min": 0,  "max": 200 }
+        },
+        "score_band": { "min": 30, "max": 80 }
+      }
+    },
+    {
+      "id": "sparse-warehouse",
+      "file": "sparse-warehouse.dxf",
+      "label": "Sparse warehouse with minimal annotations (Use Group S)",
+      "form_data": { "buildingType": "Industrial", "buildingCode": "2024 IBC", "city": "Test", "state": "TX", "country": "US" },
+      "expected": {
+        "source": "dxf",
+        "use_group": "S",
+        "min_facts": 1,
+        "required_fact_keys": ["grossArea", "occupancyGroup"],
+        "must_flag_ids": [],
+        "must_not_flag_ids": [],
+        "counts": {
+          "FLAGGED": { "min": 0,  "max": 5 },
+          "REVIEW":  { "min": 10, "max": 200 },
+          "PASS":    { "min": 0,  "max": 200 }
+        },
+        "score_band": { "min": 40, "max": 100 }
+      }
+    }
+  ]
+}
diff --git a/assets/data/fixtures/selftest/non-compliant-assembly.dxf b/assets/data/fixtures/selftest/non-compliant-assembly.dxf
new file mode 100644
index 0000000..7f9a9d8
--- /dev/null
+++ b/assets/data/fixtures/selftest/non-compliant-assembly.dxf
@@ -0,0 +1,86 @@
+  0
+SECTION
+  2
+ENTITIES
+  0
+TEXT
+  8
+A-TITLE
+  1
+PROJECT: NON-COMPLIANT ASSEMBLY HALL
+  0
+TEXT
+  8
+A-TITLE
+  1
+GROSS FLOOR AREA: 8000 sq ft
+  0
+TEXT
+  8
+A-EGRESS
+  1
+OCCUPANT LOAD: 600
+  0
+TEXT
+  8
+A-EGRESS
+  1
+NUMBER OF STORIES: 1
+  0
+TEXT
+  8
+A-EGRESS
+  1
+BUILDING HEIGHT: 18 ft
+  0
+TEXT
+  8
+A-CORR
+  1
+CORRIDOR WIDTH: 30 in
+  0
+TEXT
+  8
+A-DOOR
+  1
+DOOR CLEAR WIDTH: 28 in
+  0
+TEXT
+  8
+A-STAIR
+  1
+STAIR TREAD: 9 in
+  0
+TEXT
+  8
+A-STAIR
+  1
+STAIR RISER: 8.5 in
+  0
+TEXT
+  8
+A-OCC
+  1
+OCCUPANCY GROUP: A
+  0
+TEXT
+  8
+A-OCC
+  1
+USE: ASSEMBLY HALL RESTAURANT
+  0
+TEXT
+  8
+A-PARK
+  1
+TOTAL PARKING: 50
+  0
+TEXT
+  8
+A-PARK
+  1
+ACCESSIBLE PARKING: 1
+  0
+ENDSEC
+  0
+EOF
diff --git a/assets/data/fixtures/selftest/sparse-warehouse.dxf b/assets/data/fixtures/selftest/sparse-warehouse.dxf
new file mode 100644
index 0000000..aae44f0
--- /dev/null
+++ b/assets/data/fixtures/selftest/sparse-warehouse.dxf
@@ -0,0 +1,26 @@
+  0
+SECTION
+  2
+ENTITIES
+  0
+TEXT
+  8
+A-TITLE
+  1
+PROJECT: SPARSE INDUSTRIAL WAREHOUSE
+  0
+TEXT
+  8
+A-TITLE
+  1
+GROSS FLOOR AREA: 25000 sq ft
+  0
+TEXT
+  8
+A-OCC
+  1
+USE: WAREHOUSE STORAGE INDUSTRIAL
+  0
+ENDSEC
+  0
+EOF
diff --git a/assets/js/agent/pipeline.js b/assets/js/agent/pipeline.js
index 6e5bea6..321c972 100644
--- a/assets/js/agent/pipeline.js
+++ b/assets/js/agent/pipeline.js
@@ -31,6 +31,91 @@ PE.Pipeline = (function () {
   var BASE_RULES_PATH = 'assets/data/rules/';
   var PLACEHOLDERS_KEY = 'pe.rulePlaceholders';
 
+  // Engine version is the runtime "what code did the work" stamp. Updated
+  // by hand when the pipeline contract changes; also surfaced in result.
+  var ENGINE_VERSION = '2.0.0';
+
+  // Per-step performance budgets (milliseconds). Steps that exceed their
+  // budget emit a single WARN entry to PE.Log so a slow upload never goes
+  // unnoticed — but never fail the run. Also exported for the perf test
+  // suite to enforce.
+  var SLA = {
+    ingest:   15000,
+    classify:   500,
+    extract:   8000,
+    select:    3000,
+    evaluate:  2000,
+    cite:       500,
+    draft:    20000,
+    total:    30000
+  };
+
+  // Monotonic-ish run id counter for log correlation.
+  var _runSeq = 0;
+  function _newRunId() {
+    _runSeq++;
+    var rand = Math.random().toString(36).slice(2, 8);
+    return 'run-' + Date.now().toString(36) + '-' + _runSeq + '-' + rand;
+  }
+
+  function _checkBudget(L, stepId, durationMs) {
+    var budget = SLA[stepId];
+    if (typeof budget === 'number' && durationMs > budget && L) {
+      L.warn('pipeline', 'SLA breach: ' + stepId + ' took ' + durationMs + 'ms (budget ' + budget + 'ms)',
+        { stepId: stepId, durationMs: durationMs, budgetMs: budget });
+    }
+  }
+
+  /**
+   * Pipeline contract guards. Each step has a structural invariant that
+   * must hold; violations throw a structured error rather than corrupting
+   * downstream state silently. Throws are caught by the surrounding
+   * try/catch and surfaced via emit(stepId,'error',...) + PE.Log.
+   */
+  function _assertExtractionShape(ext) {
+    if (!ext || typeof ext !== 'object') throw _contractErr('ingest', 'extraction must be an object');
+    if (typeof ext.source !== 'string')  throw _contractErr('ingest', 'extraction.source must be a string');
+    if (ext.unsupported) return; // unsupported branches return early; no further shape required
+    if (!ext.facts || typeof ext.facts !== 'object') throw _contractErr('ingest', 'extraction.facts must be an object');
+    var hasContent = (typeof ext.text === 'string') || Array.isArray(ext.layers) || Array.isArray(ext.pages);
+    if (!hasContent) throw _contractErr('ingest', 'extraction must include text/layers/pages');
+  }
+  function _assertFindingsShape(findings) {
+    if (!Array.isArray(findings)) throw _contractErr('evaluate', 'findings must be an array');
+    for (var i = 0; i < findings.length; i++) {
+      var f = findings[i];
+      if (!f || typeof f !== 'object')        throw _contractErr('evaluate', 'finding[' + i + '] is not an object');
+      if (typeof f.id !== 'string' || !f.id)  throw _contractErr('evaluate', 'finding[' + i + '].id missing');
+      if (['PASS', 'REVIEW', 'FLAGGED'].indexOf(f.status) === -1) {
+        throw _contractErr('evaluate', 'finding[' + i + '].status invalid: ' + f.status);
+      }
+    }
+  }
+  function _contractErr(step, msg) {
+    var e = new Error('Pipeline contract violation at ' + step + ': ' + msg);
+    e.code   = 'PIPELINE_CONTRACT';
+    e.step   = step;
+    return e;
+  }
+
+  /**
+   * Compute a short, deterministic fingerprint of the loaded rule packs.
+   * Stamped onto every result so a saved/exported report is reproducible.
+   * Cheap FNV-1a over the sorted (id, version, ruleCount) tuples.
+   */
+  function _fingerprintPacks(packs) {
+    var parts = (packs || []).map(function (p) {
+      return (p.id || '') + '@' + (p.version || '?') + ':' + ((p.rules || []).length);
+    }).sort();
+    var s = parts.join('|');
+    var h = 0x811c9dc5 >>> 0;
+    for (var i = 0; i < s.length; i++) {
+      h ^= s.charCodeAt(i);
+      h = (h + ((h << 1) + (h << 4) + (h << 7) + (h << 8) + (h << 24))) >>> 0;
+    }
+    return ('00000000' + h.toString(16)).slice(-8);
+  }
+
   // ── Rule pack loader ─────────────────────────────────────────────────
   var _packCache = {};
 
@@ -179,8 +264,14 @@ PE.Pipeline = (function () {
     function _stepLog(stepId, status, detail, data) {
       if (L) L.info('pipeline', stepId + ' ' + status + ': ' + (detail || ''), data || null);
     }
-    var result = { facts: {}, packs: [], findings: [], score: 0, summary: '', correctionLetter: '' };
-    if (L) L.info('pipeline', 'Pipeline start', { file: file.name, size: file.size, formData: formData });
+    var result = {
+      facts: {}, packs: [], findings: [], score: 0, summary: '', correctionLetter: '',
+      runId: _newRunId(),
+      engineVersion: ENGINE_VERSION,
+      rulesVersion: null,         // filled in once packs are selected
+      startedAt: new Date().toISOString()
+    };
+    if (L) L.info('pipeline', 'Pipeline start', { runId: result.runId, engineVersion: ENGINE_VERSION, file: file.name, size: file.size, formData: formData });
 
     // ── Step 1: Ingest ─────────────────────────────────────────────
     var sT0 = _now();
@@ -197,6 +288,7 @@ PE.Pipeline = (function () {
       });
       var sT1 = _now();
       var ingestMs = Math.round(sT1 - sT0);
+      _checkBudget(L, 'ingest', ingestMs);
       if (extraction.unsupported) {
         var unsupMsg = extraction.unsupportedReason ||
           (extraction.source === 'dwg'
@@ -227,6 +319,7 @@ PE.Pipeline = (function () {
         sha256: extraction.fileMeta && extraction.fileMeta.sha256
       });
       if (extraction.warning && extraction.warningMsg && L) L.warn('pipeline', extraction.warningMsg, { warning: extraction.warning });
+      _assertExtractionShape(extraction);
     } catch (err) {
       emit('ingest', 'error', 'Ingestion failed: ' + err.message);
       if (L) L.error('pipeline', 'ingest failed: ' + err.message, { error: err && err.stack });
@@ -247,6 +340,7 @@ PE.Pipeline = (function () {
     var classifyDetail = 'Classified as ' + facts.buildingType + (useGroup !== facts.buildingType ? ' (IBC Use Group: ' + useGroup + ')' : '') + '.';
     emit('classify', 'done', classifyDetail);
     _stepLog('classify', 'done', classifyDetail, { durationMs: Math.round(_now() - sT0), buildingType: facts.buildingType, useGroup: useGroup });
+    _checkBudget(L, 'classify', Math.round(_now() - sT0));
 
     // ── Step 3: Extract Facts (regex + optional AI vision) ────────
     sT0 = _now();
@@ -323,6 +417,7 @@ PE.Pipeline = (function () {
       durationMs: Math.round(_now() - sT0), factsCount: extracted.length, factKeys: extracted,
       visionStatus: visionStatus, visionReason: visionReason || null
     });
+    _checkBudget(L, 'extract', Math.round(_now() - sT0));
     result.facts = facts;
 
     // ── Step 4: Select Rules ──────────────────────────────────────
@@ -333,12 +428,15 @@ PE.Pipeline = (function () {
     try {
       packs = await selectPacks(formData.buildingCode || '2024 IBC', facts.buildingType);
       result.packs = packs;
+      result.rulesVersion = _fingerprintPacks(packs);
       var selectDetail = packs.length + ' rule pack(s) loaded: ' + packs.map(function (p) { return p.name; }).join(', ') + '.';
       emit('select', 'done', selectDetail);
       _stepLog('select', 'done', selectDetail, {
         durationMs: Math.round(_now() - sT0),
-        packs: packs.map(function (p) { return { id: p.id, name: p.name, ruleCount: (p.rules || []).length }; })
+        rulesVersion: result.rulesVersion,
+        packs: packs.map(function (p) { return { id: p.id, name: p.name, version: p.version || null, ruleCount: (p.rules || []).length }; })
       });
+      _checkBudget(L, 'select', Math.round(_now() - sT0));
     } catch (err) {
       emit('select', 'error', 'Failed to load rule packs: ' + err.message);
       if (L) L.error('pipeline', 'select failed: ' + err.message, { error: err && err.stack });
@@ -374,6 +472,7 @@ PE.Pipeline = (function () {
       });
       if (L) L.info('pipeline', 'added ' + result.visionConflicts.length + ' vision-conflict REVIEW finding(s)', { conflicts: result.visionConflicts.length });
     }
+    _assertFindingsShape(findings);
     var compScore = PE.RuleEngine.score(findings);
     result.findings = findings;
     result.score    = compScore;
@@ -395,6 +494,7 @@ PE.Pipeline = (function () {
       score:     compScore,
       coverage:  result.coverage ? { keys: result.coverage.length, missing: result.coverage.filter(function (c) { return c.missing; }).length } : null
     });
+    _checkBudget(L, 'evaluate', Math.round(_now() - sT0));
 
     // ── Step 6: Cite ──────────────────────────────────────────────
     sT0 = _now();
@@ -405,6 +505,7 @@ PE.Pipeline = (function () {
     var citeDetail = citedCount + ' citations attached from ' + packs.map(function (p) { return p.name; }).join(', ') + '.';
     emit('cite', 'done', citeDetail);
     _stepLog('cite', 'done', citeDetail, { durationMs: Math.round(_now() - sT0), cited: citedCount });
+    _checkBudget(L, 'cite', Math.round(_now() - sT0));
 
     // ── Step 7: Draft ─────────────────────────────────────────────
     sT0 = _now();
@@ -426,8 +527,16 @@ PE.Pipeline = (function () {
       emit('draft', 'error', 'LLM draft failed (' + err.message + ') — deterministic summary used.');
       if (L) L.error('pipeline', 'draft failed: ' + err.message, { error: err && err.stack });
     }
-
-    if (L) L.info('pipeline', 'Pipeline complete', { totalMs: Math.round(_now() - pipeT0), score: result.score, findings: result.findings.length });
+    _checkBudget(L, 'draft', Math.round(_now() - sT0));
+
+    var totalMs = Math.round(_now() - pipeT0);
+    result.completedAt = new Date().toISOString();
+    result.totalMs     = totalMs;
+    _checkBudget(L, 'total', totalMs);
+    if (L) L.info('pipeline', 'Pipeline complete', {
+      runId: result.runId, totalMs: totalMs, score: result.score,
+      findings: result.findings.length, engineVersion: result.engineVersion, rulesVersion: result.rulesVersion
+    });
 
     return result;
   }
@@ -487,7 +596,13 @@ PE.Pipeline = (function () {
     return 'B'; // default
   }
 
-  return { run: run, STEPS: STEPS, loadPack: loadPack, selectPacks: selectPacks, getStoredPlaceholders: getStoredPlaceholders, setStoredPlaceholders: setStoredPlaceholders };
+  return {
+    run: run, STEPS: STEPS,
+    SLA: SLA, ENGINE_VERSION: ENGINE_VERSION,
+    loadPack: loadPack, selectPacks: selectPacks,
+    getStoredPlaceholders: getStoredPlaceholders, setStoredPlaceholders: setStoredPlaceholders,
+    fingerprintPacks: _fingerprintPacks
+  };
 
 }());
 
diff --git a/assets/js/agent/self-test.js b/assets/js/agent/self-test.js
new file mode 100644
index 0000000..93251aa
--- /dev/null
+++ b/assets/js/agent/self-test.js
@@ -0,0 +1,258 @@
+/**
+ * Plan-Examiner Self-Test Harness (PE.SelfTest)
+ *
+ * Loads bundled selftest fixtures and runs them through the deterministic
+ * extract → select → evaluate → score path, then asserts each fixture's
+ * golden expectations from `assets/data/fixtures/selftest/expected.json`.
+ *
+ * Designed to run in BOTH the browser (where it powers the in-app
+ * "Run Diagnostics" button) and Node (where `scripts/status.mjs` and
+ * `tests/integration.pipeline.test.js` import it via the test loader).
+ *
+ * The harness intentionally exercises the same code paths the upload
+ * pipeline uses for DXF — `PE.Extractors.fromDxf`, `PE.Pipeline.selectPacks`,
+ * and `PE.RuleEngine.evaluate` — so a green run is concrete proof that
+ * uploaded plans really are scanned, evaluated, and scored.
+ *
+ * Usage (browser console, or via the Run Diagnostics button):
+ *     await PE.SelfTest.run();   // returns { ok, summary, results }
+ *
+ * No network or LLM calls. No data leaves the browser.
+ */
+
+var PE = (typeof window !== 'undefined' && window.PE) ? window.PE : (typeof global !== 'undefined' && global.PE) || {};
+
+PE.SelfTest = (function () {
+  'use strict';
+
+  var FIXTURES_BASE = 'assets/data/fixtures/selftest/';
+
+  function _L() { return (PE && PE.Log) ? PE.Log : null; }
+  function _log(level, msg, data) { var L = _L(); if (L && L[level]) L[level]('selftest', msg, data || null); }
+
+  function _now() {
+    return (typeof performance !== 'undefined' && performance.now) ? performance.now() : Date.now();
+  }
+
+  /**
+   * Loads `expected.json` and a fixture file as text. Uses fetch when
+   * available (browser + Node 18+); the Node test loader installs a
+   * file-system fetch shim so the same code works under `node --test`.
+   */
+  async function _loadText(url) {
+    var resp = await fetch(url);
+    if (!resp.ok) throw new Error('Failed to load ' + url + ' (' + resp.status + ')');
+    return await resp.text();
+  }
+
+  async function _loadJson(url) {
+    return JSON.parse(await _loadText(url));
+  }
+
+  function _inBand(value, band) {
+    if (!band) return true;
+    if (typeof band.min === 'number' && value < band.min) return false;
+    if (typeof band.max === 'number' && value > band.max) return false;
+    return true;
+  }
+
+  function _missing(arr, want) {
+    return (want || []).filter(function (k) { return arr.indexOf(k) === -1; });
+  }
+
+  function _factKeysOf(facts) {
+    return Object.keys(facts || {}).filter(function (k) {
+      if (k.charAt(0) === '_') return false;                                       // internal
+      if (k === 'buildingType' || k === 'buildingCode' || k === 'city' ||
+          k === 'state' || k === 'country') return false;                          // form-injected
+      var v = facts[k];
+      return v !== null && v !== undefined && v !== '';
+    });
+  }
+
+  /**
+   * Run a single fixture. Returns a structured result. Never throws —
+   * any unexpected error becomes `{ ok:false, error:... }` so the
+   * harness can complete and report all fixtures.
+   */
+  async function runFixture(fx, base) {
+    var t0 = _now();
+    var result = {
+      id: fx.id,
+      file: fx.file,
+      label: fx.label,
+      ok: false,
+      durationMs: 0,
+      assertions: [],
+      facts: null,
+      counts: null,
+      score: null,
+      flagged: [],
+      error: null
+    };
+    function assert(name, pass, detail) {
+      result.assertions.push({ name: name, pass: !!pass, detail: detail || '' });
+      if (!pass) result.ok = false;
+    }
+
+    try {
+      if (!PE.Extractors || !PE.RuleEngine || !PE.Pipeline) {
+        throw new Error('PE modules not loaded (Extractors / RuleEngine / Pipeline)');
+      }
+      var fixtureUrl = (base || FIXTURES_BASE) + fx.file;
+      var text = await _loadText(fixtureUrl);
+
+      // Only DXF fixtures are supported by the deterministic Node-runnable
+      // path; PDF/DOCX rely on browser-only libs (pdf.js / mammoth).
+      var isDxf = /\.dxf$/i.test(fx.file);
+      if (!isDxf) {
+        throw new Error('SelfTest fixtures must be .dxf in this build (got "' + fx.file + '")');
+      }
+
+      var ext = PE.Extractors.fromDxf(text);
+      var facts = ext.facts || {};
+      facts.buildingType   = (fx.form_data && fx.form_data.buildingType) || facts.buildingType || 'Commercial';
+      facts.occupancyGroup = facts.occupancyGroup || (fx.expected && fx.expected.use_group) || 'B';
+
+      var packs    = await PE.Pipeline.selectPacks((fx.form_data && fx.form_data.buildingCode) || '2024 IBC', facts.buildingType);
+      var findings = PE.RuleEngine.evaluate(facts, packs, facts.buildingType, {});
+      var score    = PE.RuleEngine.score(findings);
+
+      var counts = { PASS: 0, REVIEW: 0, FLAGGED: 0 };
+      var flaggedIds = [];
+      findings.forEach(function (f) {
+        counts[f.status] = (counts[f.status] || 0) + 1;
+        if (f.status === 'FLAGGED') flaggedIds.push(f.id);
+      });
+
+      result.facts   = facts;
+      result.counts  = counts;
+      result.score   = score;
+      result.flagged = flaggedIds;
+      result.ok      = true;            // flips to false on any assertion failure
+
+      var exp = fx.expected || {};
+
+      assert('source matches', ext.source === exp.source,
+             'expected source=' + exp.source + ', got ' + ext.source);
+
+      var keys = _factKeysOf(facts);
+      assert('min facts extracted',
+             keys.length >= (exp.min_facts || 0),
+             'expected ≥' + (exp.min_facts || 0) + ', got ' + keys.length);
+
+      var missing = _missing(keys, exp.required_fact_keys);
+      assert('required fact keys present',
+             missing.length === 0,
+             missing.length ? 'missing: ' + missing.join(', ') : '');
+
+      if (exp.required_bool_flags) {
+        Object.keys(exp.required_bool_flags).forEach(function (flag) {
+          var want = exp.required_bool_flags[flag];
+          assert('bool flag ' + flag + '=' + want,
+                 facts[flag] === want,
+                 'got ' + JSON.stringify(facts[flag]));
+        });
+      }
+
+      var missingFlags = _missing(flaggedIds, exp.must_flag_ids);
+      assert('must-flag rule ids present',
+             missingFlags.length === 0,
+             missingFlags.length ? 'missing flags: ' + missingFlags.join(', ') : '');
+
+      var unexpectedFlags = (exp.must_not_flag_ids || []).filter(function (id) {
+        return flaggedIds.indexOf(id) !== -1;
+      });
+      assert('must-not-flag rule ids absent',
+             unexpectedFlags.length === 0,
+             unexpectedFlags.length ? 'unexpected flags: ' + unexpectedFlags.join(', ') : '');
+
+      ['FLAGGED', 'REVIEW', 'PASS'].forEach(function (s) {
+        if (exp.counts && exp.counts[s]) {
+          assert(s + ' count in band',
+                 _inBand(counts[s], exp.counts[s]),
+                 s + '=' + counts[s] + ' band=' + JSON.stringify(exp.counts[s]));
+        }
+      });
+
+      assert('score in band',
+             _inBand(score, exp.score_band),
+             'score=' + score + ' band=' + JSON.stringify(exp.score_band));
+
+    } catch (err) {
+      result.ok = false;
+      result.error = (err && err.message) ? err.message : String(err);
+      _log('error', 'fixture ' + fx.id + ' threw: ' + result.error);
+    }
+
+    result.durationMs = Math.round(_now() - t0);
+    return result;
+  }
+
+  /**
+   * Run all fixtures listed in `expected.json`. Resolves to a summary
+   * regardless of pass/fail — never rejects.
+   *
+   * @param {Object} [opts]
+   * @param {string} [opts.base]   Override fixtures base path (e.g. for tests).
+   * @param {Function} [opts.onProgress]   Called with (fxResult) per fixture.
+   */
+  async function run(opts) {
+    opts = opts || {};
+    var base = opts.base || FIXTURES_BASE;
+    var t0 = _now();
+    var results = [];
+    var fatal = null;
+
+    _log('info', 'SelfTest run start', { base: base });
+
+    var manifest;
+    try {
+      manifest = await _loadJson(base + 'expected.json');
+    } catch (e) {
+      fatal = 'Could not load expected.json: ' + (e && e.message);
+      _log('error', fatal);
+    }
+
+    if (manifest && Array.isArray(manifest.fixtures)) {
+      for (var i = 0; i < manifest.fixtures.length; i++) {
+        var fx = manifest.fixtures[i];
+        var r;
+        try {
+          r = await runFixture(fx, base);
+        } catch (e) {
+          r = { id: fx.id, ok: false, error: 'runFixture threw: ' + (e && e.message), assertions: [], facts: null, counts: null, score: null, flagged: [] };
+        }
+        results.push(r);
+        if (typeof opts.onProgress === 'function') {
+          try { opts.onProgress(r); } catch (e) { /* ignore */ }
+        }
+      }
+    }
+
+    var passed = results.filter(function (r) { return r.ok; }).length;
+    var summary = {
+      ok: !fatal && results.length > 0 && passed === results.length,
+      total: results.length,
+      passed: passed,
+      failed: results.length - passed,
+      manifestVersion: (manifest && manifest.version) || null,
+      fatal: fatal,
+      durationMs: Math.round(_now() - t0),
+      generatedAt: new Date().toISOString()
+    };
+
+    _log(summary.ok ? 'info' : 'warn', 'SelfTest run complete: ' + passed + '/' + results.length + ' passed', summary);
+
+    return { summary: summary, results: results };
+  }
+
+  return {
+    run: run,
+    runFixture: runFixture,
+    FIXTURES_BASE: FIXTURES_BASE
+  };
+}());
+
+if (typeof window !== 'undefined') window.PE = PE;
+else if (typeof global !== 'undefined') global.PE = PE;
diff --git a/tests/integration.pipeline.test.js b/tests/integration.pipeline.test.js
new file mode 100644
index 0000000..a5f1a9a
--- /dev/null
+++ b/tests/integration.pipeline.test.js
@@ -0,0 +1,111 @@
+/**
+ * End-to-end integration test for the upload → score path.
+ *
+ * Unlike `pipeline.test.js` (which mocks the extractor), this test wires
+ * the REAL `PE.Extractors`, `PE.RuleEngine`, `PE.Pipeline.selectPacks`,
+ * and `PE.SelfTest` modules together, runs them against the bundled
+ * fixtures in `assets/data/fixtures/selftest/`, and asserts each
+ * fixture's golden expectations.
+ *
+ * If this test stays green, the platform really does scan, evaluate,
+ * and score uploaded plans — the same code paths the in-app
+ * "Run Diagnostics" button hits.
+ */
+
+const test   = require('node:test');
+const assert = require('node:assert');
+const fs     = require('node:fs');
+const path   = require('node:path');
+
+const loader = require('./helpers/load');
+const { ROOT } = loader;
+
+// File-system fetch shim: lets self-test / pipeline modules `fetch()` rule
+// packs and fixtures from the repo on disk. Same pattern as pipeline.test.js.
+global.fetch = function (url) {
+  // Strip leading dots / origin so both 'assets/...' and './assets/...' resolve.
+  var rel = String(url).replace(/^.*?(assets\/)/, '$1');
+  var abs = path.join(ROOT, rel);
+  if (!fs.existsSync(abs)) {
+    return Promise.resolve({
+      ok: false, status: 404,
+      json: () => Promise.reject(new Error('not found')),
+      text: () => Promise.reject(new Error('not found'))
+    });
+  }
+  var body = fs.readFileSync(abs, 'utf8');
+  return Promise.resolve({
+    ok: true, status: 200,
+    json: () => Promise.resolve(JSON.parse(body)),
+    text: () => Promise.resolve(body)
+  });
+};
+
+loader.loadAll();
+loader.loadSource('assets/js/agent/pipeline.js');
+loader.loadSource('assets/js/agent/self-test.js');
+
+const PE = global.PE;
+
+test('SelfTest module is registered', () => {
+  assert.ok(PE.SelfTest, 'PE.SelfTest should be exported');
+  assert.ok(typeof PE.SelfTest.run === 'function');
+});
+
+test('SelfTest fixtures and expected.json exist on disk', () => {
+  const expectedPath = path.join(ROOT, 'assets/data/fixtures/selftest/expected.json');
+  assert.ok(fs.existsSync(expectedPath), 'expected.json must exist');
+  const manifest = JSON.parse(fs.readFileSync(expectedPath, 'utf8'));
+  assert.ok(Array.isArray(manifest.fixtures) && manifest.fixtures.length >= 3,
+    'manifest must declare ≥3 fixtures');
+  manifest.fixtures.forEach(fx => {
+    const fp = path.join(ROOT, 'assets/data/fixtures/selftest', fx.file);
+    assert.ok(fs.existsSync(fp), 'fixture missing on disk: ' + fx.file);
+  });
+});
+
+test('SelfTest.run() exercises real extractors → rule engine → score and all fixtures pass', async () => {
+  const { summary, results } = await PE.SelfTest.run();
+
+  // Print a per-fixture diagnostic line in case CI fails — makes triage trivial.
+  results.forEach(r => {
+    const failed = r.assertions.filter(a => !a.pass);
+    const detail = failed.length
+      ? '\n      ' + failed.map(a => '✗ ' + a.name + (a.detail ? ' — ' + a.detail : '')).join('\n      ')
+      : '';
+    // eslint-disable-next-line no-console
+    console.log(
+      '    [selftest] ' + r.id +
+      ' ok=' + r.ok +
+      ' score=' + r.score +
+      ' counts=' + JSON.stringify(r.counts) +
+      ' flagged=' + (r.flagged || []).length +
+      detail
+    );
+  });
+
+  assert.strictEqual(summary.fatal, null, 'fatal: ' + summary.fatal);
+  assert.ok(summary.total >= 3, 'expected ≥3 fixtures, got ' + summary.total);
+  assert.strictEqual(summary.failed, 0,
+    summary.failed + '/' + summary.total + ' fixtures failed (see console output above)');
+});
+
+test('Non-compliant fixture really produces FLAGGED findings (proves rule engine fires)', async () => {
+  const { results } = await PE.SelfTest.run();
+  const nc = results.find(r => r.id === 'non-compliant-assembly');
+  assert.ok(nc, 'non-compliant-assembly result must exist');
+  assert.ok(nc.flagged.length >= 3,
+    'non-compliant fixture should produce ≥3 FLAGGED findings; got ' + nc.flagged.length);
+  // The 28-in door width must be flagged (ADA-404.2.3 / IBC-1010.1).
+  const hasDoorFlag = nc.flagged.some(id => /1010|404\.2\.3/.test(id));
+  assert.ok(hasDoorFlag,
+    'expected door-width related FLAG; got: ' + nc.flagged.join(','));
+});
+
+test('Sparse fixture surfaces missing-evidence as REVIEW, never as silent PASS', async () => {
+  const { results } = await PE.SelfTest.run();
+  const sp = results.find(r => r.id === 'sparse-warehouse');
+  assert.ok(sp, 'sparse-warehouse result must exist');
+  assert.ok(sp.counts.REVIEW >= 10,
+    'sparse fixture should produce many REVIEW findings; got ' + sp.counts.REVIEW);
+});
diff --git a/tests/rules.schema.test.js b/tests/rules.schema.test.js
new file mode 100644
index 0000000..74db2f4
--- /dev/null
+++ b/tests/rules.schema.test.js
@@ -0,0 +1,25 @@
+/**
+ * Schema validation gate.
+ *
+ * Spawns `scripts/validate-rules.mjs` and asserts a clean exit. This test
+ * is the safety net that catches malformed rule packs (missing license,
+ * unknown check_fn, broken extends-chain, schema drift) before they reach
+ * production. Mirrors the validate-json CI job for local `npm test`.
+ */
+
+const test       = require('node:test');
+const assert     = require('node:assert');
+const { spawnSync } = require('node:child_process');
+const path       = require('node:path');
+
+const ROOT = path.resolve(__dirname, '..');
+
+test('scripts/validate-rules.mjs exits 0 (rule packs are schema-valid)', () => {
+  const r = spawnSync('node', ['scripts/validate-rules.mjs'], { cwd: ROOT, encoding: 'utf8' });
+  if (r.status !== 0) {
+    // eslint-disable-next-line no-console
+    console.log('--- validate-rules stdout ---\n' + r.stdout);
+    console.log('--- validate-rules stderr ---\n' + r.stderr);
+  }
+  assert.strictEqual(r.status, 0, 'validate-rules.mjs reported errors');
+});

From 000f7504d5c4b75553f30702e9f69280c0063b5f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 6 May 2026 02:47:36 +0000
Subject: [PATCH 2/2] Add perf/crash tests, diagnostics UI, log.exportRun,
 rules-report, status, health workflow

Agent-Logs-Url: https://github.com/DaScient-Intelligence/Plan-Examiner/sessions/594db8e5-858f-4cf8-ba13-0eb0a71df477

Co-authored-by: DaScient <25983786+DaScient@users.noreply.github.com>
---
 .github/workflows/ci.yml       |   2 +
 .github/workflows/health.yml   |  33 ++++++++++
 .gitignore                     |   3 +
 assets/js/agent/rule-engine.js |  19 +++++-
 assets/js/app.js               |  50 +++++++++++++++
 assets/js/utils/log.js         |  48 +++++++++++++++
 docs/RULES.md                  |  38 ++++++++++++
 index.html                     |  11 ++++
 package.json                   |   6 +-
 scripts/rules-report.mjs       | 108 +++++++++++++++++++++++++++++++++
 scripts/status.mjs             |  95 +++++++++++++++++++++++++++++
 sw.js                          |  27 ++++++++-
 tests/extractors.crash.test.js |  86 ++++++++++++++++++++++++++
 tests/pipeline.perf.test.js    |  92 ++++++++++++++++++++++++++++
 14 files changed, 615 insertions(+), 3 deletions(-)
 create mode 100644 .github/workflows/health.yml
 create mode 100644 docs/RULES.md
 create mode 100644 scripts/rules-report.mjs
 create mode 100644 scripts/status.mjs
 create mode 100644 tests/extractors.crash.test.js
 create mode 100644 tests/pipeline.perf.test.js

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 149ab97..0c4f75d 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -45,6 +45,8 @@ jobs:
           done
       - name: Validate rule packs (schema + envelope + check_fn refs)
         run: node scripts/validate-rules.mjs
+      - name: Verify docs/RULES.md is up to date
+        run: node scripts/rules-report.mjs --check
 
   check-links:
     name: Link Check
diff --git a/.github/workflows/health.yml b/.github/workflows/health.yml
new file mode 100644
index 0000000..9b22732
--- /dev/null
+++ b/.github/workflows/health.yml
@@ -0,0 +1,33 @@
+name: Health Check
+
+# Daily self-test against the bundled fixtures. Fails fast if the
+# extract → evaluate → score path regresses on a known-good plan.
+
+on:
+  schedule:
+    - cron: '17 6 * * *'        # 06:17 UTC daily
+  workflow_dispatch: {}
+
+permissions:
+  contents: read
+
+jobs:
+  selftest:
+    name: Self-test fixtures
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/setup-node@v6
+        with:
+          node-version: 20
+      - name: Run headless self-test
+        run: node scripts/status.mjs
+      - name: Upload status.json
+        if: always()
+        uses: actions/upload-artifact@v4
+        with:
+          name: status-json
+          path: status.json
+          if-no-files-found: warn
diff --git a/.gitignore b/.gitignore
index e2bc39a..8b4b4a5 100644
--- a/.gitignore
+++ b/.gitignore
@@ -16,6 +16,9 @@ dist/
 *.log
 *.tmp
 
+# Status / health-check output (regenerated by scripts/status.mjs)
+status.json
+
 # ── Private / owner-only artifacts ─────────────────────────────────────
 # The `private/` directory is for owner-only notes that must NOT be
 # committed (e.g., the plaintext list of donor emails that map to the
diff --git a/assets/js/agent/rule-engine.js b/assets/js/agent/rule-engine.js
index f57b2ae..cda9d3d 100644
--- a/assets/js/agent/rule-engine.js
+++ b/assets/js/agent/rule-engine.js
@@ -365,11 +365,21 @@ PE.RuleEngine = (function () {
     return merged;
   }
 
+  // Per-evaluate context memoization. Each `evaluate()` call sees a
+  // stable `facts` reference and one `packPlaceholders` per pack. We
+  // cache the derived context (occupancy, sprinklered flag, etc.) by
+  // (facts → placeholders) identity to avoid re-deriving it per rule.
+  // Cleared between top-level evaluate calls via _ctxCache reset.
+  var _ctxCache = null;
   function _buildContext(facts, placeholders) {
     facts = facts || {};
     placeholders = placeholders || {};
+    if (_ctxCache && _ctxCache.facts === facts) {
+      var hit = _ctxCache.byPlaceholders.get(placeholders);
+      if (hit) return hit;
+    }
     var occ = (facts.occupancyGroup || facts.useGroup || '').toString().toUpperCase();
-    return {
+    var ctx = {
       facts: facts,
       placeholders: placeholders,
       occupancy: occ,
@@ -377,7 +387,13 @@ PE.RuleEngine = (function () {
       construction: (facts.constructionType || placeholders.construction_type || '').toString(),
       stories: facts.stories || 1
     };
+    if (!_ctxCache || _ctxCache.facts !== facts) {
+      _ctxCache = { facts: facts, byPlaceholders: new Map() };
+    }
+    _ctxCache.byPlaceholders.set(placeholders, ctx);
+    return ctx;
   }
+  function _resetContextCache() { _ctxCache = null; }
 
   function _selectorMatches(sel, ctx) {
     var parts = sel.split('.');
@@ -470,6 +486,7 @@ PE.RuleEngine = (function () {
    */
   function evaluate(facts, packs, buildingType, opts) {
     opts = opts || {};
+    _resetContextCache();          // fresh per-call memo for derived context
     var globalPlaceholders = opts.placeholders || {};
     var raw = [];
     var L = (typeof window !== 'undefined' && window.PE && window.PE.Log) ? window.PE.Log : null;
diff --git a/assets/js/app.js b/assets/js/app.js
index 4d63dbe..60cbb66 100644
--- a/assets/js/app.js
+++ b/assets/js/app.js
@@ -729,6 +729,56 @@ PE.App = (function () {
       if (s) { s.textContent = 'Vision consent revoked.'; s.style.color = '#fbbf24'; }
     });
 
+    // ── Run Diagnostics ────────────────────────────────────────────
+    // Exercises the same extract → evaluate → score path the upload
+    // pipeline uses, against bundled fixtures. Provides non-developer
+    // verifiable proof that the scanner is functioning.
+    var stBtn  = document.getElementById('selfTestBtn');
+    var stOut  = document.getElementById('selfTestResults');
+    var stStat = document.getElementById('selfTestStatus');
+    if (stBtn && PE.SelfTest) stBtn.addEventListener('click', async function () {
+      stBtn.disabled = true;
+      var origLabel = stBtn.innerHTML;
+      stBtn.innerHTML = '<i class="fas fa-spinner fa-spin text-xs mr-1" aria-hidden="true"></i>Running…';
+      if (stStat) { stStat.textContent = 'Running self-test against bundled fixtures…'; stStat.style.color = '#94a3b8'; }
+      try {
+        var out = await PE.SelfTest.run();
+        var lines = [];
+        var ok = out.summary && out.summary.ok;
+        lines.push((ok ? '✅' : '❌') + ' ' + out.summary.passed + '/' + out.summary.total +
+                   ' fixtures passed (' + out.summary.durationMs + 'ms, manifest v' + (out.summary.manifestVersion || '?') + ')');
+        (out.results || []).forEach(function (r) {
+          var mark = r.ok ? '✓' : '✗';
+          lines.push('  ' + mark + ' ' + r.id + ' — score ' + r.score +
+                     ', ' + (r.counts ? (r.counts.FLAGGED + ' flagged, ' + r.counts.REVIEW + ' review, ' + r.counts.PASS + ' pass') : 'n/a') +
+                     ' (' + r.durationMs + 'ms)');
+          if (!r.ok) {
+            (r.assertions || []).filter(function (a) { return !a.pass; }).forEach(function (a) {
+              lines.push('       • ' + a.name + (a.detail ? ' — ' + a.detail : ''));
+            });
+            if (r.error) lines.push('       error: ' + r.error);
+          }
+        });
+        if (stOut) {
+          stOut.style.display = 'block';
+          stOut.textContent = lines.join('\n');
+          stOut.style.borderColor = ok ? 'rgba(52,211,153,.35)' : 'rgba(248,113,113,.35)';
+        }
+        if (stStat) {
+          stStat.textContent = ok
+            ? '✓ Scanner verified — all ' + out.summary.total + ' fixtures passed in ' + out.summary.durationMs + 'ms.'
+            : '✗ ' + out.summary.failed + ' of ' + out.summary.total + ' fixtures failed (see details).';
+          stStat.style.color = ok ? '#34d399' : '#f87171';
+        }
+      } catch (e) {
+        if (stOut) { stOut.style.display = 'block'; stOut.textContent = 'Diagnostics failed: ' + (e && e.message ? e.message : String(e)); }
+        if (stStat) { stStat.textContent = '✗ Diagnostics threw an error.'; stStat.style.color = '#f87171'; }
+      } finally {
+        stBtn.disabled = false;
+        stBtn.innerHTML = origLabel;
+      }
+    });
+
     // Vision consent modal wiring.
     var vcOverlay = document.getElementById('visionConsentOverlay');
     if (vcOverlay) {
diff --git a/assets/js/utils/log.js b/assets/js/utils/log.js
index 9395957..f42eb01 100644
--- a/assets/js/utils/log.js
+++ b/assets/js/utils/log.js
@@ -236,6 +236,52 @@ PE.Log = (function () {
     }).join('\n');
   }
 
+  /**
+   * Filter the buffer to entries that mention `runId` in their data
+   * payload. Useful for the "Download diagnostic bundle" support flow.
+   * If no runId is provided, returns all entries.
+   */
+  function entriesForRun(runId) {
+    if (!runId) return _buffer.slice();
+    return _buffer.filter(function (e) {
+      if (!e || !e.data) return false;
+      // PE.Pipeline stamps `runId` on its boot/complete entries; rule-engine
+      // and extractor entries don't, so the "for this run" view is a
+      // best-effort filter centered on the pipeline lifecycle.
+      try {
+        var s = JSON.stringify(e.data);
+        return s.indexOf(runId) !== -1;
+      } catch (x) { return false; }
+    });
+  }
+
+  /**
+   * Build a self-contained, redacted JSON diagnostic bundle suitable for
+   * attaching to a support ticket. Includes:
+   *   - bundle metadata (schema version, generated timestamp)
+   *   - environment fingerprint (UA, app version if known)
+   *   - the run's structured log entries
+   *   - any caller-supplied summary (file metadata, score, findings, facts)
+   *
+   * No raw file contents, no API keys (already redacted by _redactString
+   * applied at record time). Safe to share.
+   */
+  function exportRun(runId, extras) {
+    var bundle = {
+      schema:      'plan-examiner.diagnostic-bundle',
+      schemaVersion: 1,
+      generatedAt: new Date().toISOString(),
+      runId:       runId || null,
+      env: {
+        userAgent: (typeof navigator !== 'undefined' && navigator.userAgent) || 'n/a',
+        engineVersion: (typeof window !== 'undefined' && window.PE && window.PE.Pipeline && window.PE.Pipeline.ENGINE_VERSION) || null
+      },
+      log: entriesForRun(runId),
+      run: extras || null
+    };
+    return bundle;
+  }
+
   // ── Init ─────────────────────────────────────────────────────────────
   _enabled = _resolveEnabled();
   _consoleLevel = _enabled ? LEVELS.debug : LEVELS.warn;
@@ -261,6 +307,8 @@ PE.Log = (function () {
     trace:      trace,
     group:      group,
     entries:    entries,
+    entriesForRun: entriesForRun,
+    exportRun:  exportRun,
     clear:      clear,
     subscribe:  subscribe,
     formatText: formatText
diff --git a/docs/RULES.md b/docs/RULES.md
new file mode 100644
index 0000000..b706717
--- /dev/null
+++ b/docs/RULES.md
@@ -0,0 +1,38 @@
+<!-- Auto-generated by scripts/rules-report.mjs. Do not edit by hand. -->
+# Plan-Examiner Rule-Pack Inventory
+
+Generated: 2026-05-06  
+Total packs: **23** &middot; Total rules: **153** &middot; Disabled: 0 &middot; Experimental: 8
+
+| Pack | Version | Schema | Category | License | Rules | Disabled | Experimental | Extends | Applies To | Indexed |
+|------|---------|--------|----------|---------|------:|---------:|-------------:|---------|------------|:-------:|
+| `a117-1-2017` (ICC A117.1-2017 Accessible & Usable Buildings and Facilities) | 2017 | 3.0.0 | accessibility | reference-only | 4 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `aba-2015` (Architectural Barriers Act Accessibility Standards) | 2015 | 3.0.0 | accessibility | public-domain | 4 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `ada-2010` (ADA Standards for Accessible Design 2010) | 2010 | 3.0.0 | accessibility | public-domain | 38 | 0 | 1 | — | 2024 IBC, Local, Other | ✅ |
+| `cbc-title24-2022` (California Building Code (Title 24, Part 2) 2022) | 2022 | 3.0.0 | local | state-law | 3 | 0 | 0 | ibc-2021 | Local | ✅ |
+| `chicago-bc-2022` (Chicago Construction Codes 2022) | 2022 | 3.0.0 | local | state-law | 1 | 0 | 0 | ibc-2021 | Local | ✅ |
+| `fhag` (Fair Housing Act Design Manual) | 1998 (rev.) | 3.0.0 | fair-housing | public-domain | 7 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `ibc-2021` (International Building Code 2021) | 2021 | 3.0.0 | building | reference-only | 29 | 0 | 3 | — | 2024 IBC, 2021 IBC, Local, Other | ✅ |
+| `ibc-2024` (International Building Code 2024) | 2024 | 3.0.0 | building | reference-only | 3 | 0 | 0 | ibc-2021 | 2024 IBC, Local, Other | ✅ |
+| `iebc-2021` (International Existing Building Code 2021) | 2021 | 3.0.0 | existing-buildings | reference-only | 5 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `iecc-2021` (International Energy Conservation Code 2021) | 2021 | 3.0.0 | energy | reference-only | 4 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `ifc-2021` (International Fire Code 2021) | 2021 | 3.0.0 | fire | reference-only | 5 | 0 | 2 | — | 2024 IBC, Local, Other | ✅ |
+| `imc-2021` (International Mechanical Code 2021) | 2021 | 3.0.0 | mechanical | reference-only | 3 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `ipc-2021` (International Plumbing Code 2021) | 2021 | 3.0.0 | plumbing | reference-only | 3 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `irc-2021` (International Residential Code 2021) | 2021 | 3.0.0 | residential | reference-only | 7 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `nfpa-1-2024` (NFPA 1 Fire Code 2024) | 2024 | 3.0.0 | fire | reference-only | 2 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `nfpa-101-2024` (NFPA 101 Life Safety Code 2024) | 2024 | 3.0.0 | life-safety | reference-only | 1 | 0 | 0 | nfpa-101 | 2024 IBC, Local, Other | ✅ |
+| `nfpa-101` (NFPA 101 Life Safety Code 2021) | 2021 | 3.0.0 | life-safety | reference-only | 15 | 0 | 2 | — | 2024 IBC, Local, Other | ✅ |
+| `nfpa-13-2022` (NFPA 13 Standard for the Installation of Sprinkler Systems) | 2022 | 3.0.0 | fire | reference-only | 3 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `nfpa-72-2022` (NFPA 72 National Fire Alarm and Signaling Code) | 2022 | 3.0.0 | fire | reference-only | 3 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `nfpa-80-2022` (NFPA 80 Standard for Fire Doors and Other Opening Protectives) | 2022 | 3.0.0 | fire | reference-only | 2 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `nyc-bc-2022` (New York City Building Code 2022) | 2022 | 3.0.0 | local | state-law | 2 | 0 | 0 | ibc-2021 | Local | ✅ |
+| `osha-1910-subpart-d` (OSHA 29 CFR 1910 Subpart D – Walking-Working Surfaces) | 2017 | 3.0.0 | occupational-safety | public-domain | 5 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+| `osha-1910-subpart-e` (OSHA 29 CFR 1910 Subpart E – Means of Egress / Emergency Plans) | 2002 | 3.0.0 | occupational-safety | public-domain | 4 | 0 | 0 | — | 2024 IBC, Local, Other | ✅ |
+
+## Notes
+
+- **Indexed** = listed in `assets/data/rules/index.json` and exposed to the UI.
+- **Extends** packs inherit and override rules from their parent.
+- Run `node scripts/validate-rules.mjs` to confirm every pack is schema-valid and references known check functions.
+- Run `node scripts/rules-report.mjs` to regenerate this file (CI fails if it goes stale).
diff --git a/index.html b/index.html
index 2fa5c5e..d52b0b3 100644
--- a/index.html
+++ b/index.html
@@ -802,6 +802,16 @@ <h2 class="font-display font-bold text-white text-lg flex items-center gap-3">
           <p id="llmTestStatus" class="text-xs flex-1" style="color:#64748b;min-height:1em;"></p>
         </div>
 
+        <!-- Run Diagnostics: a non-developer-runnable proof that the
+             extract → score path is functioning end-to-end. -->
+        <div class="glass rounded-xl p-4" style="border:1px solid rgba(56,189,248,.18);">
+          <div class="flex items-center gap-2">
+            <button type="button" id="selfTestBtn" class="btn-ghost" style="padding:10px 16px;font-size:.8rem;flex-shrink:0;"><i class="fas fa-stethoscope text-xs mr-1" aria-hidden="true"></i>Run Diagnostics</button>
+            <p id="selfTestStatus" class="text-xs flex-1" style="color:#64748b;min-height:1em;">Runs the scanner against bundled fixtures &mdash; proves uploads really get scored.</p>
+          </div>
+          <pre id="selfTestResults" class="mt-3" style="display:none;background:rgba(0,0,0,.25);border:1px solid rgba(255,255,255,.06);border-radius:8px;padding:10px;font-family:'ui-monospace',monospace;font-size:.7rem;line-height:1.5;max-height:240px;overflow-y:auto;color:#94a3b8;white-space:pre-wrap;"></pre>
+        </div>
+
         <p id="aiSaveStatus" class="text-xs" style="color:#64748b;min-height:1em;"></p>
         <div class="flex gap-3">
           <button type="submit" class="btn-accent flex-1 justify-center" style="padding:12px;"><i class="fas fa-floppy-disk text-xs" aria-hidden="true"></i> Save Configuration</button>
@@ -943,6 +953,7 @@ <h3 class="font-display font-bold text-white text-lg">Keyboard Shortcuts</h3>
 <script src="assets/js/agent/extractors.js"></script>
 <script src="assets/js/agent/llm-bridge.js"></script>
 <script src="assets/js/agent/pipeline.js"></script>
+<script src="assets/js/agent/self-test.js"></script>
 <script src="assets/js/utils/history.js"></script>
 <script src="assets/js/utils/export.js"></script>
 <script src="assets/js/app.js"></script>
diff --git a/package.json b/package.json
index 666e03a..cf098fe 100644
--- a/package.json
+++ b/package.json
@@ -13,7 +13,11 @@
     "build:css": "tailwindcss -i ./assets/css/styles.input.css -o ./assets/css/styles.css --minify",
     "dev:css": "tailwindcss -i ./assets/css/styles.input.css -o ./assets/css/styles.css --watch",
     "serve": "npx serve . -p 3000",
-    "test": "node --test tests/"
+    "test": "node --test tests/",
+    "validate:rules": "node scripts/validate-rules.mjs",
+    "rules:report": "node scripts/rules-report.mjs",
+    "rules:report:check": "node scripts/rules-report.mjs --check",
+    "status": "node scripts/status.mjs"
   },
   "dependencies": {
     "dotenv": "^17.4.2",
diff --git a/scripts/rules-report.mjs b/scripts/rules-report.mjs
new file mode 100644
index 0000000..11a2bb4
--- /dev/null
+++ b/scripts/rules-report.mjs
@@ -0,0 +1,108 @@
+#!/usr/bin/env node
+/**
+ * scripts/rules-report.mjs
+ *
+ * Generates a human-readable inventory of every rule pack in
+ * `assets/data/rules/` and writes it to `docs/RULES.md`. Run in CI
+ * alongside `validate-rules.mjs` so PRs that change packs always update
+ * the published inventory.
+ *
+ * Usage:
+ *   node scripts/rules-report.mjs           # writes docs/RULES.md
+ *   node scripts/rules-report.mjs --check   # exits 1 if docs/RULES.md is stale
+ */
+
+import { readdirSync, readFileSync, writeFileSync, existsSync, mkdirSync } from 'node:fs';
+import { resolve, dirname, join } from 'node:path';
+import { fileURLToPath } from 'node:url';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const ROOT      = resolve(__dirname, '..');
+const RULES_DIR = join(ROOT, 'assets', 'data', 'rules');
+const DOCS_DIR  = join(ROOT, 'docs');
+const OUT_PATH  = join(DOCS_DIR, 'RULES.md');
+
+const checkOnly = process.argv.includes('--check');
+
+function readJson(p) { return JSON.parse(readFileSync(p, 'utf8')); }
+
+const indexJson = readJson(join(RULES_DIR, 'index.json'));
+const indexById = new Map((indexJson.packs || []).map(p => [p.id, p]));
+
+const packFiles = readdirSync(RULES_DIR)
+  .filter(f => f.endsWith('.json') && f !== 'index.json')
+  .sort();
+
+const rows = [];
+let totalRules = 0, totalDisabled = 0, totalExperimental = 0;
+
+for (const f of packFiles) {
+  const pack = readJson(join(RULES_DIR, f));
+  const idx  = indexById.get(pack.id) || {};
+  const rules = Array.isArray(pack.rules) ? pack.rules : [];
+  const disabled     = rules.filter(r => r.disabled).length;
+  const experimental = rules.filter(r => r.experimental).length;
+  totalRules        += rules.length;
+  totalDisabled     += disabled;
+  totalExperimental += experimental;
+
+  const appliesTo = Array.isArray(idx.applies_to_codes) ? idx.applies_to_codes.join(', ')
+    : (Array.isArray(pack.applies_to) ? pack.applies_to.join(', ') : '—');
+
+  rows.push({
+    id: pack.id,
+    name: pack.name,
+    version: pack.version || '?',
+    schemaVersion: pack.schema_version || '—',
+    category: pack.category || idx.category || '—',
+    license: pack.license || '—',
+    rules: rules.length,
+    disabled, experimental,
+    appliesTo,
+    inIndex: indexById.has(pack.id),
+    extends: pack.extends || '',
+    file: f
+  });
+}
+
+// Build markdown
+const lines = [];
+lines.push('<!-- Auto-generated by scripts/rules-report.mjs. Do not edit by hand. -->');
+lines.push('# Plan-Examiner Rule-Pack Inventory');
+lines.push('');
+lines.push(`Generated: ${new Date().toISOString().slice(0, 10)}  `);
+lines.push(`Total packs: **${rows.length}** &middot; Total rules: **${totalRules}** &middot; Disabled: ${totalDisabled} &middot; Experimental: ${totalExperimental}`);
+lines.push('');
+lines.push('| Pack | Version | Schema | Category | License | Rules | Disabled | Experimental | Extends | Applies To | Indexed |');
+lines.push('|------|---------|--------|----------|---------|------:|---------:|-------------:|---------|------------|:-------:|');
+for (const r of rows) {
+  lines.push(`| \`${r.id}\` (${r.name}) | ${r.version} | ${r.schemaVersion} | ${r.category} | ${r.license} | ${r.rules} | ${r.disabled} | ${r.experimental} | ${r.extends || '—'} | ${r.appliesTo} | ${r.inIndex ? '✅' : '❌'} |`);
+}
+lines.push('');
+lines.push('## Notes');
+lines.push('');
+lines.push('- **Indexed** = listed in `assets/data/rules/index.json` and exposed to the UI.');
+lines.push('- **Extends** packs inherit and override rules from their parent.');
+lines.push('- Run `node scripts/validate-rules.mjs` to confirm every pack is schema-valid and references known check functions.');
+lines.push('- Run `node scripts/rules-report.mjs` to regenerate this file (CI fails if it goes stale).');
+lines.push('');
+
+const out = lines.join('\n');
+
+if (checkOnly) {
+  if (!existsSync(OUT_PATH)) {
+    console.error('docs/RULES.md is missing. Run: node scripts/rules-report.mjs');
+    process.exit(1);
+  }
+  const current = readFileSync(OUT_PATH, 'utf8');
+  if (current.trim() !== out.trim()) {
+    console.error('docs/RULES.md is stale. Run: node scripts/rules-report.mjs');
+    process.exit(1);
+  }
+  console.log('docs/RULES.md is up to date.');
+  process.exit(0);
+}
+
+if (!existsSync(DOCS_DIR)) mkdirSync(DOCS_DIR, { recursive: true });
+writeFileSync(OUT_PATH, out, 'utf8');
+console.log(`Wrote ${OUT_PATH} (${rows.length} packs, ${totalRules} rules).`);
diff --git a/scripts/status.mjs b/scripts/status.mjs
new file mode 100644
index 0000000..496d20a
--- /dev/null
+++ b/scripts/status.mjs
@@ -0,0 +1,95 @@
+#!/usr/bin/env node
+/**
+ * scripts/status.mjs
+ *
+ * Headless health check. Runs the same `PE.SelfTest.run()` the in-app
+ * "Run Diagnostics" button uses, against the bundled fixtures, and
+ * writes a `status.json` summary plus exits non-zero on failure.
+ *
+ * Designed for:
+ *   - Scheduled GitHub Actions health checks
+ *   - Local "is the engine OK?" sanity command (`npm run status`)
+ *
+ * No browser-only APIs are used: the helper test loader installs
+ * minimal `window`/`localStorage`/`crypto` shims, and a file-system
+ * fetch shim resolves `assets/...` URLs to disk.
+ */
+
+import { readFileSync, writeFileSync, existsSync } from 'node:fs';
+import { resolve, dirname, join } from 'node:path';
+import { fileURLToPath } from 'node:url';
+import { createRequire } from 'node:module';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const ROOT      = resolve(__dirname, '..');
+
+// Use require() to load the existing CommonJS test loader.
+const require_ = createRequire(import.meta.url);
+const loader   = require_(join(ROOT, 'tests', 'helpers', 'load.js'));
+
+// File-system fetch shim (same pattern as the integration test).
+global.fetch = function (url) {
+  const rel = String(url).replace(/^.*?(assets\/)/, '$1');
+  const abs = join(loader.ROOT, rel);
+  if (!existsSync(abs)) {
+    return Promise.resolve({
+      ok: false, status: 404,
+      json: () => Promise.reject(new Error('not found')),
+      text: () => Promise.reject(new Error('not found'))
+    });
+  }
+  const body = readFileSync(abs, 'utf8');
+  return Promise.resolve({
+    ok: true, status: 200,
+    json: () => Promise.resolve(JSON.parse(body)),
+    text: () => Promise.resolve(body)
+  });
+};
+
+loader.loadAll();
+loader.loadSource('assets/js/agent/pipeline.js');
+loader.loadSource('assets/js/agent/self-test.js');
+
+const PE = global.PE;
+
+const startedAt = new Date().toISOString();
+const { summary, results } = await PE.SelfTest.run();
+
+const status = {
+  schema: 'plan-examiner.status',
+  schemaVersion: 1,
+  startedAt,
+  finishedAt: new Date().toISOString(),
+  ok: summary.ok,
+  summary,
+  fixtures: results.map(r => ({
+    id: r.id, file: r.file, ok: r.ok,
+    durationMs: r.durationMs, score: r.score, counts: r.counts,
+    flagged: r.flagged,
+    failedAssertions: (r.assertions || []).filter(a => !a.pass)
+  })),
+  engine: {
+    engineVersion: (PE.Pipeline && PE.Pipeline.ENGINE_VERSION) || null,
+    rulesIndexVersion: (() => {
+      try { return JSON.parse(readFileSync(join(ROOT, 'assets/data/rules/index.json'), 'utf8')).version; }
+      catch (e) { return null; }
+    })()
+  }
+};
+
+const outPath = join(ROOT, 'status.json');
+writeFileSync(outPath, JSON.stringify(status, null, 2) + '\n', 'utf8');
+
+const ok = summary.ok ? '✅' : '❌';
+console.log(`${ok} ${summary.passed}/${summary.total} fixtures passed (${summary.durationMs}ms)`);
+console.log(`Wrote ${outPath}`);
+
+if (!summary.ok) {
+  results.filter(r => !r.ok).forEach(r => {
+    console.error(`  ✗ ${r.id}${r.error ? ' — ' + r.error : ''}`);
+    (r.assertions || []).filter(a => !a.pass).forEach(a => {
+      console.error(`      • ${a.name}${a.detail ? ' — ' + a.detail : ''}`);
+    });
+  });
+  process.exit(1);
+}
diff --git a/sw.js b/sw.js
index 8ce3a80..d2239a4 100644
--- a/sw.js
+++ b/sw.js
@@ -3,7 +3,7 @@
  * Caches static assets for offline use (PWA).
  */
 
-var CACHE_NAME = 'plan-examiner-v4';
+var CACHE_NAME = 'plan-examiner-v5';
 var STATIC_ASSETS = [
   '/',
   '/index.html',
@@ -13,13 +13,38 @@ var STATIC_ASSETS = [
   '/assets/js/agent/extractors.js',
   '/assets/js/agent/llm-bridge.js',
   '/assets/js/agent/pipeline.js',
+  '/assets/js/agent/self-test.js',
   '/assets/js/utils/log.js',
   '/assets/js/utils/history.js',
   '/assets/js/utils/export.js',
   '/assets/data/rules/index.json',
   '/assets/data/rules/ibc-2021.json',
+  '/assets/data/rules/ibc-2024.json',
+  '/assets/data/rules/irc-2021.json',
+  '/assets/data/rules/iebc-2021.json',
+  '/assets/data/rules/iecc-2021.json',
+  '/assets/data/rules/imc-2021.json',
+  '/assets/data/rules/ipc-2021.json',
+  '/assets/data/rules/ifc-2021.json',
   '/assets/data/rules/ada-2010.json',
+  '/assets/data/rules/aba-2015.json',
+  '/assets/data/rules/a117-1-2017.json',
+  '/assets/data/rules/fhag.json',
+  '/assets/data/rules/nfpa-1-2024.json',
+  '/assets/data/rules/nfpa-13-2022.json',
+  '/assets/data/rules/nfpa-72-2022.json',
+  '/assets/data/rules/nfpa-80-2022.json',
   '/assets/data/rules/nfpa-101.json',
+  '/assets/data/rules/nfpa-101-2024.json',
+  '/assets/data/rules/osha-1910-subpart-d.json',
+  '/assets/data/rules/osha-1910-subpart-e.json',
+  '/assets/data/rules/cbc-title24-2022.json',
+  '/assets/data/rules/nyc-bc-2022.json',
+  '/assets/data/rules/chicago-bc-2022.json',
+  '/assets/data/fixtures/selftest/expected.json',
+  '/assets/data/fixtures/selftest/clean-office.dxf',
+  '/assets/data/fixtures/selftest/non-compliant-assembly.dxf',
+  '/assets/data/fixtures/selftest/sparse-warehouse.dxf',
   '/manifest.json',
   '/404.html'
 ];
diff --git a/tests/extractors.crash.test.js b/tests/extractors.crash.test.js
new file mode 100644
index 0000000..8120495
--- /dev/null
+++ b/tests/extractors.crash.test.js
@@ -0,0 +1,86 @@
+/**
+ * Crash-resilience matrix for the extractor and rule engine.
+ *
+ * Each scenario must surface a structured outcome — never throw an
+ * uncaught error, never produce a misleading PASS, never produce a
+ * silently empty result. Together they prove the upload path is robust
+ * to corrupt/edge-case input.
+ */
+
+const test   = require('node:test');
+const assert = require('node:assert');
+
+const loader = require('./helpers/load');
+loader.loadAll();
+const PE = global.PE;
+
+test('parse() on empty string returns flags-only object (no crash)', () => {
+  const f = PE.Extractors.parse('');
+  assert.ok(f && typeof f === 'object');
+  // The bool flags are always assigned (null when neither truthy nor falsy fires).
+  assert.ok(Object.prototype.hasOwnProperty.call(f, 'hasSprinklers'));
+});
+
+test('parse() on garbage / binary-ish input degrades gracefully', () => {
+  const garbage = String.fromCharCode(0, 0, 0xff, 0xfe, 0xfd) + 'NOT A PLAN';
+  const f = PE.Extractors.parse(garbage);
+  // No fact key like grossArea should be falsely populated.
+  assert.strictEqual(f.grossArea, undefined);
+  assert.strictEqual(f.occupantLoad, undefined);
+});
+
+test('fromDxf() with no SECTION/ENTITIES still returns a valid result envelope', () => {
+  const r = PE.Extractors.fromDxf('THIS IS NOT A DXF FILE\n');
+  assert.strictEqual(r.source, 'dxf');
+  assert.ok(r.facts && typeof r.facts === 'object');
+  assert.ok(Array.isArray(r.layers));
+  assert.strictEqual(r.lineCount, 0);
+});
+
+test('fromDxf() on empty string returns empty layers/lines (no throw)', () => {
+  const r = PE.Extractors.fromDxf('');
+  assert.strictEqual(r.source, 'dxf');
+  assert.deepStrictEqual(r.layers, []);
+  assert.strictEqual(r.lineCount, 0);
+  assert.strictEqual(r.textEntities, 0);
+});
+
+test('RuleEngine.evaluate() with empty facts produces only REVIEW + PASS, never throws', async () => {
+  // Load a tiny synthetic pack inline to sidestep filesystem.
+  const pack = {
+    id: 'tiny', name: 'Tiny', version: '1.0.0',
+    rules: [
+      { id: 'tiny.egress', code_section: 'X.1', label: 'egress width',
+        applies_to: ['Commercial', 'Other'], check_fn: 'egress_width',
+        parameters: { min_inches: 36, corridor_min_inches: 44 } },
+      { id: 'tiny.unknown', code_section: 'X.2', label: 'unknown fn',
+        applies_to: ['Commercial', 'Other'], check_fn: 'NOT_A_REAL_FN' }
+    ]
+  };
+  const findings = PE.RuleEngine.evaluate({}, [pack], 'Commercial', {});
+  assert.ok(Array.isArray(findings));
+  findings.forEach(f => {
+    assert.ok(['PASS', 'REVIEW', 'FLAGGED'].includes(f.status), 'invalid status: ' + f.status);
+  });
+  // Unknown check_fn must degrade to REVIEW, not crash.
+  const u = findings.find(x => x.id === 'tiny.unknown');
+  assert.ok(u, 'unknown-fn rule should still emit a finding');
+  assert.strictEqual(u.status, 'REVIEW');
+});
+
+test('RuleEngine.evaluate() never produces a finding outside the {PASS,REVIEW,FLAGGED} domain', () => {
+  const pack = {
+    id: 'tiny2', name: 'Tiny2', version: '1.0.0',
+    rules: [{ id: 'tiny.bad', code_section: 'X.3', label: 'broken check',
+              applies_to: ['Commercial', 'Other'], check_fn: 'egress_width',
+              parameters: null /* null params can throw inside the check */ }]
+  };
+  const findings = PE.RuleEngine.evaluate({}, [pack], 'Commercial', {});
+  findings.forEach(f => {
+    assert.ok(['PASS', 'REVIEW', 'FLAGGED'].includes(f.status));
+  });
+});
+
+test('RuleEngine.score() handles empty array (returns 100)', () => {
+  assert.strictEqual(PE.RuleEngine.score([]), 100);
+});
diff --git a/tests/pipeline.perf.test.js b/tests/pipeline.perf.test.js
new file mode 100644
index 0000000..d426039
--- /dev/null
+++ b/tests/pipeline.perf.test.js
@@ -0,0 +1,92 @@
+/**
+ * Performance / SLA budget enforcement.
+ *
+ * Runs every selftest fixture through the deterministic extract+evaluate
+ * path and verifies each step completes under its `PE.Pipeline.SLA`
+ * budget. The budgets are real-world targets — not microbenchmarks — so
+ * even a slow CI runner should clear them comfortably.
+ *
+ * If this test fails, the engine has regressed (or a rule pack has
+ * exploded) and the upload UX is degrading. Fix it, don't relax the
+ * budget casually.
+ */
+
+const test   = require('node:test');
+const assert = require('node:assert');
+const fs     = require('node:fs');
+const path   = require('node:path');
+
+const loader = require('./helpers/load');
+const { ROOT } = loader;
+
+global.fetch = function (url) {
+  var rel = String(url).replace(/^.*?(assets\/)/, '$1');
+  var abs = path.join(ROOT, rel);
+  if (!fs.existsSync(abs)) return Promise.resolve({ ok: false, status: 404 });
+  var body = fs.readFileSync(abs, 'utf8');
+  return Promise.resolve({
+    ok: true, status: 200,
+    json: () => Promise.resolve(JSON.parse(body)),
+    text: () => Promise.resolve(body)
+  });
+};
+
+loader.loadAll();
+loader.loadSource('assets/js/agent/pipeline.js');
+loader.loadSource('assets/js/agent/self-test.js');
+
+const PE = global.PE;
+
+test('PE.Pipeline.SLA exposes per-step + total budgets', () => {
+  assert.ok(PE.Pipeline.SLA, 'SLA must be exported');
+  ['ingest', 'extract', 'select', 'evaluate', 'cite', 'total'].forEach(k => {
+    assert.strictEqual(typeof PE.Pipeline.SLA[k], 'number', 'SLA.' + k + ' must be a number');
+    assert.ok(PE.Pipeline.SLA[k] > 0, 'SLA.' + k + ' must be > 0');
+  });
+});
+
+test('Selftest fixtures run end-to-end well under their SLA budgets', async () => {
+  // The integration path is not the full pipeline (no PDF.js / file I/O),
+  // so the relevant budgets are extract + select + evaluate. We give each
+  // fixture 3× headroom over the per-step SLA so a noisy CI runner won't
+  // cause a flake; real prod traces will be much faster.
+  const SLA = PE.Pipeline.SLA;
+  const ceiling = (SLA.extract + SLA.select + SLA.evaluate) * 3;
+
+  const { results } = await PE.SelfTest.run();
+  assert.ok(results.length >= 3);
+
+  results.forEach(r => {
+    assert.ok(r.durationMs < ceiling,
+      'fixture ' + r.id + ' took ' + r.durationMs + 'ms (ceiling ' + ceiling + 'ms)');
+  });
+});
+
+test('selectPacks() completes well within SLA.select on its own', async () => {
+  const t0 = Date.now();
+  const packs = await PE.Pipeline.selectPacks('2024 IBC', 'Commercial');
+  const ms = Date.now() - t0;
+  assert.ok(packs.length > 0, 'must load ≥1 pack');
+  // 4× headroom — still keeps us honest.
+  assert.ok(ms < PE.Pipeline.SLA.select * 4,
+    'selectPacks took ' + ms + 'ms (SLA ' + PE.Pipeline.SLA.select + 'ms)');
+});
+
+test('evaluate() of typical fact bundle finishes under SLA.evaluate', async () => {
+  const facts = {
+    grossArea: 12000, occupantLoad: 80, stories: 2, buildingHeightFt: 24,
+    corridorWidthInches: 48, doorWidthInches: 36,
+    stairTreadDepthIn: 11, stairRiserHeightIn: 7, stairWidthInches: 44,
+    totalParkingSpaces: 40, accessibleParkingSpaces: 2,
+    occupancyGroup: 'B', buildingType: 'Commercial',
+    hasSprinklers: true, hasFireAlarm: true, hasExitSigns: true,
+    hasEmergencyLighting: true, hasHandrails: true
+  };
+  const packs = await PE.Pipeline.selectPacks('2024 IBC', 'Commercial');
+  const t0 = Date.now();
+  const findings = PE.RuleEngine.evaluate(facts, packs, 'Commercial', {});
+  const ms = Date.now() - t0;
+  assert.ok(findings.length > 0, 'should produce findings');
+  assert.ok(ms < PE.Pipeline.SLA.evaluate * 4,
+    'evaluate took ' + ms + 'ms (SLA ' + PE.Pipeline.SLA.evaluate + 'ms)');
+});