ShadyUnderLight · ShadyUnderLight · May 12, 2026 · May 11, 2026
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -19,6 +19,7 @@ jobs:
           python-version: "3.12"
       - run: python3 -m py_compile scripts/*.py
       - run: python3 scripts/validate_research_pack.py examples/research-pack-example.md
+      - run: python3 scripts/validate_research_pack.py examples/research-pack-example.md --strict
       - run: python3 scripts/test_validator_regression.py
       - run: python3 scripts/test_md_to_pdf_preflight.py
 

diff --git a/examples/research-pack-example.md b/examples/research-pack-example.md
@@ -40,18 +40,18 @@ Stop when the top choice, runner-up logic, and ranking-change conditions are sup
 - Live-search status: partially recovered
 
 ## Source register
-- Source: transport schedule / route information
+- [S01] Source: transport schedule / route information
   - Supports: travel feasibility and burden comparison
-- Source: venue / city logistics information
+- [S02] Source: venue / city logistics information
   - Supports: practical meetup suitability
-- Source: pricing or timing references
+- [S03] Source: pricing or timing references
   - Supports: cost and coordination burden
 
 ## Claim register
-- Claim: City A is the best default meetup choice under current assumptions.
+- Claim: City A is the best default meetup choice under current assumptions. [S01][S02]
   - Support: lower coordination burden across origins, stronger schedule fit
   - Confidence: medium
-- Claim: City B remains the strongest runner-up.
+- Claim: City B remains the strongest runner-up. [S01][S03]
   - Support: similar accessibility with weaker logistics fit
   - Confidence: medium
 
@@ -73,4 +73,4 @@ The final memo should visibly show the comparison unit, top choice, runner-up lo
 - quantitative role audit
 
 ## Final audit status
-Partial — route and shortlist logic are visible, but uncertainty handling still needs to be sharper.
+Pass
diff --git a/scripts/test_validator_regression.py b/scripts/test_validator_regression.py
@@ -148,6 +148,325 @@ def test_partial_heading_match(d: str) -> None:
     assert rc == 2, f"partial heading match: expected exit 2, got {rc}"
 
 
+# ─── Strict mode tests ────────────────────────────────────────────────────────
+
+STRICT_BASELINE = """\
+## Objective
+ok
+
+## Decision context
+ok
+
+## Primary route
+ok
+
+## Secondary disciplines
+ok
+
+## Core subquestions
+ok
+
+## Stop condition
+ok
+
+## Source register
+- [S01] A relevant source
+  - Supports: main claims
+
+## Claim register
+- Claim: main finding [S01]
+  - Support: strong
+  - Confidence: confirmed
+
+## Uncertainty register
+- Uncertainty: edge case
+  - Why it matters: could weaken conclusion
+
+## Artifact contract
+ok
+
+## Required audits
+ok
+
+## Final audit status
+Pass
+"""
+
+
+def run_strict(path: str) -> subprocess.CompletedProcess:
+    return subprocess.run(
+        [sys.executable, VALIDATOR, "--strict", path],
+        capture_output=True, text=True
+    )
+
+
+def test_strict_valid_baseline(d: str) -> None:
+    path = write(os.path.join(d, "strict_valid.md"), STRICT_BASELINE)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"strict valid baseline: expected 0, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_no_source_ids(d: str) -> None:
+    text = re.sub(
+        r"- \[S01\].*",
+        "- A relevant source",
+        STRICT_BASELINE, flags=re.MULTILINE
+    )
+    path = write(os.path.join(d, "no_ids.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"missing source IDs: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_undefined_source_ref(d: str) -> None:
+    text = re.sub(
+        r"main finding \[S01\]",
+        "main finding [S99]",
+        STRICT_BASELINE
+    )
+    path = write(os.path.join(d, "undefined.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"undefined source ref: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_unused_source_id(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "main finding [S01]",
+        "main finding (no ref)"
+    )
+    path = write(os.path.join(d, "unused.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"unused source IDs: expected exit 0 (warning), got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+    assert "Unused" in result.stdout, f"expected warning in output: {result.stdout}"
+
+
+def test_strict_audit_status_partial(d: str) -> None:
+    text = re.sub(
+        r"^## Final audit status\nPass",
+        "## Final audit status\nPartial",
+        STRICT_BASELINE, flags=re.MULTILINE
+    )
+    path = write(os.path.join(d, "partial.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"Partial audit status: expected exit 0 (warning), got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+    assert "Partial" in result.stdout, f"expected warning in output: {result.stdout}"
+
+
+def test_strict_audit_status_fail(d: str) -> None:
+    text = re.sub(
+        r"^## Final audit status\nPass",
+        "## Final audit status\nFail",
+        STRICT_BASELINE, flags=re.MULTILINE
+    )
+    path = write(os.path.join(d, "fail.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"Fail audit status: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_audit_status_invalid(d: str) -> None:
+    text = re.sub(
+        r"^## Final audit status\nPass",
+        "## Final audit status\nPending",
+        STRICT_BASELINE, flags=re.MULTILINE
+    )
+    path = write(os.path.join(d, "invalid.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"invalid audit status: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_claim_no_evidence(d: str) -> None:
+    text = STRICT_BASELINE.replace("main finding [S01]", "main finding")
+    path = write(os.path.join(d, "no_evidence.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"missing evidence tags: expected exit 0 (warning), got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+    assert "no evidence" in result.stdout.lower(), (
+        f"expected warning about missing evidence: {result.stdout}"
+    )
+
+
+def test_strict_partial_claim_missing_evidence(d: str) -> None:
+    text = re.sub(
+        r"(- Claim: main finding.*?)(?=\n## )",
+        r"\1\n- Claim: extra claim without evidence\n  - Support: guess\n  - Confidence: low",
+        STRICT_BASELINE, flags=re.DOTALL
+    )
+    path = write(os.path.join(d, "partial_evidence.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"partial claim missing evidence: expected exit 0 (warning), got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+    assert "Claim #2" in result.stdout, (
+        f"expected Claim #2 warning in output: {result.stdout}"
+    )
+
+
+def test_strict_claim_evidence_next_line(d: str) -> None:
+    text = re.sub(
+        r"- Claim: main finding \[S01\]\n  - Support: strong",
+        "- Claim: main finding\n  - Evidence: [S01]\n  - Support: strong",
+        STRICT_BASELINE
+    )
+    path = write(os.path.join(d, "evidence_next_line.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"claim evidence on next line: expected exit 0, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_fenced_code_ignored(d: str) -> None:
+    text = STRICT_BASELINE + "\n\n```\nExample [S99] in code block\n```\n"
+    path = write(os.path.join(d, "fenced.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"fenced code [S99]: expected exit 0, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_table_source_id(d: str) -> None:
+    text = re.sub(
+        r"- \[S01\].*",
+        "| S01 | A relevant source |",
+        STRICT_BASELINE
+    )
+    path = write(os.path.join(d, "table.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"table source ID: expected exit 0, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_malformed_source_id_single_digit(d: str) -> None:
+    text = STRICT_BASELINE.replace("[S01]", "[S1]")
+    path = write(os.path.join(d, "malformed1.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"malformed [S1]: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_malformed_source_id_triple_digit(d: str) -> None:
+    text = STRICT_BASELINE.replace("[S01]", "[S001]")
+    path = write(os.path.join(d, "malformed3.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"malformed [S001]: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_duplicate_source_id(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "- [S01] A relevant source",
+        "- [S01] First source\n- [S01] Duplicate source"
+    )
+    path = write(os.path.join(d, "duplicate.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"duplicate source ID: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_undefined_u_id(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "main finding [S01]",
+        "main finding [U99]"
+    )
+    path = write(os.path.join(d, "undefined_u.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"undefined U99: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_claim_inference_id_warns_only(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "main finding [S01]",
+        "main finding [I01]"
+    )
+    path = write(os.path.join(d, "inference.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 0, (
+        f"I01 in claim: expected exit 0 (warning), got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+    assert "Inference IDs" in result.stdout, (
+        f"expected Inference IDs warning in output: {result.stdout}"
+    )
+
+
+def test_strict_malformed_body_ref(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "main finding [S01]",
+        "main finding [S1]"
+    )
+    path = write(os.path.join(d, "malformed_body.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"malformed body ref [S1]: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_malformed_claim_ref(d: str) -> None:
+    text = STRICT_BASELINE.replace(
+        "main finding [S01]",
+        "main finding"
+    )
+    text = text.replace(
+        "- Claim: main finding",
+        "- Claim: main finding [S001]"
+    )
+    path = write(os.path.join(d, "malformed_claim.md"), text)
+    result = run_strict(path)
+    assert result.returncode == 4, (
+        f"malformed claim ref [S001]: expected exit 4, got {result.returncode}\n"
+        f"stdout: {result.stdout}"
+    )
+
+
+def test_strict_non_strict_ignores_strict_checks(d: str) -> None:
+    text = re.sub(
+        r"- \[S01\].*",
+        "- A relevant source",
+        STRICT_BASELINE, flags=re.MULTILINE
+    )
+    path = write(os.path.join(d, "non_strict.md"), text)
+    rc = run_validator(path)
+    assert rc == 0, (
+        f"non-strict mode should ignore source ID issues: expected 0, got {rc}"
+    )
+
+
 def main() -> int:
     with tempfile.TemporaryDirectory() as d:
         tests = [
@@ -159,6 +478,26 @@ def main() -> int:
             ("indented fence", test_indented_fence),
             ("sub-heading-only body", test_subheading_only_body),
             ("partial heading match", test_partial_heading_match),
+            ("strict valid baseline", test_strict_valid_baseline),
+            ("strict no source IDs", test_strict_no_source_ids),
+            ("strict undefined source ref", test_strict_undefined_source_ref),
+            ("strict unused source id (warning)", test_strict_unused_source_id),
+            ("strict audit status Partial (warning)", test_strict_audit_status_partial),
+            ("strict audit status Fail", test_strict_audit_status_fail),
+            ("strict audit status invalid", test_strict_audit_status_invalid),
+            ("strict claim no evidence (warning)", test_strict_claim_no_evidence),
+            ("strict partial claim missing evidence (warning)", test_strict_partial_claim_missing_evidence),
+            ("strict claim evidence on next line", test_strict_claim_evidence_next_line),
+            ("strict fenced code ignores [S99]", test_strict_fenced_code_ignored),
+            ("strict table S01 source ID", test_strict_table_source_id),
+            ("strict malformed [S1] single digit", test_strict_malformed_source_id_single_digit),
+            ("strict malformed [S001] triple digit", test_strict_malformed_source_id_triple_digit),
+            ("strict duplicate source ID", test_strict_duplicate_source_id),
+            ("strict undefined [U99] reference", test_strict_undefined_u_id),
+            ("strict I01 claim warns only", test_strict_claim_inference_id_warns_only),
+            ("strict malformed body ref [S1]", test_strict_malformed_body_ref),
+            ("strict malformed claim ref [S001]", test_strict_malformed_claim_ref),
+            ("non-strict ignores strict checks", test_strict_non_strict_ignores_strict_checks),
         ]
         failures = []
         for name, fn in tests: