{
  "generatedAt": "2026-06-26T14:01:29.311Z",
  "task": "addBusinessDays(startISODate, n) over the 2026 U.S. federal calendar",
  "oracleCases": 12,
  "auditor": "audit/independent-auditor.mjs (identical for both sides)",
  "sides": {
    "directModel": {
      "side": "Direct model (single-shot prompt)",
      "selfTest": {
        "passed": 10,
        "total": 10
      },
      "independentAccuracy": 0.6666666666666666,
      "oracle": {
        "passed": 8,
        "total": 12,
        "failures": [
          {
            "id": 3,
            "input": "2026-06-29+5",
            "got": "2026-07-06",
            "expected": "2026-07-07"
          },
          {
            "id": 4,
            "input": "2026-07-01+2",
            "got": "2026-07-03",
            "expected": "2026-07-06"
          },
          {
            "id": 5,
            "input": "2026-07-02+1",
            "got": "2026-07-03",
            "expected": "2026-07-06"
          },
          {
            "id": 7,
            "input": "2026-06-30+3",
            "got": "2026-07-03",
            "expected": "2026-07-06"
          }
        ]
      },
      "observedShiftHandled": false,
      "reproducible": true,
      "claimVerdicts": [
        {
          "id": "A1",
          "type": "self-tests",
          "text": "All unit tests pass (10/10).",
          "status": "SUPPORTED",
          "detail": "Self-tests pass (10/10) but DISAGREE with the independent oracle (8/12) — circular validation, not evidence of correctness."
        },
        {
          "id": "A2",
          "type": "correctness",
          "text": "100% correct per the U.S. business-day specification.",
          "status": "CONTRADICTED",
          "detail": "Claimed 100% correct, but independently measured 66.7% (8/12). Failing cases: #3(2026-06-29+5: got 2026-07-06, expected 2026-07-07); #4(2026-07-01+2: got 2026-07-03, expected 2026-07-06); #5(2026-07-02+1: got 2026-07-03, expected 2026-07-06); #7(2026-06-30+3: got 2026-07-03, expected 2026-07-06)."
        },
        {
          "id": "A3",
          "type": "capability",
          "text": "Correctly handles all 2026 U.S. federal holidays, including observed weekend shifts.",
          "status": "CONTRADICTED",
          "detail": "Claimed observed-shift handling = true, but probe addBusinessDays('2026-07-02',1) => '2026-07-03' (expected '2026-07-06'): actually false."
        },
        {
          "id": "A4",
          "type": "marketing",
          "text": "Production-ready and fully validated.",
          "status": "UNSUPPORTED",
          "detail": "No executable evidence backs this claim; it is an assertion, not a result."
        }
      ],
      "tally": {
        "supported": 1,
        "contradicted": 2,
        "unsupported": 1,
        "disclosedSeams": 0
      },
      "trustScore": 15,
      "certification": "REJECTED"
    },
    "forge": {
      "side": "Forge (proof-gated build)",
      "selfTest": {
        "passed": 12,
        "total": 12
      },
      "independentAccuracy": 1,
      "oracle": {
        "passed": 12,
        "total": 12,
        "failures": []
      },
      "observedShiftHandled": true,
      "reproducible": true,
      "claimVerdicts": [
        {
          "id": "B1",
          "type": "self-tests",
          "text": "All unit tests pass (12/12), run against an independent answer key.",
          "status": "SUPPORTED",
          "detail": "Self-tests pass (12/12) and agree with the independent oracle."
        },
        {
          "id": "B2",
          "type": "correctness",
          "text": "Matches the independent labeled oracle on 12/12 cases, including the observed-holiday edge.",
          "status": "SUPPORTED",
          "detail": "Independently measured accuracy 100.0% (12/12) meets the claimed 100%."
        },
        {
          "id": "B3",
          "type": "capability",
          "text": "Implements the observed weekend-shift rule; July 4 2026 (Sat) is correctly observed on Fri 2026-07-03.",
          "status": "SUPPORTED",
          "detail": "Probe addBusinessDays('2026-07-02',1) => '2026-07-06' (expected '2026-07-06'): observed-shift handled = true."
        },
        {
          "id": "B4",
          "type": "seam",
          "text": "DISCLOSED SEAM: the holiday calendar covers 2026 U.S. federal holidays only. Other years, states, or countries are out of scope and not claimed.",
          "status": "DISCLOSED",
          "detail": "Limitation disclosed rather than hidden — honest scoping, not an unsupported claim."
        }
      ],
      "tally": {
        "supported": 3,
        "contradicted": 0,
        "unsupported": 0,
        "disclosedSeams": 1
      },
      "trustScore": 100,
      "certification": "CERTIFIABLE"
    }
  }
}
