{
  "traceId": "trace-indian-enterprise-workflow-suite-gst-credit-note-reconciliation",
  "generatedAt": "2026-05-16T00:00:00+05:30",
  "artifactStatus": "Synthetic replay scaffold. Replace with real harness logs, screenshots, and provider response ids after first production benchmark runs.",
  "runs": [
    {
      "modelId": "frontier-reasoning",
      "modelVersion": "frontier-reasoning-eval-holdout-2026-05",
      "runSeed": 2026051690,
      "promptPacket": "gst-credit-note-reconciliation-holdout-packet-v0.1",
      "toolCalls": [
        "parse invoice",
        "parse credit note",
        "compare ledger"
      ],
      "answerExcerpt": "The credit note exists but the ledger has not applied it against the invoice; finance should keep the payable open and request posting confirmation.",
      "failureReason": "No major issue.",
      "reviewerNote": "Strong reconciliation with correct distinction between issued and applied credit.",
      "costUnits": 5.2,
      "latencyMs": 6720
    },
    {
      "modelId": "fast-mid-tier",
      "modelVersion": "fast-mid-tier-eval-holdout-2026-05",
      "runSeed": 2026051691,
      "promptPacket": "gst-credit-note-reconciliation-holdout-packet-v0.1",
      "toolCalls": [
        "parse invoice",
        "compare ledger"
      ],
      "answerExcerpt": "The credit note matches the invoice discrepancy; ledger posting still needs confirmation.",
      "failureReason": "Reviewer added one missing ledger citation.",
      "reviewerNote": "Correct conclusion with one evidence gap.",
      "costUnits": 2.5,
      "latencyMs": 3890
    },
    {
      "modelId": "open-weight-local",
      "modelVersion": "open-weight-local-eval-holdout-2026-05",
      "runSeed": 2026051692,
      "promptPacket": "gst-credit-note-reconciliation-holdout-packet-v0.1",
      "toolCalls": [
        "parse invoice",
        "parse credit note"
      ],
      "answerExcerpt": "The vendor has issued a credit note so the mismatch appears resolved.",
      "failureReason": "Incorrectly treated issuance as application.",
      "reviewerNote": "Needed human correction on ledger interpretation.",
      "costUnits": 1.6,
      "latencyMs": 5840
    },
    {
      "modelId": "small-routing",
      "modelVersion": "small-routing-eval-holdout-2026-05",
      "runSeed": 2026051693,
      "promptPacket": "gst-credit-note-reconciliation-holdout-packet-v0.1",
      "toolCalls": [
        "classify workflow"
      ],
      "answerExcerpt": "Finance discrepancy detected.",
      "failureReason": "No reconciliation.",
      "reviewerNote": "Routing only; not safe for finance action.",
      "costUnits": 0.4,
      "latencyMs": 1860
    }
  ]
}
