{
  "traceId": "trace-indian-enterprise-workflow-suite-gst-invoice-discrepancy",
  "generatedAt": "2026-05-16T00:00:00+05:30",
  "artifactStatus": "Synthetic replay scaffold. Replace with real harness logs, screenshots, and provider response IDs after the first production benchmark runs.",
  "runs": [
    {
      "modelId": "frontier-reasoning",
      "modelVersion": "frontier-reasoning-eval-public-2026-05",
      "runSeed": 2026051600,
      "promptPacket": "gst-invoice-discrepancy-public-packet-v0.1",
      "toolCalls": [
        "parse invoice table",
        "compare PO tax rate",
        "draft vendor note"
      ],
      "answerExcerpt": "The invoice uses a GST rate that does not match the purchase order, and the exception email explains why the vendor needs to revise the tax line before payment.",
      "failureReason": "Minor formatting cleanup only.",
      "reviewerNote": "Correct mismatch, cited all three evidence points, and proposed a clean vendor follow-up.",
      "costUnits": 4.8,
      "latencyMs": 6120
    },
    {
      "modelId": "fast-mid-tier",
      "modelVersion": "fast-mid-tier-eval-public-2026-05",
      "runSeed": 2026051601,
      "promptPacket": "gst-invoice-discrepancy-public-packet-v0.1",
      "toolCalls": [
        "parse invoice table",
        "compare PO tax rate"
      ],
      "answerExcerpt": "The GST discrepancy appears to come from a rate mismatch between the invoice and the PO.",
      "failureReason": "One citation label pointed to the right document but the wrong row.",
      "reviewerNote": "Correct calculation and tone; reviewer had to repair one citation label.",
      "costUnits": 2.1,
      "latencyMs": 3410
    },
    {
      "modelId": "open-weight-local",
      "modelVersion": "open-weight-local-eval-public-2026-05",
      "runSeed": 2026051602,
      "promptPacket": "gst-invoice-discrepancy-public-packet-v0.1",
      "toolCalls": [
        "parse invoice table"
      ],
      "answerExcerpt": "The invoice has a tax mismatch and should be checked against the purchase order.",
      "failureReason": "Confused CGST/SGST allocation and omitted the vendor exception email.",
      "reviewerNote": "Found a mismatch but confused CGST/SGST allocation and needed human correction.",
      "costUnits": 1.4,
      "latencyMs": 5280
    },
    {
      "modelId": "small-routing",
      "modelVersion": "small-routing-eval-public-2026-05",
      "runSeed": 2026051603,
      "promptPacket": "gst-invoice-discrepancy-public-packet-v0.1",
      "toolCalls": [
        "classify workflow"
      ],
      "answerExcerpt": "This looks like a finance escalation.",
      "failureReason": "Could route the task but generated an unsupported tax explanation.",
      "reviewerNote": "Useful triage signal only; generated an unsupported tax explanation.",
      "costUnits": 0.4,
      "latencyMs": 1810
    }
  ]
}
