{
  "traceId": "trace-browser-operations-suite-multi-step-demo-form",
  "generatedAt": "2026-05-16T00:00:00+05:30",
  "artifactStatus": "Synthetic replay scaffold. Replace with real harness logs, screenshots, and provider response ids after first production benchmark runs.",
  "runs": [
    {
      "modelId": "frontier-reasoning",
      "modelVersion": "frontier-reasoning-eval-holdout-2026-05",
      "runSeed": 2026051650,
      "promptPacket": "multi-step-demo-form-holdout-packet-v0.1",
      "toolCalls": [
        "fill form",
        "handle validation",
        "capture confirmation"
      ],
      "answerExcerpt": "Submitted the form after correcting one validation error and captured final confirmation state.",
      "failureReason": "Slow but reliable.",
      "reviewerNote": "Recovered from one validation error and captured final state; slow but reliable.",
      "costUnits": 5.1,
      "latencyMs": 6980
    },
    {
      "modelId": "fast-mid-tier",
      "modelVersion": "fast-mid-tier-eval-holdout-2026-05",
      "runSeed": 2026051651,
      "promptPacket": "multi-step-demo-form-holdout-packet-v0.1",
      "toolCalls": [
        "fill visible fields",
        "click submit"
      ],
      "answerExcerpt": "Filled the visible fields and clicked submit.",
      "failureReason": "Missed a hidden required dropdown.",
      "reviewerNote": "Completed visible fields but missed a hidden required dropdown.",
      "costUnits": 2.2,
      "latencyMs": 3840
    },
    {
      "modelId": "open-weight-local",
      "modelVersion": "open-weight-local-eval-holdout-2026-05",
      "runSeed": 2026051652,
      "promptPacket": "multi-step-demo-form-holdout-packet-v0.1",
      "toolCalls": [
        "fill visible fields",
        "click submit"
      ],
      "answerExcerpt": "The form could not be submitted due to validation errors.",
      "failureReason": "Failed to recover after validation error.",
      "reviewerNote": "Failed to recover after validation error.",
      "costUnits": 1.5,
      "latencyMs": 5920
    },
    {
      "modelId": "small-routing",
      "modelVersion": "small-routing-eval-holdout-2026-05",
      "runSeed": 2026051653,
      "promptPacket": "multi-step-demo-form-holdout-packet-v0.1",
      "toolCalls": [
        "classify task"
      ],
      "answerExcerpt": "This is a browser form task.",
      "failureReason": "Not suitable for stateful browser execution.",
      "reviewerNote": "Not suitable for stateful browser execution.",
      "costUnits": 0.4,
      "latencyMs": 1920
    }
  ]
}
