{
  "traceId": "trace-coding-agent-maintenance-suite-add-playwright-smoke-test",
  "scoreFormula": "Score equals the sum of weighted rubric components. Component earned points are allocated from the aggregate run score.",
  "scoreBreakdown": [
    [
      "Test coverage",
      35
    ],
    [
      "Scope",
      25
    ],
    [
      "Runtime discipline",
      25
    ],
    [
      "Verification",
      15
    ]
  ],
  "runScores": [
    {
      "modelId": "frontier-reasoning",
      "score": 77,
      "outcome": "Accepted",
      "scoreCalculation": [
        {
          "label": "Test coverage",
          "weight": 35,
          "earned": 27,
          "max": 35
        },
        {
          "label": "Scope",
          "weight": 25,
          "earned": 19,
          "max": 25
        },
        {
          "label": "Runtime discipline",
          "weight": 25,
          "earned": 19,
          "max": 25
        },
        {
          "label": "Verification",
          "weight": 15,
          "earned": 12,
          "max": 15
        }
      ]
    },
    {
      "modelId": "fast-mid-tier",
      "score": 68,
      "outcome": "Accepted with review",
      "scoreCalculation": [
        {
          "label": "Test coverage",
          "weight": 35,
          "earned": 24,
          "max": 35
        },
        {
          "label": "Scope",
          "weight": 25,
          "earned": 17,
          "max": 25
        },
        {
          "label": "Runtime discipline",
          "weight": 25,
          "earned": 17,
          "max": 25
        },
        {
          "label": "Verification",
          "weight": 15,
          "earned": 10,
          "max": 15
        }
      ]
    },
    {
      "modelId": "open-weight-local",
      "score": 49,
      "outcome": "Partial",
      "scoreCalculation": [
        {
          "label": "Test coverage",
          "weight": 35,
          "earned": 17,
          "max": 35
        },
        {
          "label": "Scope",
          "weight": 25,
          "earned": 12,
          "max": 25
        },
        {
          "label": "Runtime discipline",
          "weight": 25,
          "earned": 12,
          "max": 25
        },
        {
          "label": "Verification",
          "weight": 15,
          "earned": 8,
          "max": 15
        }
      ]
    },
    {
      "modelId": "small-routing",
      "score": 26,
      "outcome": "Rejected",
      "scoreCalculation": [
        {
          "label": "Test coverage",
          "weight": 35,
          "earned": 9,
          "max": 35
        },
        {
          "label": "Scope",
          "weight": 25,
          "earned": 7,
          "max": 25
        },
        {
          "label": "Runtime discipline",
          "weight": 25,
          "earned": 6,
          "max": 25
        },
        {
          "label": "Verification",
          "weight": 15,
          "earned": 4,
          "max": 15
        }
      ]
    }
  ]
}
