{
  "traceId": "trace-coding-agent-maintenance-suite-fix-command-k-search-regression",
  "scoreFormula": "Score equals the sum of the points earned across the weighted rubric components. Each component's earned points are allocated from the aggregate run score in proportion to the component's weight.",
  "scoreBreakdown": [
    [
      "Patch correctness",
      40
    ],
    [
      "Keyboard behavior",
      20
    ],
    [
      "Verification",
      25
    ],
    [
      "Diff hygiene",
      15
    ]
  ],
  "runScores": [
    {
      "modelId": "frontier-reasoning",
      "score": 78,
      "outcome": "Accepted",
      "scoreCalculation": [
        {
          "label": "Patch correctness",
          "weight": 40,
          "earned": 31,
          "max": 40
        },
        {
          "label": "Keyboard behavior",
          "weight": 20,
          "earned": 16,
          "max": 20
        },
        {
          "label": "Verification",
          "weight": 25,
          "earned": 19,
          "max": 25
        },
        {
          "label": "Diff hygiene",
          "weight": 15,
          "earned": 12,
          "max": 15
        }
      ]
    },
    {
      "modelId": "fast-mid-tier",
      "score": 66,
      "outcome": "Accepted with review",
      "scoreCalculation": [
        {
          "label": "Patch correctness",
          "weight": 40,
          "earned": 26,
          "max": 40
        },
        {
          "label": "Keyboard behavior",
          "weight": 20,
          "earned": 13,
          "max": 20
        },
        {
          "label": "Verification",
          "weight": 25,
          "earned": 17,
          "max": 25
        },
        {
          "label": "Diff hygiene",
          "weight": 15,
          "earned": 10,
          "max": 15
        }
      ]
    },
    {
      "modelId": "open-weight-local",
      "score": 52,
      "outcome": "Partial",
      "scoreCalculation": [
        {
          "label": "Patch correctness",
          "weight": 40,
          "earned": 21,
          "max": 40
        },
        {
          "label": "Keyboard behavior",
          "weight": 20,
          "earned": 10,
          "max": 20
        },
        {
          "label": "Verification",
          "weight": 25,
          "earned": 13,
          "max": 25
        },
        {
          "label": "Diff hygiene",
          "weight": 15,
          "earned": 8,
          "max": 15
        }
      ]
    },
    {
      "modelId": "small-routing",
      "score": 29,
      "outcome": "Rejected",
      "scoreCalculation": [
        {
          "label": "Patch correctness",
          "weight": 40,
          "earned": 12,
          "max": 40
        },
        {
          "label": "Keyboard behavior",
          "weight": 20,
          "earned": 6,
          "max": 20
        },
        {
          "label": "Verification",
          "weight": 25,
          "earned": 7,
          "max": 25
        },
        {
          "label": "Diff hygiene",
          "weight": 15,
          "earned": 4,
          "max": 15
        }
      ]
    }
  ]
}
