{
  "slug": "coding-agent-arena",
  "title": "Coding Agent Arena",
  "stage": "Research",
  "audience": "Engineering leaders and founders",
  "summary": "A coding-agent evaluation track for repository edits, bug fixes, browser checks, terminal usage, and regression discipline.",
  "href": "/studio/coding-agent-arena",
  "problem": "Coding agents are usually shown through curated demos. The Arena measures whether they can read an existing repository, make a scoped patch, run checks, inspect the UI, and produce work a senior engineer would review seriously.",
  "metrics": [
    "Patch correctness",
    "Test pass rate",
    "Review quality",
    "Time to mergeable PR"
  ],
  "outputs": [
    "Patch review",
    "Regression report",
    "Tool-use transcript",
    "Merge-readiness score"
  ],
  "buyerQuestions": [
    "Can this agent work inside our existing codebase?",
    "Does it respect ownership boundaries and avoid unrelated churn?",
    "Can it debug failing tests without hiding the failure?",
    "What tasks are safe to delegate today?"
  ],
  "evidenceLinks": [
    [
      "Coding Agent Maintenance Suite",
      "/benchmarks/coding-agent-maintenance-suite"
    ],
    [
      "Agentic Reliability Index",
      "/leaderboards#agentic-reliability-index"
    ],
    [
      "Leaderboard methodology",
      "/articles/building-a-useful-ai-leaderboard-without-fooling-ourselves"
    ]
  ],
  "demoState": "Live coding arena is connected to the Coding Agent Maintenance Suite; next step is importing real agent patches, logs, and review artifacts.",
  "catalogRank": 2,
  "maturity": "Research surface ready for benchmark-backed demos",
  "packetPath": "/reports/studio/coding-agent-arena.md",
  "jsonPath": "/reports/studio/coding-agent-arena.json",
  "previewImage": "/reports/studio/previews/coding-agent-arena.png",
  "previewAlt": "Coding Agent Arena live Studio preview screenshot",
  "demoReadinessScore": 82,
  "demoReadiness": "Demo-ready with current generated traces and interactive controls; replace screenshots with product walkthrough video when available.",
  "missingForLiveDemo": [
    "Product walkthrough video",
    "Client-approved example",
    "Real run export"
  ],
  "handoffOwner": "Sanjay Prasad",
  "nextDemoArtifact": "/reports/studio/coding-agent-arena.md"
}
