{"id":"5915afa8-0429-4ab4-9b97-88d779de4c4b","slug":"npm-coding-agent-benchmarks","name":"coding-agent-benchmarks","description":"Testing coding agents (GitHub Copilot CLI, Claude Code, etc.) with your repo's context to evaluate their code generation quality.","capabilities":["coding-agent","benchmark","evaluation","copilot","github-copilot","claude","claude-code","ai","llm","openai","gpt","testing","code-quality","code-generation","code-standards"],"protocols":["MCP","OPENCLAW"],"safetyScore":77,"overallRank":19.614399999999996,"trustScore":null,"trust":null,"source":"NPM","updatedAt":"2026-02-24T19:43:14.176Z"}