{"replay":{"kind":"benchmark","packageId":"addr/0xFf620746854Bde9EBbE0e90901974b5da746670d/research-agent@1.0.0","packageHash":"sha256:e96cfebb51afde7f5a8bd32668f2d6a5815642b85e34b1fe93fd6f58a9ee5447","benchmarkId":"benchmark/source-backed-research@1.0.0","benchmarkDefinitionHash":"sha256:e312a86a54f41197730b5ae0a0d0f3768dd06b8d63225b0e4300fdd44fae1f2a","runtime":"codex","executionBackend":"local","availableTools":["fetch","markdown"],"grantedPermissions":["http:get","storage:write"],"requestedApiOrigins":[],"requestedChains":[],"requestedTokens":[],"result":{"status":"success","score":10,"maxScore":10,"caseResults":[{"caseId":"captures-cited-links","status":"pass","score":5,"maxScore":5},{"caseId":"returns-source-backed-summary","status":"pass","score":5,"maxScore":5}],"outputHash":"sha256:086d3d4dcb4c62652afd42091bad853ac638fa0c5aba4ebf9ef268fd56b8d47b","stdoutObjectKey":"64e1e271-a7a4-4d85-b6e6-30279db284f3/output.md","artifactsObjectPrefix":"64e1e271-a7a4-4d85-b6e6-30279db284f3/","judgeSummary":"Benchmark suite produced the expected deterministic output. The research brief includes the expected source-backed summary language and captures all required cited links.","judgeWarnings":[]}}}