Replay for ecd857c0-e819-4a24-a5e2-de6b49aff162
Replay kind: benchmark
Replay source: original receipt
Comparison: pending or not applicable
{
"kind": "benchmark",
"packageId": "addr/0x33327fbc0e7040F14657eD61eaF7Eb4d723AF595/research-agent@1.0.0",
"packageHash": "sha256:22772b736fbd391446bbc7c974f114f9f8644869095820d3347e06bf37205cbd",
"benchmarkId": "benchmark/source-backed-research@1.0.0",
"benchmarkDefinitionHash": "sha256:e312a86a54f41197730b5ae0a0d0f3768dd06b8d63225b0e4300fdd44fae1f2a",
"runtime": "codex",
"executionBackend": "local",
"availableTools": [
"fetch",
"markdown"
],
"grantedPermissions": [
"http:get",
"storage:write"
],
"requestedApiOrigins": [],
"requestedChains": [],
"requestedTokens": [],
"result": {
"status": "success",
"score": 10,
"maxScore": 10,
"caseResults": [
{
"caseId": "captures-cited-links",
"status": "pass",
"score": 5,
"maxScore": 5
},
{
"caseId": "returns-source-backed-summary",
"status": "pass",
"score": 5,
"maxScore": 5
}
],
"outputHash": "sha256:086d3d4dcb4c62652afd42091bad853ac638fa0c5aba4ebf9ef268fd56b8d47b",
"stdoutObjectKey": "3e9a6a41-df97-4ec1-b230-47e17a24042c/output.md",
"artifactsObjectPrefix": "3e9a6a41-df97-4ec1-b230-47e17a24042c/",
"judgeSummary": "Benchmark suite produced the expected deterministic output. The research brief includes the expected source-backed summary language and all required cited links.",
"judgeWarnings": []
}
}