Replay for 050998fa-f425-4d10-a34e-74a6a6c2692d

Replay kind: benchmark

Replay source: original receipt

Comparison: pending or not applicable

replay page · replay JSON

{
  "kind": "benchmark",
  "packageId": "web/give.md/policy-watchdog@1.0.0",
  "packageHash": "sha256:4f4de6805c4a296366654abcc5f2ddb8a8905f92adf71b1c1ec31eba15058aa3",
  "policyId": "policy/research-session@1.0.0",
  "policyHash": "sha256:b83ad9e9d1a209f12528b5cf4352d45cd14c9a8f061c19df898743a5f5ce594f",
  "benchmarkId": "benchmark/policy-safety-review@1.0.0",
  "benchmarkDefinitionHash": "sha256:d3ed23773d0c2a566a8dca19da0df5c23082b6df04e381f795edfc65b24842f0",
  "runtime": "claude",
  "executionBackend": "local",
  "availableTools": [
    "fetch",
    "json",
    "markdown"
  ],
  "grantedPermissions": [
    "http:get",
    "storage:write"
  ],
  "requestedApiOrigins": [
    "https://api.give.md"
  ],
  "requestedChains": [
    "base"
  ],
  "requestedTokens": [
    "USDC"
  ],
  "requestedSpend": "0.05 USDC",
  "result": {
    "status": "success",
    "score": 10,
    "maxScore": 10,
    "caseResults": [
      {
        "caseId": "flags-approval-thresholds",
        "status": "pass",
        "score": 5,
        "maxScore": 5
      },
      {
        "caseId": "tracks-delegation-windows",
        "status": "pass",
        "score": 5,
        "maxScore": 5
      }
    ],
    "outputHash": "sha256:d5095bc8dec61bc94faefd08437c6342e5b960800e5294b67184a1f72eaa6483",
    "stdoutObjectKey": "64f51603-235b-449b-a560-06a5244f77c1/output.md",
    "artifactsObjectPrefix": "64f51603-235b-449b-a560-06a5244f77c1/",
    "judgeSummary": "Benchmark suite produced the expected deterministic output. Policy review flagged the expected approval threshold findings. Policy review tracked the delegation window and follow-up.",
    "judgeWarnings": []
  }
}