Source-backed research brief

{
  "benchmarkRunId": "b924d4ca-0c9f-40aa-87d5-d459b46c23a1",
  "benchmarkId": "benchmark/source-backed-research@1.0.0",
  "benchmarkTitle": "Source-backed research brief",
  "packageId": "addr/0x69dFFb78f20D3B1511067C4899e6Afb5f3099964/research-agent@1.0.0",
  "packageHash": "sha256:5b49c3bf427aac8d024ed0e6064ef4e1f51b4ebb2d34511151ba838548c10f8e",
  "runtime": "codex",
  "signer": "addr:0x1111111111111111111111111111111111111111",
  "principalId": "sha256:1156dd81a7991c7497e8684f29c8d47734a9e1b3dabffa9d9a84bae57427a837",
  "writeReceiptRequested": true,
  "status": "success",
  "executionBackend": "local",
  "requestedExecutionBackend": "auto",
  "sandboxProfile": "default",
  "networkPolicy": "none",
  "timeoutMs": 10000,
  "benchmarkDefinitionHash": "sha256:e312a86a54f41197730b5ae0a0d0f3768dd06b8d63225b0e4300fdd44fae1f2a",
  "replayInput": {
    "availableTools": [
      "fetch",
      "markdown"
    ],
    "grantedPermissions": [
      "http:get",
      "storage:write"
    ],
    "requestedApiOrigins": [],
    "requestedChains": [],
    "requestedTokens": []
  },
  "score": 10,
  "maxScore": 10,
  "summary": "Benchmark suite produced the expected deterministic output.",
  "startedAt": "2026-03-18T16:00:52.266Z",
  "createdAt": "2026-03-18T16:00:52.266Z",
  "evaluationChecks": [
    {
      "id": "runtime:codex",
      "status": "pass",
      "message": "Runtime codex is supported."
    },
    {
      "id": "namespace:verified",
      "status": "pass",
      "message": "Namespace is verified."
    },
    {
      "id": "tool:fetch",
      "status": "pass",
      "message": "Required tool fetch is available."
    },
    {
      "id": "tool:markdown",
      "status": "pass",
      "message": "Required tool markdown is available."
    },
    {
      "id": "permission:http:get",
      "status": "pass",
      "message": "Permission http:get is granted."
    },
    {
      "id": "permission:storage:write",
      "status": "pass",
      "message": "Permission storage:write is granted."
    },
    {
      "id": "policy:attached",
      "status": "skip",
      "message": "No attached policy to validate against."
    }
  ],
  "caseResults": [
    {
      "caseId": "returns-source-backed-summary",
      "title": "Returns a source-backed summary",
      "status": "pass",
      "score": 5,
      "maxScore": 5,
      "message": "Benchmark brief includes the expected source-backed summary language."
    },
    {
      "caseId": "captures-cited-links",
      "title": "Captures cited links",
      "status": "pass",
      "score": 5,
      "maxScore": 5,
      "message": "Benchmark brief included all required cited links."
    }
  ],
  "evaluationOk": true,
  "blockedByPreflight": false,
  "completedAt": "2026-03-18T16:00:52.309Z",
  "lastHeartbeatAt": "2026-03-18T16:00:52.309Z",
  "outputHash": "sha256:086d3d4dcb4c62652afd42091bad853ac638fa0c5aba4ebf9ef268fd56b8d47b",
  "stdoutObjectKey": "b924d4ca-0c9f-40aa-87d5-d459b46c23a1/output.md",
  "artifactsObjectPrefix": "b924d4ca-0c9f-40aa-87d5-d459b46c23a1/",
  "judgeSummary": "Benchmark suite produced the expected deterministic output. The research brief includes the expected source-backed summary language and all required cited links.",
  "receiptId": "8d701826-33a8-4dbd-9296-4a27fb8c5b81"
}