Source-backed research brief
{
"benchmarkRunId": "93e60ede-8c0c-4e3b-b470-a5ba3c629260",
"benchmarkId": "benchmark/source-backed-research@1.0.0",
"benchmarkTitle": "Source-backed research brief",
"packageId": "web/dynamic-credit-live-1773681992489.example/research-agent@1.0.1773681992489",
"packageHash": "sha256:e9e05c4c8d9d9b953d375ec1cb91b50f3dc19aab75e0e82b56008acec143429c",
"runtime": "codex",
"signer": "addr:dynamic-credit-live",
"writeReceiptRequested": false,
"status": "success",
"executionBackend": "local",
"requestedExecutionBackend": "auto",
"sandboxProfile": "default",
"networkPolicy": "none",
"timeoutMs": 10000,
"benchmarkDefinitionHash": "sha256:e312a86a54f41197730b5ae0a0d0f3768dd06b8d63225b0e4300fdd44fae1f2a",
"replayInput": {
"availableTools": [
"fetch",
"markdown"
],
"grantedPermissions": [
"http:get",
"storage:write"
],
"requestedApiOrigins": [],
"requestedChains": [],
"requestedTokens": []
},
"score": 10,
"maxScore": 10,
"summary": "Benchmark suite produced the expected deterministic output.",
"startedAt": "2026-03-16T17:26:38.404Z",
"createdAt": "2026-03-16T17:26:38.404Z",
"evaluationChecks": [
{
"id": "runtime:codex",
"status": "pass",
"message": "Runtime codex is supported."
},
{
"id": "namespace:verified",
"status": "pass",
"message": "Namespace is verified."
},
{
"id": "tool:fetch",
"status": "pass",
"message": "Required tool fetch is available."
},
{
"id": "tool:markdown",
"status": "pass",
"message": "Required tool markdown is available."
},
{
"id": "permission:http:get",
"status": "pass",
"message": "Permission http:get is granted."
},
{
"id": "permission:storage:write",
"status": "pass",
"message": "Permission storage:write is granted."
},
{
"id": "policy:attached",
"status": "skip",
"message": "No attached policy to validate against."
}
],
"caseResults": [
{
"caseId": "returns-source-backed-summary",
"title": "Returns a source-backed summary",
"status": "pass",
"score": 5,
"maxScore": 5,
"message": "Benchmark brief includes the expected source-backed summary language."
},
{
"caseId": "captures-cited-links",
"title": "Captures cited links",
"status": "pass",
"score": 5,
"maxScore": 5,
"message": "Benchmark brief included all required cited links."
}
],
"evaluationOk": true,
"blockedByPreflight": false,
"completedAt": "2026-03-16T17:26:38.404Z",
"lastHeartbeatAt": "2026-03-16T17:26:38.404Z",
"outputHash": "sha256:086d3d4dcb4c62652afd42091bad853ac638fa0c5aba4ebf9ef268fd56b8d47b",
"stdoutObjectKey": "93e60ede-8c0c-4e3b-b470-a5ba3c629260/output.md",
"artifactsObjectPrefix": "93e60ede-8c0c-4e3b-b470-a5ba3c629260/",
"judgeSummary": "Benchmark suite produced the expected deterministic output."
}