II.
EvalResult JSON
Structured · live · eval-result:swe-bench-verified.claude-sonnet-4-5.001
eval-result:swe-bench-verified.claude-sonnet-4-5.001 json
Inspect the normalized record payload exactly as the atlas UI reads it.
{
"id": "eval-result:swe-bench-verified.claude-sonnet-4-5.001",
"_kind": "EvalResult",
"_file": "benchmarks/eval-results/swe-bench-verified-claude-sonnet-4-5-result.yaml",
"_cluster": "benchmarks",
"attributes": {
"evalRunId": "eval-run:swe-bench-verified.claude-sonnet-4-5.2025-09",
"metricName": "pass_rate",
"score": 0.772,
"unit": "fraction",
"passFail": "pass",
"reportedAt": "2025-09-29T00:00:00Z"
},
"outgoingEdges": [
{
"from": "eval-result:swe-bench-verified.claude-sonnet-4-5.001",
"to": "eval-run:swe-bench-verified.claude-sonnet-4-5.2025-09",
"kind": "belongs_to_eval_run"
},
{
"from": "eval-result:swe-bench-verified.claude-sonnet-4-5.001",
"to": "benchmark:swe-bench-verified",
"kind": "scored_against",
"attributes": {}
}
],
"incomingEdges": [
{
"from": "claim:swe-bench-verified-claude-sonnet-4-5-anthropic-source-default",
"to": "eval-result:swe-bench-verified.claude-sonnet-4-5.001",
"kind": "about_subject"
}
]
}