eval-run:evalplus.gpt-5.2025-08
eval-run:evalplus.gpt-5.2025-08
EvalRunbenchmarks/eval-runs/extended-eval-runs.yaml·Open in Graph → {
"id": "eval-run:evalplus.gpt-5.2025-08",
"_kind": "EvalRun",
"_file": "benchmarks/eval-runs/extended-eval-runs.yaml",
"_cluster": "benchmarks",
"attributes": {
"target": "model:gpt-5@current",
"benchmarkId": "benchmark:bigcode-evalplus",
"testSetId": "test-set:swe-bench-verified-2024-12",
"targetId": "model:gpt-5@current",
"runAt": "2025-08-07T00:00:00Z",
"runBy": "evalplus-leaderboard",
"configHash": "sha256:placeholder-gpt-5-evalplus"
},
"outgoingEdges": [
{
"from": "eval-run:evalplus.gpt-5.2025-08",
"to": "model:gpt-5@current",
"kind": "evaluates_target"
},
{
"from": "eval-run:evalplus.gpt-5.2025-08",
"to": "benchmark:bigcode-evalplus",
"kind": "for_benchmark"
}
],
"incomingEdges": [
{
"from": "eval-result:evalplus.gpt-5.001",
"to": "eval-run:evalplus.gpt-5.2025-08",
"kind": "belongs_to_eval_run"
}
]
}