eval-result:gpqa-diamond.gemini-3-pro.2025-11-18.accuracy
eval-result:gpqa-diamond.gemini-3-pro.2025-11-18.accuracy
EvalResultbenchmarks/eval-results/eval-results-google.yaml·Open in Graph → {
"id": "eval-result:gpqa-diamond.gemini-3-pro.2025-11-18.accuracy",
"_kind": "EvalResult",
"_file": "benchmarks/eval-results/eval-results-google.yaml",
"_cluster": "benchmarks",
"attributes": {
"evalRunId": "eval-run:gpqa-diamond.gemini-3-pro.2025-11-18",
"metricName": "accuracy",
"score": 0.919,
"unit": "fraction",
"passFail": "pass",
"reportedAt": "2026-05-04T00:00:00Z"
},
"outgoingEdges": [
{
"from": "eval-result:gpqa-diamond.gemini-3-pro.2025-11-18.accuracy",
"to": "eval-run:gpqa-diamond.gemini-3-pro.2025-11-18",
"kind": "belongs_to_eval_run"
}
],
"incomingEdges": []
}