II.
Benchmark JSON
Structured · live · benchmark:agentboard
AgentBoard JSON
Inspect the normalized record payload exactly as the atlas UI reads it.
{
"id": "benchmark:agentboard",
"_kind": "Benchmark",
"_file": "benchmarks/benchmarks/benchmarks-leaderboards.yaml",
"_cluster": "benchmarks",
"attributes": {
"displayName": "AgentBoard",
"homepageUrl": "https://hkust-nlp.github.io/agentboard/",
"kind": "agent-leaderboard",
"targetsKind": "AgentVersion",
"description": "AgentBoard is an analytical benchmark and leaderboard for LLM agents\ncovering embodied tasks, web, tool use, and games. Reports\nfine-grained progress and sub-goal metrics rather than only success\nrate.\n"
},
"outgoingEdges": [
{
"from": "benchmark:agentboard",
"to": "domain:ml-ai",
"kind": "applies_to",
"attributes": {}
}
],
"incomingEdges": [
{
"from": "scope-boundary:agentboard.scope",
"to": "benchmark:agentboard",
"kind": "bounds_subject"
}
]
}