II.
Workflow JSON
Structured · live · workflow:full-stack-system-reliability-review
Full-Stack System Reliability Review json
Inspect the normalized record payload exactly as the atlas UI reads it.
{
"id": "workflow:full-stack-system-reliability-review",
"_kind": "Workflow",
"_file": "workflows/workflows/workflows-cross-domain.yaml",
"_cluster": "workflows",
"attributes": {
"displayName": "Full-Stack System Reliability Review",
"workflowKind": "governance",
"triggerType": "scheduled",
"typicalCadence": "quarterly",
"complexity": "cross-team",
"description": "Reviews end-to-end system reliability across the full technology\nstack -- analyzing frontend error rates, API latency percentiles,\nand database query performance together as correlated signals,\nevaluating SLO attainment across web, API, and data tiers, reviewing\ncloud infrastructure capacity headroom and auto-scaling policy\neffectiveness, auditing observability coverage for blind spots in\ntracing, logging, and metrics pipelines, assessing CI/CD pipeline\nreliability and deployment success rates, stress-testing failover\nprocedures across availability zones, and correlating incident\nfrequency with recent change velocity. Produces cross-stack\nreliability scorecard, SLO attainment report, and prioritized\nhardening backlog. Excludes feature development.\n"
},
"outgoingEdges": [
{
"from": "workflow:full-stack-system-reliability-review",
"to": "role:staff-engineer",
"kind": "involves_role",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "role:platform-engineer",
"kind": "involves_role",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "role:incident-commander",
"kind": "involves_role",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "skill-area:sli-slo-management",
"kind": "requires_skill_area",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "skill-area:observability-pipeline",
"kind": "requires_skill_area",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "skill-area:chaos-engineering",
"kind": "requires_skill_area",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "domain:web-development",
"kind": "applies_to_domain",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "domain:databases",
"kind": "applies_to_domain",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "domain:cloud-infra",
"kind": "applies_to_domain",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "domain:observability",
"kind": "applies_to_domain",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "domain:devops",
"kind": "applies_to_domain",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "responsibility:slo-definition",
"kind": "triggers_responsibility",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "responsibility:capacity-planning",
"kind": "triggers_responsibility",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "responsibility:review-architecture-changes",
"kind": "triggers_responsibility",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "org-unit:engineering",
"kind": "performed_by_org_unit",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "org-unit:infra-engineering",
"kind": "performed_by_org_unit",
"attributes": {}
},
{
"from": "workflow:full-stack-system-reliability-review",
"to": "org-unit:incident-response-team",
"kind": "performed_by_org_unit",
"attributes": {}
}
],
"incomingEdges": []
}