Grid Reliability Command Center
SRE operations view for uptime posture, incident pressure, root causes, and active response queue.
Interactive Preview (Aurora Light)
Theme
Dashboard Definition
{
"id": "grid_reliability_command_center",
"version": "0.0.1",
"generated_at": "2026-02-22T00:00:00Z",
"updated_at": "2026-02-22T00:00:00Z",
"title": "Grid Reliability Command Center",
"description": "Operational reliability posture with incident backlog, root causes, and latency-risk hotspots.",
"source": "ops.platform_reliability_rollup",
"tags": [
"operations",
"reliability",
"sre"
],
"timezone": "UTC",
"default_locale": "en_US",
"widgets": [
{
"id": "metric_uptime",
"type": "metric",
"title": "30-Day Uptime",
"description": "API estate availability.",
"data_type": "percent",
"data_ref": "ds_uptime"
},
{
"id": "metric_mttr",
"type": "metric",
"title": "MTTR (min)",
"description": "Mean recovery time across incidents.",
"data_type": "number",
"data_ref": "ds_mttr"
},
{
"id": "chart_incidents_service",
"type": "bar-chart",
"title": "Open Incidents by Service",
"description": "Current incident concentration.",
"data_ref": "ds_incidents_service"
},
{
"id": "chart_error_budget",
"type": "line-chart",
"title": "Error Budget Burn",
"description": "Six-sprint burn trend by cluster.",
"x_min": 1,
"x_max": 6,
"data_ref": "ds_error_budget_burn"
},
{
"id": "chart_recovery_distribution",
"type": "box-plot",
"title": "Recovery Time Distribution",
"description": "Resolution spread by service family (minutes).",
"data_ref": "ds_recovery_distribution"
},
{
"id": "chart_root_cause",
"type": "pie-chart",
"title": "Root Cause Mix",
"description": "Incident attribution over trailing month.",
"data_ref": "ds_root_causes"
},
{
"id": "chart_latency_vs_error",
"type": "scatter-chart",
"title": "Latency vs Error Rate",
"description": "Service cluster health envelope.",
"x_min": 90,
"x_max": 300,
"data_ref": "ds_latency_error_scatter"
},
{
"id": "table_live_incidents",
"type": "table",
"title": "Live Incident Queue",
"description": "Prioritized active incidents.",
"data_ref": "ds_live_incidents"
}
]
}
Data Definition
{
"id": "grid_reliability_command_center_data",
"dashboard_id": "grid_reliability_command_center",
"data_sources": {
"ds_uptime": {
"kind": "inline",
"description": "Rolling 30-day API uptime.",
"updated_at": "2026-02-22T00:00:00Z",
"data": {
"value": 0.9994,
"data_type": "percent",
"sentiment": "positive"
}
},
"ds_mttr": {
"kind": "inline",
"description": "Mean time to recovery in minutes.",
"updated_at": "2026-02-22T00:00:00Z",
"data": {
"value": 34.8,
"data_type": "number",
"sentiment": "positive"
}
},
"ds_incidents_service": {
"kind": "inline",
"description": "Open incidents by service.",
"updated_at": "2026-02-22T00:00:00Z",
"data": [
{
"x": "Auth",
"y": 7
},
{
"x": "Billing",
"y": 5
},
{
"x": "Ingest",
"y": 9
},
{
"x": "Search",
"y": 4
},
{
"x": "Storage",
"y": 6
}
]
},
"ds_error_budget_burn": {
"kind": "inline",
"description": "Error budget burn by cluster over time.",
"updated_at": "2026-02-22T00:00:00Z",
"data": [
{
"label": "Primary",
"data": [
{
"x": 1,
"y": 2.5
},
{
"x": 2,
"y": 3.1
},
{
"x": 3,
"y": 3.6
},
{
"x": 4,
"y": 2.9
},
{
"x": 5,
"y": 4.2
},
{
"x": 6,
"y": 3.8
}
]
},
{
"label": "Failover",
"data": [
{
"x": 1,
"y": 1.2
},
{
"x": 2,
"y": 1.4
},
{
"x": 3,
"y": 1.8
},
{
"x": 4,
"y": 1.7
},
{
"x": 5,
"y": 2.1
},
{
"x": 6,
"y": 2.0
}
]
}
]
},
"ds_recovery_distribution": {
"kind": "inline",
"description": "MTTR distribution summary by service family.",
"updated_at": "2026-02-22T00:00:00Z",
"data": [
{
"x": "Core APIs",
"min": 12,
"q1": 22,
"median": 31,
"q3": 44,
"max": 71
},
{
"x": "Data Plane",
"min": 10,
"q1": 19,
"median": 27,
"q3": 39,
"max": 66
},
{
"x": "Edge",
"min": 6,
"q1": 14,
"median": 20,
"q3": 28,
"max": 52
},
{
"x": "Internal Tools",
"min": 4,
"q1": 9,
"median": 15,
"q3": 23,
"max": 48
}
]
},
"ds_root_causes": {
"kind": "inline",
"description": "Distribution of incident root causes.",
"updated_at": "2026-02-22T00:00:00Z",
"data": [
{
"label": "Dependency",
"value": 31
},
{
"label": "Capacity",
"value": 24
},
{
"label": "Config Drift",
"value": 19
},
{
"label": "Deploy Regression",
"value": 16
},
{
"label": "Unknown",
"value": 10
}
]
},
"ds_latency_error_scatter": {
"kind": "inline",
"description": "P95 latency versus error rate by service cluster.",
"updated_at": "2026-02-22T00:00:00Z",
"data": [
{
"label": "Core APIs",
"data": [
{
"x": 180,
"y": 0.6
},
{
"x": 210,
"y": 0.9
},
{
"x": 240,
"y": 1.2
},
{
"x": 265,
"y": 1.3
},
{
"x": 290,
"y": 1.7
}
]
},
{
"label": "Edge",
"data": [
{
"x": 95,
"y": 0.2
},
{
"x": 110,
"y": 0.3
},
{
"x": 130,
"y": 0.45
},
{
"x": 145,
"y": 0.52
},
{
"x": 165,
"y": 0.7
}
]
}
]
},
"ds_live_incidents": {
"kind": "inline",
"description": "Current active incident queue.",
"updated_at": "2026-02-22T00:00:00Z",
"data": {
"columns": [
{
"name": "Incident",
"data_key": "incident",
"data_type": "string",
"data_formatter": "",
"align": "start"
},
{
"name": "Service",
"data_key": "service",
"data_type": "string",
"data_formatter": "",
"align": "start"
},
{
"name": "Severity",
"data_key": "severity",
"data_type": "string",
"data_formatter": "",
"align": "center"
},
{
"name": "Owner",
"data_key": "owner",
"data_type": "string",
"data_formatter": "",
"align": "start"
},
{
"name": "ETA (min)",
"data_key": "eta_minutes",
"data_type": "number",
"data_formatter": "number",
"align": "end"
}
],
"rows": [
{
"incident": "INC-1452",
"service": "Ingest",
"severity": "SEV-1",
"owner": "Data Core",
"eta_minutes": 35
},
{
"incident": "INC-1455",
"service": "Auth",
"severity": "SEV-2",
"owner": "Identity",
"eta_minutes": 55
},
{
"incident": "INC-1458",
"service": "Storage",
"severity": "SEV-2",
"owner": "Platform",
"eta_minutes": 42
},
{
"incident": "INC-1461",
"service": "Billing",
"severity": "SEV-3",
"owner": "FinOps",
"eta_minutes": 75
}
]
}
}
},
"version": "0.0.1",
"generated_at": "2026-02-22T00:00:00Z",
"updated_at": "2026-02-22T00:00:00Z",
"source": "ops.platform_reliability_rollup",
"tags": [
"operations",
"reliability",
"sre"
],
"timezone": "UTC",
"default_locale": "en_US"
}
Theme Render Options
Aurora Light
{
"font": "IBM Plex Sans",
"layout": {
"columns": 24,
"width": 1400,
"align": "center",
"widget_columns": 24,
"widget_rows": 10,
"spacing": 10
},
"palette": {
"text_color": "#122135",
"background_color": "#F4F8FF",
"link_color": "#0F62FE",
"chart_colors": [
"#0F62FE",
"#24A148",
"#8A3FFC",
"#FF832B",
"#009D9A",
"#D12771",
"#5D9CEC",
"#A56EFF"
]
},
"title_typeography": {
"font": "IBM Plex Sans",
"color": "#0F1E33",
"size": 22,
"weight": 700,
"align": "start"
},
"description_typeography": {
"font": "IBM Plex Sans",
"color": "#3A4B63",
"size": 14,
"weight": 400,
"align": "start"
},
"widget_type_defaults": {
"title": {
"columns": 24,
"rows": 1
},
"description": {
"columns": 24,
"rows": 1
},
"metric": {
"columns": 6,
"rows": 2
},
"horizontal-ruler": {
"columns": 24,
"rows": 1
},
"bar-chart": {
"columns": 12,
"rows": 7
},
"heatmap": {
"columns": 12,
"rows": 7
},
"funnel": {
"columns": 12,
"rows": 7
},
"box-plot": {
"columns": 12,
"rows": 7
},
"treemap": {
"columns": 12,
"rows": 7
},
"line-chart": {
"columns": 12,
"rows": 7
},
"scatter-chart": {
"columns": 12,
"rows": 7
},
"pie-chart": {
"columns": 12,
"rows": 7
},
"table": {
"columns": 24,
"rows": 8
}
},
"locale": "en_US"
}
Midnight Grid
{
"font": "Space Grotesk",
"layout": {
"columns": 24,
"width": 1320,
"align": "center",
"widget_columns": 24,
"widget_rows": 10,
"spacing": 14
},
"palette": {
"text_color": "#E6EEFF",
"background_color": "#0E1320",
"link_color": "#7FB3FF",
"chart_colors": [
"#4EA1FF",
"#2BD9A6",
"#FFC857",
"#E9724C",
"#C77DFF",
"#F07167",
"#9AD1D4",
"#6D9DC5"
]
},
"title_typeography": {
"font": "Space Grotesk",
"color": "#F4F7FF",
"size": 22,
"weight": 700,
"align": "start"
},
"description_typeography": {
"font": "Space Grotesk",
"color": "#B4C0D3",
"size": 14,
"weight": 400,
"align": "start"
},
"widget_type_defaults": {
"title": {
"columns": 24,
"rows": 1
},
"description": {
"columns": 24,
"rows": 1
},
"metric": {
"columns": 12,
"rows": 3
},
"horizontal-ruler": {
"columns": 24,
"rows": 1
},
"bar-chart": {
"columns": 24,
"rows": 10
},
"heatmap": {
"columns": 24,
"rows": 10
},
"funnel": {
"columns": 24,
"rows": 10
},
"box-plot": {
"columns": 24,
"rows": 10
},
"treemap": {
"columns": 24,
"rows": 10
},
"line-chart": {
"columns": 24,
"rows": 10
},
"scatter-chart": {
"columns": 24,
"rows": 10
},
"pie-chart": {
"columns": 24,
"rows": 9
},
"table": {
"columns": 24,
"rows": 12
}
},
"locale": "en_US"
}
Sepia Ledger
{
"font": "Source Serif Pro",
"layout": {
"columns": 24,
"width": 1180,
"align": "center",
"widget_columns": 24,
"widget_rows": 10,
"spacing": 16
},
"palette": {
"text_color": "#2F241B",
"background_color": "#F6F1E8",
"link_color": "#8C4E2D",
"chart_colors": [
"#8C4E2D",
"#4C6A92",
"#5B8E7D",
"#B06C49",
"#7D5A9E",
"#9B3D3D",
"#356859",
"#73503C"
]
},
"title_typeography": {
"font": "Source Serif Pro",
"color": "#2A1D15",
"size": 23,
"weight": 700,
"align": "start"
},
"description_typeography": {
"font": "Source Serif Pro",
"color": "#5A4C40",
"size": 14,
"weight": 400,
"align": "start"
},
"widget_type_defaults": {
"title": {
"columns": 24,
"rows": 2
},
"description": {
"columns": 24,
"rows": 2
},
"metric": {
"columns": 8,
"rows": 2
},
"horizontal-ruler": {
"columns": 24,
"rows": 1
},
"bar-chart": {
"columns": 16,
"rows": 8
},
"heatmap": {
"columns": 24,
"rows": 8
},
"funnel": {
"columns": 8,
"rows": 8
},
"box-plot": {
"columns": 16,
"rows": 8
},
"treemap": {
"columns": 16,
"rows": 9
},
"line-chart": {
"columns": 24,
"rows": 9
},
"scatter-chart": {
"columns": 16,
"rows": 8
},
"pie-chart": {
"columns": 8,
"rows": 8
},
"table": {
"columns": 24,
"rows": 11
}
},
"locale": "en_US"
}