Created
July 4, 2022 13:04
-
-
Save bboreham/9666e947aef3fc1c46b540600ae9c7b8 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"annotations": { | |
"list": [ | |
{ | |
"builtIn": 1, | |
"datasource": { | |
"type": "grafana", | |
"uid": "-- Grafana --" | |
}, | |
"enable": true, | |
"hide": true, | |
"iconColor": "rgba(0, 211, 255, 1)", | |
"name": "Annotations & Alerts", | |
"target": { | |
"limit": 100, | |
"matchAny": false, | |
"tags": [], | |
"type": "dashboard" | |
}, | |
"type": "dashboard" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"enable": true, | |
"expr": "ALERTS{alertname=\"MimirRolloutUnderway\", cluster=~\"$cluster\", namespace=~\"$namespace\", alertstate=\"firing\"}", | |
"hide": false, | |
"iconColor": "rgba(255, 96, 96, 1)", | |
"name": "rollouts", | |
"showIn": 0, | |
"tags": [], | |
"titleFormat": "{{cluster}}/{{namespace}}", | |
"type": "tags" | |
} | |
] | |
}, | |
"editable": true, | |
"fiscalYearStartMonth": 0, | |
"graphTooltip": 0, | |
"id": 244, | |
"iteration": 1656411875785, | |
"links": [ | |
{ | |
"asDropdown": true, | |
"icon": "external link", | |
"includeVars": true, | |
"keepTime": true, | |
"tags": [ | |
"mimir" | |
], | |
"targetBlank": false, | |
"title": "Mimir dashboards", | |
"type": "dashboards" | |
} | |
], | |
"liveNow": false, | |
"panels": [ | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 0 | |
}, | |
"id": 34, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Headlines", | |
"type": "row" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "short" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 0, | |
"y": 1 | |
}, | |
"id": 1, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cluster_namespace_job:cortex_distributor_received_samples:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "Samples / sec", | |
"type": "stat" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Exemplars / sec\nThe total number of received exemplars by the distributors, excluding rejected and deduped exemplars, but not necessarily ingested by the ingesters.\n\n", | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "short" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 4, | |
"y": 1 | |
}, | |
"id": 2, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cluster_namespace_job:cortex_distributor_received_exemplars:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "Exemplars / sec", | |
"type": "stat" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### In-memory series\nThe number of series not yet flushed to object storage that are held in ingester memory.\n\n", | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "short" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 8, | |
"y": 1 | |
}, | |
"id": 3, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cortex_ingester_memory_series{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}\n/ on(cluster, namespace) group_left\nmax by (cluster, namespace) (cortex_distributor_replication_factor{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"}))\n", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "In-memory series", | |
"type": "stat" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Exemplars in ingesters\nNumber of TSDB exemplars currently in ingesters' storage.\n\n", | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "short" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 12, | |
"y": 1 | |
}, | |
"id": 4, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cortex_ingester_tsdb_exemplar_exemplars_in_storage{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}\n/ on(cluster, namespace) group_left\nmax by (cluster, namespace) (cortex_distributor_replication_factor{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"}))\n", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "Exemplars in ingesters", | |
"type": "stat" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "short" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 16, | |
"y": 1 | |
}, | |
"id": 5, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "count(count by(user) (cortex_ingester_active_series{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}))", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "Tenants", | |
"type": "stat" | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "thresholds" | |
}, | |
"mappings": [], | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "reqps" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 3, | |
"w": 4, | |
"x": 20, | |
"y": 1 | |
}, | |
"id": 6, | |
"links": [], | |
"options": { | |
"colorMode": "none", | |
"graphMode": "none", | |
"justifyMode": "auto", | |
"orientation": "horizontal", | |
"reduceOptions": { | |
"calcs": [ | |
"mean" | |
], | |
"fields": "", | |
"values": false | |
}, | |
"textMode": "auto" | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"}[$__rate_interval]))", | |
"format": "time_series", | |
"instant": true, | |
"intervalFactor": 2, | |
"refId": "A" | |
} | |
], | |
"title": "Requests / sec", | |
"type": "stat" | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 4 | |
}, | |
"id": 35, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Gateway", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 0, | |
"y": 5 | |
}, | |
"hiddenSeries": false, | |
"id": 7, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 8, | |
"y": 5 | |
}, | |
"hiddenSeries": false, | |
"id": 8, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "1e3 * sum(cluster_job_route:cortex_request_duration_seconds_sum:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"}) / sum(cluster_job_route:cortex_request_duration_seconds_count:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"})", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "$datasource" | |
}, | |
"fieldConfig": { | |
"defaults": { | |
"color": { | |
"mode": "palette-classic" | |
}, | |
"custom": { | |
"axisLabel": "", | |
"axisPlacement": "auto", | |
"barAlignment": 0, | |
"drawStyle": "line", | |
"fillOpacity": 0, | |
"gradientMode": "none", | |
"hideFrom": { | |
"legend": false, | |
"tooltip": false, | |
"viz": false | |
}, | |
"lineInterpolation": "linear", | |
"lineWidth": 1, | |
"pointSize": 5, | |
"scaleDistribution": { | |
"type": "linear" | |
}, | |
"showPoints": "never", | |
"spanNulls": false, | |
"stacking": { | |
"group": "A", | |
"mode": "none" | |
}, | |
"thresholdsStyle": { | |
"mode": "off" | |
} | |
}, | |
"mappings": [], | |
"min": 0, | |
"thresholds": { | |
"mode": "absolute", | |
"steps": [ | |
{ | |
"color": "green", | |
"value": null | |
}, | |
{ | |
"color": "red", | |
"value": 80 | |
} | |
] | |
}, | |
"unit": "s" | |
}, | |
"overrides": [] | |
}, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 16, | |
"y": 5 | |
}, | |
"id": 9, | |
"links": [], | |
"options": { | |
"legend": { | |
"calcs": [], | |
"displayMode": "hidden", | |
"placement": "bottom" | |
}, | |
"tooltip": { | |
"mode": "multi", | |
"sort": "desc" | |
} | |
}, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"editorMode": "code", | |
"exemplar": true, | |
"expr": "histogram_quantile(0.99, sum by(le, pod) (rate(cortex_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((gateway|cortex-gw|cortex-gw-internal))\", route=~\"api_(v1|prom)_push\"}[$__rate_interval])))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "", | |
"range": true, | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"title": "Per pod p99 latency", | |
"type": "timeseries" | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 12 | |
}, | |
"id": 36, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Distributor", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 0, | |
"y": 13 | |
}, | |
"hiddenSeries": false, | |
"id": 10, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 8, | |
"y": 13 | |
}, | |
"hiddenSeries": false, | |
"id": 11, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "1e3 * sum(cluster_job_route:cortex_request_duration_seconds_sum:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"}) / sum(cluster_job_route:cortex_request_duration_seconds_count:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"})", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 0, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 16, | |
"y": 13 | |
}, | |
"hiddenSeries": false, | |
"id": 12, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": false, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum by(le, pod) (rate(cortex_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", route=~\"/distributor.Distributor/Push|/httpgrpc.*|api_(v1|prom)_push\"}[$__rate_interval])))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Per pod p99 latency", | |
"tooltip": { | |
"shared": true, | |
"sort": 2, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 20 | |
}, | |
"id": 37, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Ingester", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 0, | |
"y": 21 | |
}, | |
"hiddenSeries": false, | |
"id": 13, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\",route=\"/cortex.Ingester/Push\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 8, | |
"y": 21 | |
}, | |
"hiddenSeries": false, | |
"id": 14, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", route=\"/cortex.Ingester/Push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum by (le) (cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", route=\"/cortex.Ingester/Push\"})) * 1e3", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "1e3 * sum(cluster_job_route:cortex_request_duration_seconds_sum:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", route=\"/cortex.Ingester/Push\"}) / sum(cluster_job_route:cortex_request_duration_seconds_count:sum_rate{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", route=\"/cortex.Ingester/Push\"})", | |
"format": "time_series", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 0, | |
"fillGradient": 0, | |
"gridPos": { | |
"h": 7, | |
"w": 8, | |
"x": 16, | |
"y": 21 | |
}, | |
"hiddenSeries": false, | |
"id": 15, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": false, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"options": { | |
"alertThreshold": true | |
}, | |
"percentage": false, | |
"pluginVersion": "9.1.0-7d815a1dpre", | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum by(le, pod) (rate(cortex_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", route=\"/cortex.Ingester/Push\"}[$__rate_interval])))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"timeRegions": [], | |
"title": "Per pod p99 latency", | |
"tooltip": { | |
"shared": true, | |
"sort": 2, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
], | |
"yaxis": { | |
"align": false | |
} | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 28 | |
}, | |
"id": 38, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Distributor - key-value store for high-availability (HA) deduplication", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 0, | |
"y": 29 | |
}, | |
"id": 16, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-hatracker\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 12, | |
"y": 29 | |
}, | |
"id": 17, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-hatracker\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-hatracker\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_kv_request_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-hatracker\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-hatracker\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 36 | |
}, | |
"id": 39, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Distributor - key-value store for distributors ring", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 0, | |
"y": 37 | |
}, | |
"id": 18, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-(lifecycler|ring)\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 12, | |
"y": 37 | |
}, | |
"id": 19, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-(lifecycler|ring)\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-(lifecycler|ring)\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_kv_request_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-(lifecycler|ring)\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\", kv_name=~\"distributor-(lifecycler|ring)\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 44 | |
}, | |
"id": 40, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Ingester - key-value store for the ingesters ring", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"1xx": "#EAB839", | |
"2xx": "#7EB26D", | |
"3xx": "#6ED0E0", | |
"4xx": "#EF843C", | |
"5xx": "#E24D42", | |
"error": "#E24D42", | |
"success": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 0, | |
"y": 45 | |
}, | |
"id": 20, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum by (status) (\n label_replace(label_replace(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", kv_name=~\"ingester-.*\"}[$__rate_interval]),\n \"status\", \"${1}xx\", \"status_code\", \"([0-9])..\"),\n \"status\", \"${1}\", \"status_code\", \"([a-z]+)\"))\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "{{status}}", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Requests / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 12, | |
"y": 45 | |
}, | |
"id": 21, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", kv_name=~\"ingester-.*\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum(rate(cortex_kv_request_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", kv_name=~\"ingester-.*\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_kv_request_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", kv_name=~\"ingester-.*\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_kv_request_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\", kv_name=~\"ingester-.*\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 52 | |
}, | |
"id": 41, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Ingester - shipper", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"failed": "#E24D42", | |
"successful": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Uploaded blocks / sec\nThe rate of blocks being uploaded from the ingesters\nto object storage.\n\n", | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 0, | |
"y": 53 | |
}, | |
"id": 22, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_shipper_uploads_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) - sum(rate(cortex_ingester_shipper_upload_failures_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "successful", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_shipper_upload_failures_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "failed", | |
"refId": "B", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Uploaded blocks / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Upload latency\nThe average, median (50th percentile), and 99th percentile time\nthe ingesters take to upload blocks to object storage.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 12, | |
"y": 53 | |
}, | |
"id": 23, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum(rate(thanos_objstore_bucket_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\",component=\"ingester\",operation=\"upload\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum(rate(thanos_objstore_bucket_operation_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\",component=\"ingester\",operation=\"upload\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(thanos_objstore_bucket_operation_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\",component=\"ingester\",operation=\"upload\"}[$__rate_interval])) * 1e3 / sum(rate(thanos_objstore_bucket_operation_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\",component=\"ingester\",operation=\"upload\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Upload latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 60 | |
}, | |
"id": 42, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Ingester - TSDB head", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"failed": "#E24D42", | |
"successful": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Compactions per second\nIngesters maintain a local TSDB per-tenant on disk. Each TSDB maintains a single head block holding the most recent\nsamples of all its active time series; the head block gets periodically compacted into a persistent block (by default, every 2h).\nThis panel shows the rate of compaction operations across all TSDBs on all ingesters.\n\n", | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 0, | |
"y": 61 | |
}, | |
"id": 24, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_compactions_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "successful", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_compactions_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "failed", | |
"refId": "B", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Compactions / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Compaction latency\nThe average, median (50th percentile), and 99th percentile time ingesters take to compact TSDB head blocks\non the local filesystem.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 12, | |
"x": 12, | |
"y": 61 | |
}, | |
"id": 25, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.99, sum(rate(cortex_ingester_tsdb_compaction_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "99th Percentile", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "histogram_quantile(0.50, sum(rate(cortex_ingester_tsdb_compaction_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) by (le)) * 1e3", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "50th Percentile", | |
"refId": "B", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_compaction_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) * 1e3 / sum(rate(cortex_ingester_tsdb_compaction_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "Average", | |
"refId": "C", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Compactions latency", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ms", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 68 | |
}, | |
"id": 43, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Ingester - TSDB write ahead log (WAL)", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": { | |
"failed": "#E24D42", | |
"successful": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### WAL truncations per second\nThe WAL is truncated each time a new TSDB block is written. This panel measures the rate of\ntruncations.\n\n", | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 0, | |
"y": 69 | |
}, | |
"id": 26, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_wal_truncations_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) - sum(rate(cortex_ingester_tsdb_wal_truncations_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "successful", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_wal_truncations_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "failed", | |
"refId": "B", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "WAL truncations / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": { | |
"failed": "#E24D42", | |
"successful": "#7EB26D" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Checkpoints created per second\nCheckpoints are created as part of the WAL truncation process.\nThis metric measures the rate of checkpoint creation.\n\n", | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 6, | |
"y": 69 | |
}, | |
"id": 27, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_checkpoint_creations_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) - sum(rate(cortex_ingester_tsdb_checkpoint_creations_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "successful", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_checkpoint_creations_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "failed", | |
"refId": "B", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Checkpoints created / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "short", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### WAL truncations latency (including checkpointing)\nAverage time taken to perform a full WAL truncation,\nincluding the time taken for the checkpointing to complete.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 12, | |
"y": 69 | |
}, | |
"id": 28, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_wal_truncate_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval])) / sum(rate(cortex_ingester_tsdb_wal_truncate_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "avg", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "WAL truncations latency (includes checkpointing)", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": { | |
"WAL": "#E24D42", | |
"mmap-ed chunks": "#E28A42" | |
}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"fill": 10, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 18, | |
"y": 69 | |
}, | |
"id": 29, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 0, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": true, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_wal_corruptions_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "WAL", | |
"refId": "A", | |
"step": 10 | |
}, | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(rate(cortex_ingester_tsdb_mmap_chunk_corruptions_total{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}[$__rate_interval]))", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "mmap-ed chunks", | |
"refId": "B", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Corruptions / sec", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ops", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"collapsed": false, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"gridPos": { | |
"h": 1, | |
"w": 24, | |
"x": 0, | |
"y": 76 | |
}, | |
"id": 44, | |
"panels": [], | |
"targets": [ | |
{ | |
"datasource": { | |
"type": "prometheus", | |
"uid": "P1809F7CD0C75ACF3" | |
}, | |
"refId": "A" | |
} | |
], | |
"title": "Exemplars", | |
"type": "row" | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Distributor exemplars incoming rate\nThe rate of exemplars that have come in to the distributor, including rejected or deduped exemplars.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 0, | |
"y": 77 | |
}, | |
"id": 30, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cluster_namespace_job:cortex_distributor_exemplars_in:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "incoming exemplars", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Distributor exemplars incoming rate", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ex/s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Distributor exemplars received rate\nThe rate of received exemplars, excluding rejected and deduped exemplars.\nThis number can be sensibly lower than incoming rate because we dedupe the HA sent exemplars, and then reject based on time, see `cortex_discarded_exemplars_total` for specific reasons rates.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 6, | |
"y": 77 | |
}, | |
"id": 31, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(cluster_namespace_job:cortex_distributor_received_exemplars:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "received exemplars", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Distributor exemplars received rate", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ex/s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Ingester ingested exemplars rate\nThe rate of exemplars ingested in the ingesters.\nEvery exemplar is sent to the replication factor number of ingesters, so the sum of rates from all ingesters is divided by the replication factor.\nThis ingested exemplars rate should match the distributor's received exemplars rate.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 12, | |
"y": 77 | |
}, | |
"id": 32, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(\n cluster_namespace_job:cortex_ingester_ingested_exemplars:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}\n / on(cluster, namespace) group_left\n max by (cluster, namespace) (cortex_distributor_replication_factor{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})\n)\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "ingested exemplars", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Ingester ingested exemplars rate", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ex/s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
}, | |
{ | |
"aliasColors": {}, | |
"bars": false, | |
"dashLength": 10, | |
"dashes": false, | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"description": "### Ingester appended exemplars rate\nThe rate of exemplars appended in the ingesters.\nThis can be lower than ingested exemplars rate since TSDB does not append the same exemplar twice, and those can be frequent.\n\n", | |
"fill": 1, | |
"gridPos": { | |
"h": 7, | |
"w": 6, | |
"x": 18, | |
"y": 77 | |
}, | |
"id": 33, | |
"legend": { | |
"avg": false, | |
"current": false, | |
"max": false, | |
"min": false, | |
"show": true, | |
"total": false, | |
"values": false | |
}, | |
"lines": true, | |
"linewidth": 1, | |
"links": [], | |
"nullPointMode": "null as zero", | |
"percentage": false, | |
"pointradius": 5, | |
"points": false, | |
"renderer": "flot", | |
"seriesOverrides": [], | |
"spaceLength": 10, | |
"stack": false, | |
"steppedLine": false, | |
"targets": [ | |
{ | |
"datasource": { | |
"uid": "$datasource" | |
}, | |
"expr": "sum(\n cluster_namespace_job:cortex_ingester_tsdb_exemplar_exemplars_appended:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/((ingester.*|cortex|mimir))\"}\n / on(cluster, namespace) group_left\n max by (cluster, namespace) (cortex_distributor_replication_factor{cluster=~\"$cluster\", job=~\"($namespace)/((m3-aggregations-)?(distributor|cortex|mimir))\"})\n)\n", | |
"format": "time_series", | |
"interval": "15s", | |
"intervalFactor": 2, | |
"legendFormat": "appended exemplars", | |
"refId": "A", | |
"step": 10 | |
} | |
], | |
"thresholds": [], | |
"title": "Ingester appended exemplars rate", | |
"tooltip": { | |
"shared": false, | |
"sort": 0, | |
"value_type": "individual" | |
}, | |
"type": "graph", | |
"xaxis": { | |
"mode": "time", | |
"show": true, | |
"values": [] | |
}, | |
"yaxes": [ | |
{ | |
"format": "ex/s", | |
"logBase": 1, | |
"min": 0, | |
"show": true | |
}, | |
{ | |
"format": "short", | |
"logBase": 1, | |
"show": false | |
} | |
] | |
} | |
], | |
"refresh": "10s", | |
"schemaVersion": 36, | |
"style": "dark", | |
"tags": [ | |
"mimir" | |
], | |
"templating": { | |
"list": [ | |
{ | |
"current": { | |
"selected": false, | |
"text": "ops-cortex", | |
"value": "ops-cortex" | |
}, | |
"hide": 0, | |
"includeAll": false, | |
"label": "Data Source", | |
"multi": false, | |
"name": "datasource", | |
"options": [], | |
"query": "prometheus", | |
"refresh": 1, | |
"regex": "", | |
"skipUrlSync": false, | |
"type": "datasource" | |
}, | |
{ | |
"allValue": ".+", | |
"current": { | |
"selected": false, | |
"text": [ | |
"prod-us-east-0" | |
], | |
"value": [ | |
"prod-us-east-0" | |
] | |
}, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "$datasource" | |
}, | |
"definition": "", | |
"hide": 0, | |
"includeAll": true, | |
"label": "cluster", | |
"multi": true, | |
"name": "cluster", | |
"options": [], | |
"query": { | |
"query": "label_values(cortex_build_info, cluster)", | |
"refId": "ops-cortex-cluster-Variable-Query" | |
}, | |
"refresh": 1, | |
"regex": "", | |
"skipUrlSync": false, | |
"sort": 2, | |
"tagValuesQuery": "", | |
"tagsQuery": "", | |
"type": "query", | |
"useTags": false | |
}, | |
{ | |
"allValue": ".+", | |
"current": { | |
"selected": false, | |
"text": [ | |
"mimir-dedicated-20" | |
], | |
"value": [ | |
"mimir-dedicated-20" | |
] | |
}, | |
"datasource": { | |
"type": "prometheus", | |
"uid": "$datasource" | |
}, | |
"definition": "", | |
"hide": 0, | |
"includeAll": true, | |
"label": "namespace", | |
"multi": true, | |
"name": "namespace", | |
"options": [], | |
"query": { | |
"query": "label_values(cortex_build_info{cluster=~\"$cluster\"}, namespace)", | |
"refId": "ops-cortex-namespace-Variable-Query" | |
}, | |
"refresh": 1, | |
"regex": "", | |
"skipUrlSync": false, | |
"sort": 2, | |
"tagValuesQuery": "", | |
"tagsQuery": "", | |
"type": "query", | |
"useTags": false | |
} | |
] | |
}, | |
"time": { | |
"from": "now-1h", | |
"to": "now" | |
}, | |
"timepicker": { | |
"refresh_intervals": [ | |
"5s", | |
"10s", | |
"30s", | |
"1m", | |
"5m", | |
"15m", | |
"30m", | |
"1h", | |
"2h", | |
"1d" | |
], | |
"time_options": [ | |
"5m", | |
"15m", | |
"1h", | |
"6h", | |
"12h", | |
"24h", | |
"2d", | |
"7d", | |
"30d" | |
] | |
}, | |
"timezone": "", | |
"title": "Mimir / Writes", | |
"uid": "8280707b8f16e7b87b840fc1cc92d4c5", | |
"version": 1, | |
"weekStart": "" | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment