From 815d78ffd2135e845b5ea7a3b90a6b8e71b67368 Mon Sep 17 00:00:00 2001 From: Kiichiro YUKAWA Date: Tue, 23 Apr 2024 09:20:01 +0900 Subject: [PATCH] :chart_with_upwards_trend: Add client metrics panels for continuous benchmark job (#2481) Signed-off-by: vankichi --- .../10-vald-benchmark-operator.yaml | 656 +++++++++++++++--- 1 file changed, 561 insertions(+), 95 deletions(-) diff --git a/k8s/metrics/grafana/dashboards/10-vald-benchmark-operator.yaml b/k8s/metrics/grafana/dashboards/10-vald-benchmark-operator.yaml index e14dd51bbe8..737db1218e6 100644 --- a/k8s/metrics/grafana/dashboards/10-vald-benchmark-operator.yaml +++ b/k8s/metrics/grafana/dashboards/10-vald-benchmark-operator.yaml @@ -108,7 +108,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -188,7 +188,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -267,7 +267,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -350,7 +350,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -435,7 +435,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -515,7 +515,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -595,7 +595,7 @@ data: "wideLayout": true }, "pluginVersin": "8.0.1", - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -664,7 +664,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -734,7 +734,7 @@ data: "textMode": 
"auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -803,7 +803,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -872,7 +872,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -952,7 +952,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -1021,7 +1021,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -1091,7 +1091,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -1160,7 +1160,7 @@ data: "textMode": "auto", "wideLayout": true }, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "targets": [ { "datasource": { @@ -1187,9 +1187,9 @@ data: "x": 0, "y": 12 }, - "id": 39, + "id": 51, "panels": [], - "title": "Operator Metrics", + "title": "Benchmark Job Metrics", "type": "row" }, { @@ -1216,7 +1216,315 @@ data: "y": 13 }, "hiddenSeries": false, - "id": 22, + "id": 48, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "10.4.2", + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "disableTextWrap": false, + "editorMode": "code", + "exemplar": true, + "expr": 
"sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", pod=~\"$JobPodName\", image=~\".*$JobReplicaSet.*\"}[$interval])) by (pod) and on() count(kube_pod_created{pod=~\"$JobPodName\"}) >= 1", + "fullMetaSearch": false, + "includeNullMetadata": true, + "interval": "", + "legendFormat": "{{pod}}", + "range": true, + "refId": "A", + "useBackend": false + } + ], + "thresholds": [], + "timeRegions": [], + "title": "CPU", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:76", + "format": "short", + "logBase": 1, + "min": "0", + "show": true + }, + { + "$$hashKey": "object:77", + "format": "short", + "logBase": 1, + "show": true + } + ], + "yaxis": { + "align": false + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "fieldConfig": { + "defaults": { + "links": [] + }, + "overrides": [] + }, + "fill": 0, + "fillGradient": 0, + "gridPos": { + "h": 8, + "w": 12, + "x": 12, + "y": 13 + }, + "hiddenSeries": false, + "id": 54, + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "10.4.2", + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", pod=~\"$JobPodName\", image=~\".*$JobReplicaSet.*\"}) by (pod) and on() count(kube_pod_created{pod=~\"$JobPodName\"}) >= 1", + 
"interval": "", + "legendFormat": "{{pod}}", + "range": true, + "refId": "A" + } + ], + "thresholds": [], + "timeRegions": [], + "title": "Memory working set", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "show": true, + "values": [] + }, + "yaxes": [ + { + "$$hashKey": "object:154", + "format": "decbytes", + "logBase": 1, + "min": "0", + "show": true + }, + { + "$$hashKey": "object:155", + "format": "short", + "logBase": 1, + "show": true + } + ], + "yaxis": { + "align": false + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "fieldConfig": { + "defaults": { + "links": [] + }, + "overrides": [] + }, + "fill": 0, + "fillGradient": 0, + "gridPos": { + "h": 8, + "w": 12, + "x": 0, + "y": 21 + }, + "hiddenSeries": false, + "id": 49, + "interval": "", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "10.4.2", + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "editorMode": "code", + "expr": "sum(irate(client_completed_rpcs{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])) by (grpc_client_method, grpc_client_status)", + "interval": "", + "intervalFactor": 1, + "legendFormat": "{{grpc_client_method}} ({{grpc_client_status}})", + "range": true, + "refId": "A" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "editorMode": "code", + "expr": 
"sum(irate(client_completed_rpcs{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])) by (grpc_client_status)", + "interval": "", + "intervalFactor": 1, + "legendFormat": "Total ({{grpc_client_status}})", + "range": true, + "refId": "B" + } + ], + "thresholds": [], + "timeRegions": [], + "title": "Completed RPCs /s", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "min": "0", + "show": true + }, + { + "format": "short", + "logBase": 1, + "show": true + } + ], + "yaxis": { + "align": false + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "fieldConfig": { + "defaults": { + "links": [] + }, + "overrides": [] + }, + "fill": 0, + "fillGradient": 0, + "gridPos": { + "h": 8, + "w": 12, + "x": 12, + "y": 21 + }, + "hiddenSeries": false, + "id": 50, + "interval": "", "legend": { "avg": false, "current": false, @@ -1233,7 +1541,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1248,10 +1556,10 @@ data: "uid": "prometheus" }, "editorMode": "code", - "exemplar": true, - "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube_statefulset_created{statefulset=\"$ReplicaSet\"}) >= 1", + "expr": "histogram_quantile(0.5, sum(rate(client_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])) by (le, grpc_client_method))", "interval": "", - "legendFormat": "{{pod}}", + "intervalFactor": 1, + "legendFormat": 
"{{grpc_client_method}} p50", "range": true, "refId": "A" }, @@ -1261,11 +1569,10 @@ data: "uid": "prometheus" }, "editorMode": "code", - "exemplar": true, - "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube_deployment_created{deployment=\"$ReplicaSet\"}) >= 1", - "hide": false, + "expr": "histogram_quantile(0.95, sum(rate(client_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])) by (le, grpc_client_method))", "interval": "", - "legendFormat": "{{pod}}", + "intervalFactor": 1, + "legendFormat": "{{grpc_client_method}} p95", "range": true, "refId": "B" }, @@ -1275,18 +1582,17 @@ data: "uid": "prometheus" }, "editorMode": "code", - "exemplar": true, - "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube_daemonset_created{daemonset=\"$ReplicaSet\"}) >= 1", - "hide": false, + "expr": "histogram_quantile(0.99, sum(rate(client_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])) by (le, grpc_client_method))", "interval": "", - "legendFormat": "{{pod}}", + "intervalFactor": 1, + "legendFormat": "{{grpc_client_method}} p99", "range": true, "refId": "C" } ], "thresholds": [], "timeRegions": [], - "title": "CPU", + "title": "Latency", "tooltip": { "shared": true, "sort": 0, @@ -1300,14 +1606,12 @@ data: }, "yaxes": [ { - "$$hashKey": "object:76", - "format": "short", + "format": "ms", "logBase": 1, "min": "0", "show": true }, { - "$$hashKey": "object:77", "format": "short", "logBase": 1, "show": true @@ -1337,11 +1641,11 @@ data: "gridPos": { "h": 8, "w": 12, - "x": 12, - "y": 13 + "x": 0, + "y": 29 }, "hiddenSeries": false, - "id": 27, + "id": 52, 
"legend": { "avg": false, "current": false, @@ -1358,7 +1662,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1373,45 +1677,114 @@ data: "uid": "prometheus" }, "editorMode": "code", - "exemplar": true, - "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_statefulset_created{statefulset=\"$ReplicaSet\"}) >= 1", + "expr": "goroutine_count{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=~\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}", "interval": "", - "legendFormat": "{{pod}}", + "intervalFactor": 1, + "legendFormat": "{{target_pod}}", "range": true, "refId": "A" + } + ], + "thresholds": [], + "timeRegions": [], + "title": "goroutine count", + "tooltip": { + "shared": true, + "sort": 0, + "value_type": "individual" + }, + "type": "graph", + "xaxis": { + "mode": "time", + "show": true, + "values": [] + }, + "yaxes": [ + { + "format": "short", + "logBase": 1, + "min": "0", + "show": true }, { - "datasource": { - "type": "prometheus", - "uid": "prometheus" - }, - "editorMode": "code", - "exemplar": true, - "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_deployment_created{deployment=\"$ReplicaSet\"}) >= 1", - "hide": false, - "interval": "", - "legendFormat": "{{pod}}", - "range": true, - "refId": "B" + "format": "short", + "logBase": 1, + "show": true + } + ], + "yaxis": { + "align": false + } + }, + { + "aliasColors": {}, + "bars": false, + "dashLength": 10, + "dashes": false, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "fieldConfig": { + "defaults": { + "links": [] }, + "overrides": [] + }, + "fill": 0, + "fillGradient": 0, + "gridPos": { + "h": 8, + "w": 12, + "x": 12, + "y": 
29 + }, + "hiddenSeries": false, + "id": 53, + "interval": "", + "legend": { + "avg": false, + "current": false, + "max": false, + "min": false, + "show": true, + "total": false, + "values": false + }, + "lines": true, + "linewidth": 1, + "nullPointMode": "null", + "options": { + "alertThreshold": true + }, + "percentage": false, + "pluginVersion": "10.4.2", + "pointradius": 2, + "points": false, + "renderer": "flot", + "seriesOverrides": [], + "spaceLength": 10, + "stack": false, + "steppedLine": false, + "targets": [ { "datasource": { "type": "prometheus", "uid": "prometheus" }, "editorMode": "code", - "exemplar": true, - "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_daemonset_created{daemonset=\"$ReplicaSet\"}) >= 1", - "hide": false, + "expr": "increase(gc_count{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=~\"$JobReplicaSet\", target_pod=~\"$JobPodName\"}[$interval])", + "format": "time_series", + "instant": false, "interval": "", - "legendFormat": "{{pod}}", - "range": true, - "refId": "C" + "intervalFactor": 1, + "legendFormat": "{{target_pod}}", + "refId": "A" } ], "thresholds": [], "timeRegions": [], - "title": "Memory working set", + "title": "GC count /s", "tooltip": { "shared": true, "sort": 0, @@ -1425,14 +1798,11 @@ data: }, "yaxes": [ { - "$$hashKey": "object:154", - "format": "decbytes", + "format": "short", "logBase": 1, - "min": "0", "show": true }, { - "$$hashKey": "object:155", "format": "short", "logBase": 1, "show": true @@ -1442,6 +1812,19 @@ data: "align": false } }, + { + "collapsed": false, + "gridPos": { + "h": 1, + "w": 24, + "x": 0, + "y": 37 + }, + "id": 39, + "panels": [], + "title": "Operator Metrics", + "type": "row" + }, { "aliasColors": {}, "bars": false, @@ -1463,11 +1846,10 @@ data: "h": 8, "w": 12, "x": 0, - "y": 21 + "y": 38 }, "hiddenSeries": false, - "id": 30, - "interval": "", + "id": 22, "legend": {
"avg": false, "current": false, @@ -1484,7 +1866,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1499,10 +1881,10 @@ data: "uid": "prometheus" }, "editorMode": "code", - "expr": "sum(irate(server_completed_rpcs{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$ReplicaSet\", target_pod=~\"$PodName\"}[$interval])) by (grpc_server_method, grpc_server_status)", + "exemplar": true, + "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube_statefulset_created{statefulset=\"$ReplicaSet\"}) >= 1", "interval": "", - "intervalFactor": 1, - "legendFormat": "{{grpc_server_method}} ({{grpc_server_status}})", + "legendFormat": "{{pod}}", "range": true, "refId": "A" }, @@ -1512,17 +1894,32 @@ data: "uid": "prometheus" }, "editorMode": "code", - "expr": "sum(irate(server_completed_rpcs{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$ReplicaSet\", target_pod=~\"$PodName\"}[$interval])) by (grpc_server_status)", + "exemplar": true, + "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube_deployment_created{deployment=\"$ReplicaSet\"}) >= 1", + "hide": false, "interval": "", - "intervalFactor": 1, - "legendFormat": "Total ({{grpc_server_status}})", + "legendFormat": "{{pod}}", "range": true, "refId": "B" + }, + { + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "editorMode": "code", + "exemplar": true, + "expr": "sum(irate(container_cpu_usage_seconds_total{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}[$interval])) by (pod) and on() count(kube{daemonset=\"$ReplicaSet\"}) >= 1", + "hide": false, + "interval": "", + 
"legendFormat": "{{pod}}", + "range": true, + "refId": "C" } ], "thresholds": [], "timeRegions": [], - "title": "Completed RPCs /s", + "title": "CPU", "tooltip": { "shared": true, "sort": 0, @@ -1536,12 +1933,14 @@ data: }, "yaxes": [ { + "$$hashKey": "object:76", "format": "short", "logBase": 1, "min": "0", "show": true }, { + "$$hashKey": "object:77", "format": "short", "logBase": 1, "show": true @@ -1572,11 +1971,10 @@ data: "h": 8, "w": 12, "x": 12, - "y": 21 + "y": 38 }, "hiddenSeries": false, - "id": 32, - "interval": "", + "id": 27, "legend": { "avg": false, "current": false, @@ -1593,7 +1991,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1608,10 +2006,10 @@ data: "uid": "prometheus" }, "editorMode": "code", - "expr": "histogram_quantile(0.5, sum(rate(server_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$ReplicaSet\", target_pod=~\"$PodName\"}[$interval])) by (le, grpc_server_method))", + "exemplar": true, + "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_statefulset_created{statefulset=\"$ReplicaSet\"}) >= 1", "interval": "", - "intervalFactor": 1, - "legendFormat": "{{grpc_server_method}} p50", + "legendFormat": "{{pod}}", "range": true, "refId": "A" }, @@ -1621,10 +2019,11 @@ data: "uid": "prometheus" }, "editorMode": "code", - "expr": "histogram_quantile(0.95, sum(rate(server_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$ReplicaSet\", target_pod=~\"$PodName\"}[$interval])) by (le, grpc_server_method))", + "exemplar": true, + "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_deployment_created{deployment=\"$ReplicaSet\"}) >= 1", + "hide": 
false, "interval": "", - "intervalFactor": 1, - "legendFormat": "{{grpc_server_method}} p95", + "legendFormat": "{{pod}}", "range": true, "refId": "B" }, @@ -1634,17 +2033,18 @@ data: "uid": "prometheus" }, "editorMode": "code", - "expr": "histogram_quantile(0.99, sum(rate(server_latency_bucket{exported_kubernetes_namespace=\"$Namespace\", kubernetes_name=\"$ReplicaSet\", target_pod=~\"$PodName\"}[$interval])) by (le, grpc_server_method))", + "exemplar": true, + "expr": "sum(container_memory_working_set_bytes{namespace=\"$Namespace\", container=\"$ReplicaSet\", pod=~\"$PodName\", image!=\"\"}) by (pod) and on() count(kube_daemonset_created{daemonset=\"$ReplicaSet\"}) >= 1", + "hide": false, "interval": "", - "intervalFactor": 1, - "legendFormat": "{{grpc_server_method}} p99", + "legendFormat": "{{pod}}", "range": true, "refId": "C" } ], "thresholds": [], "timeRegions": [], - "title": "Latency", + "title": "Memory working set", "tooltip": { "shared": true, "sort": 0, @@ -1658,12 +2058,14 @@ data: }, "yaxes": [ { - "format": "ms", + "$$hashKey": "object:154", + "format": "decbytes", "logBase": 1, "min": "0", "show": true }, { + "$$hashKey": "object:155", "format": "short", "logBase": 1, "show": true @@ -1694,7 +2096,7 @@ data: "h": 8, "w": 12, "x": 0, - "y": 29 + "y": 46 }, "hiddenSeries": false, "id": 36, @@ -1714,7 +2116,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1789,7 +2191,7 @@ data: "h": 8, "w": 12, "x": 12, - "y": 29 + "y": 46 }, "hiddenSeries": false, "id": 38, @@ -1810,7 +2212,7 @@ data: "alertThreshold": true }, "percentage": false, - "pluginVersion": "10.4.0", + "pluginVersion": "10.4.2", "pointradius": 2, "points": false, "renderer": "flot", @@ -1933,7 +2335,7 @@ data: { "allValue": ".+", "current": { - "selected": false, + "selected": true, "text": "All", "value": "$__all" }, @@ -1961,6 +2363,69 @@ data: "type": "query", 
"useTags": false }, + { + "current": { + "selected": false, + "text": "vald-benchmark-job", + "value": "vald-benchmark-job" + }, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "definition": "label_values(app_version_info{server_name=~\"benchmark job.*\"},kubernetes_name)", + "hide": 0, + "includeAll": false, + "label": "job_name", + "multi": false, + "name": "JobReplicaSet", + "options": [], + "query": { + "qryType": 1, + "query": "label_values(app_version_info{server_name=~\"benchmark job.*\"},kubernetes_name)", + "refId": "PrometheusVariableQueryEditor-VariableQuery" + }, + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tagsQuery": "", + "type": "query", + "useTags": false + }, + { + "allValue": ".+", + "current": { + "selected": false, + "text": "All", + "value": "$__all" + }, + "datasource": { + "type": "prometheus", + "uid": "prometheus" + }, + "definition": "label_values(app_version_info{server_name=~\"benchmark job.*\", kubernetes_name=~\"$JobReplicaSet\"},target_pod)", + "hide": 0, + "includeAll": true, + "label": "job_pod", + "multi": false, + "name": "JobPodName", + "options": [], + "query": { + "qryType": 1, + "query": "label_values(app_version_info{server_name=~\"benchmark job.*\", kubernetes_name=~\"$JobReplicaSet\"},target_pod)", + "refId": "PrometheusVariableQueryEditor-VariableQuery" + }, + "refresh": 1, + "regex": "", + "skipUrlSync": false, + "sort": 0, + "tagValuesQuery": "", + "tagsQuery": "", + "type": "query", + "useTags": false + }, { "auto": false, "auto_count": 30, @@ -2021,6 +2486,7 @@ data: } ], "query": "1m,2m,5m,10m,30m,1h,6h,12h,1d", + "queryValue": "", "refresh": 2, "skipUrlSync": false, "type": "interval"