From 0cac46d187dc274844e5e23e54872f5e338f2c0e Mon Sep 17 00:00:00 2001
From: Stephan Burns <34520077+Sleuth56@users.noreply.github.com>
Date: Mon, 11 May 2026 14:50:28 -0400
Subject: [PATCH] Fix broken datasource causing panels not to load
Signed-off-by: Stephan Burns <34520077+Sleuth56@users.noreply.github.com>
---
dashboards/vlagent.json | 365 +++++++++++++++++-----------------------
1 file changed, 156 insertions(+), 209 deletions(-)
diff --git a/dashboards/vlagent.json b/dashboards/vlagent.json
index 1d83fdd160..415604cabe 100644
--- a/dashboards/vlagent.json
+++ b/dashboards/vlagent.json
@@ -1,53 +1,4 @@
{
- "__inputs": [
- {
- "name": "DS_PROMETHEUS",
- "label": "prometheus",
- "description": "",
- "type": "datasource",
- "pluginId": "prometheus",
- "pluginName": "Prometheus"
- }
- ],
- "__elements": {},
- "__requires": [
- {
- "type": "grafana",
- "id": "grafana",
- "name": "Grafana",
- "version": "12.3.0"
- },
- {
- "type": "datasource",
- "id": "prometheus",
- "name": "Prometheus",
- "version": "1.0.0"
- },
- {
- "type": "panel",
- "id": "stat",
- "name": "Stat",
- "version": ""
- },
- {
- "type": "panel",
- "id": "table",
- "name": "Table",
- "version": ""
- },
- {
- "type": "panel",
- "id": "text",
- "name": "Text",
- "version": ""
- },
- {
- "type": "panel",
- "id": "timeseries",
- "name": "Time series",
- "version": ""
- }
- ],
"annotations": {
"list": [
{
@@ -71,7 +22,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"enable": true,
"expr": "sum(vm_app_version{job=~\"$job\", instance=~\"$instance\"}) by(short_version) unless (sum(vm_app_version{job=~\"$job\", instance=~\"$instance\"} offset $__interval) by(short_version))",
@@ -84,7 +35,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"enable": true,
"expr": "sum(changes(vm_app_start_timestamp{job=~\"$job\", instance=~\"$instance\"}[$__interval])) by(job, instance)",
@@ -181,14 +132,14 @@
"content": "
$version
",
"mode": "markdown"
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"title": "Version",
"type": "text"
},
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows number of generated error messages in logs over last 30m. Non-zero value may be a sign of connectivity or misconfiguration errors.",
"fieldConfig": {
@@ -244,12 +195,12 @@
"textMode": "auto",
"wideLayout": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"expr": "sum(increase(vm_log_messages_total{job=~\"$job\", instance=~\"$instance\", level!=\"info\"}[30m]))",
"interval": "",
@@ -263,7 +214,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Persistent queue size shows size of pending logs in bytes which hasn't been flushed to remote storage yet. \nIncreasing of value might be a sign of connectivity issues. In such cases, vlagent starts to flush pending data on disk with attempt to send it later once connection is restored.",
"fieldConfig": {
@@ -312,12 +263,12 @@
"textMode": "auto",
"wideLayout": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"expr": "sum(vlagent_remotewrite_pending_data_bytes{job=~\"$job\", instance=~\"$instance\"})",
"interval": "",
@@ -331,7 +282,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the cumulative number of log entries ingested. \n\nThe size is calculated before compression.",
"fieldConfig": {
@@ -375,12 +326,12 @@
"textMode": "auto",
"wideLayout": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(vl_bytes_ingested_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval]))",
@@ -396,7 +347,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Total number of available CPUs for selected vlagents. ",
"fieldConfig": {
@@ -444,12 +395,12 @@
"textMode": "auto",
"wideLayout": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -467,7 +418,7 @@
},
{
"datasource": {
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"fieldConfig": {
"defaults": {
@@ -581,16 +532,15 @@
"cellHeight": "sm",
"showHeader": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"expr": "sort((time() - vm_app_start_timestamp{job=~\"$job\", instance=~\"$instance\"}) or (up{job=~\"$job\", instance=~\"$instance\"}))",
"format": "table",
- "hide": false,
"instant": true,
"interval": "",
"legendFormat": "{{instance}}",
@@ -610,7 +560,7 @@
},
{
"datasource": {
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"fieldConfig": {
"defaults": {
@@ -695,12 +645,12 @@
"sort": "asc"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"expr": "sort(sum(up{job=~\"$job\", instance=~\"$instance\"}) by (job, instance))",
"format": "time_series",
@@ -716,7 +666,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Total size of available memory for selected vlagents.",
"fieldConfig": {
@@ -764,12 +714,12 @@
"textMode": "auto",
"wideLayout": true
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -801,7 +751,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows ingestion rate in number of log entries and bytes per second.",
"fieldConfig": {
@@ -905,17 +855,16 @@
"sort": "desc"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(vl_rows_ingested_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by (type) > 0",
"format": "time_series",
- "hide": false,
"intervalFactor": 1,
"legendFormat": "{{type}}",
"range": true,
@@ -924,11 +873,10 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(vl_bytes_ingested_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by (type) > 0",
- "hide": false,
"instant": false,
"legendFormat": "{{type}} (bytes)",
"range": true,
@@ -941,7 +889,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows the persistent queue size of pending logs in bytes >2MB which hasn't been flushed to remote storage yet. \n\nIncreasing of value might be a sign of connectivity issues. In such cases, vlagent starts to flush pending data on disk with attempt to send it later once connection is restored.\n\nRemote write URLs are hidden by default but might be unveiled once `-remoteWrite.showURL` is set to true.\n\nClick on the line and choose Drilldown to show the persistent queue size per instance.\n",
"fieldConfig": {
@@ -1041,12 +989,12 @@
"sort": "none"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"exemplar": true,
@@ -1063,7 +1011,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "* `*` - unsupported query path\n* `/insert` - [inserts](https://docs.victoriametrics.com/victorialogs/data-ingestion/)\n* `/select` - [reads](https://docs.victoriametrics.com/victorialogs/querying/)\n* `/metrics` - scraping of system metrics",
"fieldConfig": {
@@ -1151,12 +1099,12 @@
"sort": "desc"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vl_http_requests_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by (path) > 0",
@@ -1174,7 +1122,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows rate of dropped logs from persistent queue. vlagent drops log lines from queue if in-memory and on-disk queues are full and it is unable to flush them to remote storage.\nThe max size of on-disk queue is configured by `-remoteWrite.maxDiskUsagePerURL` flag.",
"fieldConfig": {
@@ -1267,12 +1215,12 @@
"sort": "none"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_persistentqueue_bytes_dropped_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by (path) > 0",
@@ -1288,7 +1236,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows the rate of logging the messages by their level. Unexpected spike in rate is a good reason to check logs.",
"fieldConfig": {
@@ -1376,18 +1324,17 @@
"sort": "desc"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"exemplar": true,
"expr": "sum(rate(vm_log_messages_total{job=~\"$job\",instance=~\"$instance\", level!=\"info\"}[$__rate_interval])) by (job, level) > 0",
"format": "time_series",
- "hide": false,
"interval": "5m",
"intervalFactor": 1,
"legendFormat": "{{job}} - {{level}}",
@@ -1401,7 +1348,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Errors rate shows rate for multiple metrics that track possible errors in vlagent, such as network or parsing errors.",
"fieldConfig": {
@@ -1494,12 +1441,12 @@
"sort": "desc"
}
},
- "pluginVersion": "12.3.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_http_request_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job, protocol) > 0",
@@ -1511,7 +1458,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_protoparser_read_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job, type) > 0",
@@ -1523,7 +1470,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_ingestserver_request_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job, type) > 0",
@@ -1535,7 +1482,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_protoparser_unmarshal_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job, type) > 0",
@@ -1547,7 +1494,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_promscrape_dial_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job) > 0",
@@ -1573,7 +1520,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Percentage of used RSS memory (resident).\nThe RSS memory shows the amount of memory recently accessed by the application. It includes anonymous memory and data from recently accessed files (aka page cache).\nThe application's performance will significantly degrade when memory usage is close to 100%.\n\nClick on the line and choose Drilldown to show memory usage per instance",
"fieldConfig": {
@@ -1662,12 +1609,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"exemplar": true,
@@ -1684,7 +1631,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"fieldConfig": {
"defaults": {
@@ -1772,12 +1719,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"exemplar": false,
@@ -1796,7 +1743,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Share for memory allocated by the process itself. When memory usage reaches 100% it will be likely OOM-killed.\nSafe memory usage % considered to be below 80%\n\nClick on the line and choose Drilldown to show memory usage per instance",
"fieldConfig": {
@@ -1879,12 +1826,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"exemplar": false,
@@ -1901,7 +1848,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows CPU pressure based on [Pressure Stall Information](https://docs.kernel.org/accounting/psi.html).\n\nThe lower the better.",
"fieldConfig": {
@@ -1981,12 +1928,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_cpu_waiting_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2000,7 +1947,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_cpu_stalled_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2019,7 +1966,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows memory pressure based on [Pressure Stall Information](https://docs.kernel.org/accounting/psi.html).\n\nThe lower the better.",
"fieldConfig": {
@@ -2099,12 +2046,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_memory_waiting_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2118,7 +2065,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_memory_stalled_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2137,7 +2084,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows the number of bytes read/write from the storage layer when vlagent has to buffer data on disk or read already buffered data.\n\nClick on the line and choose Drilldown to show CPU usage per instance",
"fieldConfig": {
@@ -2238,12 +2185,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(process_io_storage_read_bytes_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job) ",
@@ -2258,7 +2205,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(process_io_storage_written_bytes_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job)",
@@ -2277,7 +2224,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"fieldConfig": {
"defaults": {
@@ -2358,12 +2305,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(max_over_time(go_goroutines{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job)",
@@ -2381,7 +2328,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows IO pressure based on [Pressure Stall Information](https://docs.kernel.org/accounting/psi.html).\n\nThe lower the better.",
"fieldConfig": {
@@ -2461,12 +2408,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_io_waiting_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2480,7 +2427,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_pressure_io_stalled_seconds_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -2499,7 +2446,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"fieldConfig": {
"defaults": {
@@ -2580,12 +2527,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(max_over_time(process_num_threads{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job)",
@@ -2602,7 +2549,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Network usage shows the bytes rate for data accepted by vlagent and pushed via remotewrite protocol.\nDiscrepancies are possible because of different protocols used for ingesting, scraping and writing data.",
"fieldConfig": {
@@ -2697,12 +2644,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vm_tcplistener_read_bytes_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job) * 8 \n+ sum(rate(vm_promscrape_conn_bytes_read_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job) * 8",
@@ -2714,7 +2661,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"editorMode": "code",
"expr": "sum(rate(vlagent_remotewrite_conn_bytes_written_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job) * 8",
@@ -2730,7 +2677,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the percent of CPU spent on garbage collection.\n\nIf % is high, then CPU usage can be decreased by changing GOGC to higher values. Increasing GOGC value will increase memory usage, and decrease CPU usage.\n\nTry searching for keyword `GOGC` at https://docs.victoriametrics.com/victoriametrics/troubleshooting/ ",
"fieldConfig": {
@@ -2812,12 +2759,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "max(\n rate(go_gc_cpu_seconds_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval]) \n / rate(process_cpu_seconds_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])\n ) by(job)",
@@ -2835,7 +2782,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the time goroutines have spent in runnable state before actually running. The lower is better.\n\nHigh values or values exceeding the threshold is usually a sign of insufficient CPU resources or CPU throttling. \n\nVerify that service has enough CPU resources. Otherwise, the service could work unreliably with delays in processing.",
"fieldConfig": {
@@ -2917,12 +2864,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "max(histogram_quantile(0.99, sum(rate(go_sched_latencies_seconds_bucket{job=~\"$job\"}[$__rate_interval])) by (job, instance, le))) by(job)",
@@ -2940,7 +2887,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the rate of allocations in memory. Sudden increase in allocations would mean increased pressure on Go Garbage Collector and can saturate CPU resources of the application.",
"fieldConfig": {
@@ -3018,12 +2965,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(go_memstats_alloc_bytes_total{job=~\"$job\"}[$__rate_interval])) by (job, instance)",
@@ -3041,7 +2988,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Panel shows the percentage of open file descriptors in the OS per instance.\nReaching the limit of open files (100%) can cause various issues and must be prevented.\n\nSee how to change limits here https://medium.com/@muhammadtriwibowo/set-permanently-ulimit-n-open-files-in-ubuntu-4d61064429a",
"fieldConfig": {
@@ -3123,12 +3070,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "max(\n max_over_time(process_open_fds{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])\n /\n process_max_fds{job=~\"$job\", instance=~\"$instance\"}\n) by(job)",
@@ -3160,7 +3107,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows write saturation of the persistent queue. If the threshold of 0.9sec is reached, then the persistent queue is saturated by more than 90% and vlagent won't be able to keep up with flushing data on disk. In this case, consider to decrease load on the vlagent or improve the disk throughput.",
"fieldConfig": {
@@ -3244,12 +3191,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3266,7 +3213,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows read saturation of the persistent queue. If the threshold of 0.9sec is reached, then the persistent queue is saturated by more than 90% and vlagent won't be able to keep up with reading data from the disk. In this case, consider to decrease load on the vlagent or improve the disk throughput.",
"fieldConfig": {
@@ -3350,12 +3297,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3372,7 +3319,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the rate of dropped data blocks in cases when remote storage replies with `400 Bad Request` and `409 Conflict` HTTP responses.",
"fieldConfig": {
@@ -3455,12 +3402,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3477,7 +3424,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the rate of dropped log lines in cases when -remoteWrite.dropSamplesOnOverload or multiple -remoteWrite.disableOnDiskQueue options are set",
"fieldConfig": {
@@ -3560,12 +3507,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3582,7 +3529,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"fieldConfig": {
"defaults": {
@@ -3662,12 +3609,12 @@
}
]
},
- "pluginVersion": "9.2.3",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": false,
@@ -3709,7 +3656,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the number of restarts per job. The chart can be useful to identify periodic process restarts and correlate them with potential issues or anomalies. Normally, processes shouldn't restart unless restart was inited by user. The reason of restarts should be figured out by checking the logs of each specific service. ",
"fieldConfig": {
@@ -3791,12 +3738,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(changes(vm_app_start_timestamp{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval]) > 0) by(job)",
@@ -3826,7 +3773,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows how many concurrent inserts are taking place.\n\nIf the number of concurrent inserts hitting the `limit` or is close to the `limit` constantly - it might be a sign of a resource shortage.\n\n If vlagent's CPU usage and remote write connection saturation are at normal level, it might be that `-maxConcurrentInserts` cmd-line flag need to be increased.",
"fieldConfig": {
@@ -3906,12 +3853,12 @@
"sort": "desc"
}
},
- "pluginVersion": "9.2.6",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3924,7 +3871,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -3941,7 +3888,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"description": "Shows the rate of write errors in ingestserver (UDP, TCP connections) and HTTP server.",
"fieldConfig": {
@@ -4021,12 +3968,12 @@
"sort": "desc"
}
},
- "pluginVersion": "9.2.6",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"exemplar": true,
"expr": "sum(rate(vm_ingestserver_request_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(type, net) > 0",
@@ -4037,7 +3984,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"exemplar": true,
"expr": "sum(rate(vlagent_http_request_errors_total{job=~\"$job\", instance=~\"$instance\", protocol!=\"\"}[$__rate_interval])) by(protocol) > 0",
@@ -4066,7 +4013,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the rate of requests to configured remote write endpoints by url and status code.\n\nRemote write URLs are hidden by default but might be unveiled once `-remoteWrite.showURL` is set to true.\n\n",
"fieldConfig": {
@@ -4148,12 +4095,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4170,7 +4117,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the global rate for number of written bytes via remote write connections.",
"fieldConfig": {
@@ -4251,12 +4198,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4273,7 +4220,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows requests retry rate by url. Number of retries is unlimited but protected with delays up to 1m between attempts.\n\nRemote write URLs are hidden by default but might be unveiled once `-remoteWrite.showURL` is set to true.\n\n",
"fieldConfig": {
@@ -4354,12 +4301,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4376,7 +4323,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows current number of established connections to remote write endpoints.\n\n",
"fieldConfig": {
@@ -4457,12 +4404,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4479,7 +4426,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows saturation of every connection to remote storage. If the threshold of 90% is reached, then the connection is saturated (busy or slow) by more than 90%, so vlagent won't be able to keep up and can start buffering data. \n\nThis usually means that `-remoteWrite.queues` command-line flag must be increased in order to increase the number of connections per each remote storage.\n",
"fieldConfig": {
@@ -4560,12 +4507,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4614,7 +4561,7 @@
"content": "Drilldown row is used by other panels on the dashboard to show more detailed metrics per-instance.",
"mode": "markdown"
},
- "pluginVersion": "9.2.3",
+ "pluginVersion": "12.4.0",
"title": "",
"transparent": true,
"type": "text"
@@ -4622,7 +4569,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "",
"fieldConfig": {
@@ -4701,12 +4648,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": false,
@@ -4725,7 +4672,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the used memory (resident).\nThe application's performance will significantly degrade when memory usage is close to 100%.",
"fieldConfig": {
@@ -4804,12 +4751,12 @@
"sort": "desc"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4826,7 +4773,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the persistent queue size of pending samples in bytes which hasn't been flushed to remote storage yet. \n\nIncreasing of value might be a sign of connectivity issues. In such cases, vlagent starts to flush pending data on disk with attempt to send it later once connection is restored.\n\nRemote write URLs are hidden by default but might be unveiled once `-remoteWrite.showURL` is set to true.",
"fieldConfig": {
@@ -4913,12 +4860,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"exemplar": true,
@@ -4935,7 +4882,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"description": "Shows the number of bytes read/write from the storage layer when vlagent has to buffer data on disk or read already buffered data.",
"fieldConfig": {
@@ -5030,12 +4977,12 @@
"sort": "none"
}
},
- "pluginVersion": "11.5.0",
+ "pluginVersion": "12.4.0",
"targets": [
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_io_storage_read_bytes_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job, instance)",
@@ -5050,7 +4997,7 @@
{
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"editorMode": "code",
"expr": "sum(rate(process_io_storage_written_bytes_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])) by(job,instance)",
@@ -5088,7 +5035,7 @@
},
"includeAll": false,
"label": "Datasource",
- "name": "DS_PROMETHEUS",
+ "name": "ds",
"options": [],
"query": "prometheus",
"refresh": 1,
@@ -5099,7 +5046,7 @@
"current": {},
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"definition": "label_values(vm_app_version{version=~\"^vlagent.*\"}, job)",
"includeAll": true,
@@ -5119,7 +5066,7 @@
"current": {},
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "$ds"
},
"definition": "label_values(vm_app_version{job=~\"$job\"}, instance)",
"includeAll": true,
@@ -5139,7 +5086,7 @@
"current": {},
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"definition": "label_values(vlagent_remotewrite_requests_total{job=~\"$job\", instance=~\"$instance\"}, url)",
"description": "The remote write URLs",
@@ -5159,7 +5106,7 @@
"current": {},
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"definition": "label_values(vm_app_version{job=~\"$job\", instance=~\"$instance\"},short_version)",
"hide": 2,
@@ -5178,7 +5125,7 @@
"baseFilters": [],
"datasource": {
"type": "prometheus",
- "uid": "$DS_PROMETHEUS"
+ "uid": "${ds}"
},
"filters": [],
"name": "adhoc",
@@ -5209,4 +5156,4 @@
"version": 2,
"weekStart": "",
"id": null
-}
\ No newline at end of file
+}