|
@@ -0,0 +1,304 @@
|
|
|
+{
|
|
|
+ "__inputs": [
|
|
|
+ {
|
|
|
+ "name": "DS_TELEMETRY-POSTGRES",
|
|
|
+ "label": "telemetry-postgres",
|
|
|
+ "description": "",
|
|
|
+ "type": "datasource",
|
|
|
+ "pluginId": "postgres",
|
|
|
+ "pluginName": "PostgreSQL"
|
|
|
+ }
|
|
|
+ ],
|
|
|
+ "__elements": [],
|
|
|
+ "__requires": [
|
|
|
+ {
|
|
|
+ "type": "grafana",
|
|
|
+ "id": "grafana",
|
|
|
+ "name": "Grafana",
|
|
|
+ "version": "8.3.2"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "type": "panel",
|
|
|
+ "id": "hpcviz-idvl-hpcc-stream-net",
|
|
|
+ "name": "stream-net",
|
|
|
+ "version": "1.0.0"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "type": "datasource",
|
|
|
+ "id": "postgres",
|
|
|
+ "name": "PostgreSQL",
|
|
|
+ "version": "1.0.0"
|
|
|
+ }
|
|
|
+ ],
|
|
|
+ "editable": false,
|
|
|
+ "fiscalYearStartMonth": 0,
|
|
|
+ "graphTooltip": 0,
|
|
|
+ "id": null,
|
|
|
+ "iteration": 1647433675249,
|
|
|
+ "links": [],
|
|
|
+ "liveNow": false,
|
|
|
+ "panels": [
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "gridPos": {
|
|
|
+ "h": 15,
|
|
|
+ "w": 24,
|
|
|
+ "x": 0,
|
|
|
+ "y": 0
|
|
|
+ },
|
|
|
+ "id": 2,
|
|
|
+ "options": {
|
|
|
+ "userEncoded": true
|
|
|
+ },
|
|
|
+ "targets": [
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "table",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n *\nFROM\n slurm.jobs\nWHERE\n user_id IN ($users)\n AND start_time < ${__to:date:seconds}\n AND end_time BETWEEN ${__from:date:seconds} and ${__to:date:seconds}",
|
|
|
+ "refId": "jobs",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "time_series",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n $__timeGroupAlias(\"time\",$__interval),\n avg(CAST(value AS decimal)) AS \"memory_power\",\n CONCAT('| ',nodes.os_ip_addr) AS name\nFROM timeseries_metrics\nINNER JOIN nodes\nON nodes.servicetag = timeseries_metrics.system\nWHERE\n $__timeFilter(\"time\") AND\n label= 'PowerMetrics TotalMemoryPower'AND\n system IN ($servicetag)\nGROUP BY time,name\nORDER BY time",
|
|
|
+ "refId": "memory_power",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "time_series",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n $__timeGroupAlias(\"time\",$__interval),\n avg(CAST(value AS decimal)) AS \"cpu_power\",\n CONCAT('| ',nodes.os_ip_addr) AS name\nFROM timeseries_metrics\nINNER JOIN nodes\nON nodes.servicetag = timeseries_metrics.system\nWHERE\n $__timeFilter(\"time\") AND\n label= 'PowerMetrics TotalCPUPower'AND\n system IN ($servicetag)\nGROUP BY time,name\nORDER BY time",
|
|
|
+ "refId": "cpu_power",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "time_series",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n $__timeGroupAlias(\"time\",$__interval),\n avg(CAST(value AS decimal)) AS \"cpu1_temp\",\n CONCAT('| ',nodes.os_ip_addr) AS name\nFROM timeseries_metrics\nINNER JOIN nodes\nON nodes.servicetag = timeseries_metrics.system\nWHERE\n $__timeFilter(\"time\") AND\n label= 'CPU1 Temp TemperatureReading'AND\n system IN ($servicetag)\nGROUP BY time,name\nORDER BY time",
|
|
|
+ "refId": "cpu1_temp",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "time_series",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n $__timeGroupAlias(\"time\",$__interval),\n avg(CAST(value AS decimal)) AS \"CPU2_Temp\",\n CONCAT('| ',nodes.os_ip_addr) AS name\nFROM timeseries_metrics\nINNER JOIN nodes\nON nodes.servicetag = timeseries_metrics.system\nWHERE\n $__timeFilter(\"time\") AND\n label= 'CPU2 Temp TemperatureReading' AND\n system IN ($servicetag)\nGROUP BY time,name\nORDER BY time",
|
|
|
+ "refId": "cpu2_temp",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "format": "time_series",
|
|
|
+ "group": [],
|
|
|
+ "hide": false,
|
|
|
+ "metricColumn": "none",
|
|
|
+ "rawQuery": true,
|
|
|
+ "rawSql": "SELECT\n $__timeGroupAlias(\"time\",$__interval),\n avg(CAST(value AS decimal)) AS \"NIC1_Temp\",\n CONCAT('| ',nodes.os_ip_addr) AS name\nFROM timeseries_metrics\nINNER JOIN nodes\nON nodes.servicetag = timeseries_metrics.system\nWHERE\n $__timeFilter(\"time\") AND\n label SIMILAR TO '% NIC 1 Port 1 Partition 1 TemperatureReading' AND\n system IN ($servicetag)\nGROUP BY time,name\nORDER BY time",
|
|
|
+ "refId": "nic1_temp",
|
|
|
+ "select": [
|
|
|
+ [
|
|
|
+ {
|
|
|
+ "params": [
|
|
|
+ "value"
|
|
|
+ ],
|
|
|
+ "type": "column"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ ],
|
|
|
+ "timeColumn": "time",
|
|
|
+ "where": [
|
|
|
+ {
|
|
|
+ "name": "$__timeFilter",
|
|
|
+ "params": [],
|
|
|
+ "type": "macro"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ }
|
|
|
+ ],
|
|
|
+ "title": "PowerMap",
|
|
|
+ "type": "hpcviz-idvl-hpcc-stream-net"
|
|
|
+ }
|
|
|
+ ],
|
|
|
+ "refresh": "",
|
|
|
+ "schemaVersion": 33,
|
|
|
+ "style": "dark",
|
|
|
+ "tags": [],
|
|
|
+ "templating": {
|
|
|
+ "list": [
|
|
|
+ {
|
|
|
+ "current": {},
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "definition": "SELECT DISTINCT servicetag as __value from nodes\n",
|
|
|
+ "hide": 0,
|
|
|
+ "includeAll": true,
|
|
|
+ "multi": true,
|
|
|
+ "name": "servicetag",
|
|
|
+ "options": [],
|
|
|
+ "query": "SELECT DISTINCT servicetag as __value from nodes\n",
|
|
|
+ "refresh": 1,
|
|
|
+ "regex": "",
|
|
|
+ "skipUrlSync": false,
|
|
|
+ "sort": 1,
|
|
|
+ "type": "query"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "current": {},
|
|
|
+ "datasource": {
|
|
|
+ "type": "postgres",
|
|
|
+ "uid": "telemetry-postgres"
|
|
|
+ },
|
|
|
+ "definition": "SELECT\n user_id as __value, user_name as __text, nodes as IP, nodes.os_ip_addr, nodes.servicetag\nFROM\n slurm.jobs\nINNER JOIN nodes\nON nodes.os_ip_addr = ANY(nodes)\nWHERE nodes.servicetag in ($servicetag) AND\n start_time < ${__to:date:seconds} AND end_time > ${__from:date:seconds}",
|
|
|
+ "hide": 0,
|
|
|
+ "includeAll": true,
|
|
|
+ "multi": true,
|
|
|
+ "name": "users",
|
|
|
+ "options": [],
|
|
|
+ "query": "SELECT\n user_id as __value, user_name as __text, nodes as IP, nodes.os_ip_addr, nodes.servicetag\nFROM\n slurm.jobs\nINNER JOIN nodes\nON nodes.os_ip_addr = ANY(nodes)\nWHERE nodes.servicetag in ($servicetag) AND\n start_time < ${__to:date:seconds} AND end_time > ${__from:date:seconds}",
|
|
|
+ "refresh": 1,
|
|
|
+ "regex": "",
|
|
|
+ "skipUrlSync": false,
|
|
|
+ "sort": 1,
|
|
|
+ "type": "query"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ },
|
|
|
+ "time": {
|
|
|
+ "from": "now-2d",
|
|
|
+ "to": "now"
|
|
|
+ },
|
|
|
+ "timepicker": {},
|
|
|
+ "timezone": "",
|
|
|
+ "title": "PowerMap",
|
|
|
+ "uid": "ou27WHLnk",
|
|
|
+ "version": 16,
|
|
|
+ "weekStart": ""
|
|
|
+}
|