{
"annotations": {
"list": [
{
"builtIn": 1,
"datasource": "-- Grafana --",
"enable": true,
"hide": true,
"iconColor": "rgba(0, 211, 255, 1)",
"name": "Annotations & Alerts",
"type": "dashboard"
}
]
},
"editable": true,
"gnetId": null,
"graphTooltip": 0,
"id": 2,
"links": [],
"panels": [
{
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"gridPos": {
"h": 8,
"w": 7,
"x": 0,
"y": 0
},
"id": 2,
"options": {
"orientation": "auto",
"reduceOptions": {
"calcs": [
"mean"
],
"fields": "",
"values": false
},
"showThresholdLabels": false,
"showThresholdMarkers": true
},
"pluginVersion": "7.0.2",
"targets": [
{
"expr": "npu_chip_info_health_status{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_health_status{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_health_status{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_health_status{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_health_status{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_health_status{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_health_status{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_health_status{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"timeFrom": null,
"timeShift": null,
"title": "npu健康状态(nodeName)",
"type": "gauge"
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "Prometheus",
"fieldConfig": {
"defaults": {
"custom": {},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 8,
"w": 8,
"x": 7,
"y": 0
},
"hiddenSeries": false,
"id": 6,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pluginVersion": "7.0.3",
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "npu_chip_info_temperature{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_temperature{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_temperature{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_temperature{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_temperature{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_temperature{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_temperature{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_temperature{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "npu温度(nodeName)",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"gridPos": {
"h": 8,
"w": 8,
"x": 15,
"y": 0
},
"id": 12,
"options": {
"colorMode": "value",
"graphMode": "area",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"mean"
],
"fields": "",
"values": false
}
},
"pluginVersion": "7.0.2",
"targets": [
{
"expr": "npu_chip_info_voltage{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_voltage{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_voltage{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_voltage{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_voltage{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_voltage{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_voltage{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_voltage{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"timeFrom": null,
"timeShift": null,
"title": "npu电压(nodeName)",
"type": "stat"
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {
"align": null
},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 8,
"w": 7,
"x": 0,
"y": 8
},
"hiddenSeries": false,
"id": 8,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pluginVersion": "7.0.3",
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "npu_chip_info_used_memory{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_used_memory{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_used_memory{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_used_memory{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_used_memory{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_used_memory{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_used_memory{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_used_memory{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "npu内存使用(nodeName)",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": null,
"description": "",
"fieldConfig": {
"defaults": {
"custom": {
"align": null
},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 8,
"w": 8,
"x": 7,
"y": 8
},
"hiddenSeries": false,
"id": 10,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pluginVersion": "7.0.3",
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "npu_chip_info_utilization{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_utilization{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_utilization{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_utilization{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_utilization{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_utilization{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_utilization{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_utilization{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "npu_AI_Core使用率(nodeName)",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {
"align": null
},
"mappings": [],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 8,
"w": 8,
"x": 15,
"y": 8
},
"hiddenSeries": false,
"id": 4,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pluginVersion": "7.0.3",
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "npu_chip_info_power{id=\"0\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片0",
"refId": "A"
},
{
"expr": "npu_chip_info_power{id=\"1\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片1",
"refId": "B"
},
{
"expr": "npu_chip_info_power{id=\"2\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片2",
"refId": "C"
},
{
"expr": "npu_chip_info_power{id=\"3\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片3",
"refId": "D"
},
{
"expr": "npu_chip_info_power{id=\"4\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片4",
"refId": "E"
},
{
"expr": "npu_chip_info_power{id=\"5\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片5",
"refId": "F"
},
{
"expr": "npu_chip_info_power{id=\"6\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片6",
"refId": "G"
},
{
"expr": "npu_chip_info_power{id=\"7\",job=\"nodeName\"}",
"interval": "",
"legendFormat": "芯片7",
"refId": "H"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "npu使用功耗(nodeName)",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 10,
"w": 7,
"x": 0,
"y": 16
},
"hiddenSeries": false,
"id": 20,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "container_memory_usage_bytes",
"interval": "",
"legendFormat": "",
"refId": "A"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "容器内存使用量",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
},
{
"aliasColors": {},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": null,
"fieldConfig": {
"defaults": {
"custom": {}
},
"overrides": []
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
"h": 10,
"w": 7,
"x": 7,
"y": 16
},
"hiddenSeries": false,
"id": 18,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"nullPointMode": "null",
"options": {
"dataLinks": []
},
"percentage": false,
"pointradius": 2,
"points": false,
"renderer": "flot",
"seriesOverrides": [],
"spaceLength": 10,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_network_receive_bytes_total{image!=\"\"}[1m])) without (interface)",
"interval": "",
"legendFormat": "",
"refId": "A"
}
],
"thresholds": [],
"timeFrom": null,
"timeRegions": [],
"timeShift": null,
"title": "容器网络接收量速率",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": []
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
],
"yaxis": {
"align": false,
"alignLevel": null
}
}
],
"refresh": "5s",
"schemaVersion": 25,
"style": "dark",
"tags": [],
"templating": {
"list": []
},
"time": {
"from": "now-15m",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
]
},
"timezone": "",
"title": "nodeName",
"uid": "2kWOIniGz",
"version": 7
}