diff --git a/grafana/oke-workloads-to-gpuscanner-mapping-dashboard.json b/grafana_dashboards/oke-workloads-to-gpuscanner-mapping-dashboard.json similarity index 96% rename from grafana/oke-workloads-to-gpuscanner-mapping-dashboard.json rename to grafana_dashboards/oke-workloads-to-gpuscanner-mapping-dashboard.json index 5320b95..756a757 100644 --- a/grafana/oke-workloads-to-gpuscanner-mapping-dashboard.json +++ b/grafana_dashboards/oke-workloads-to-gpuscanner-mapping-dashboard.json @@ -81,7 +81,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "All details of the host", "fieldConfig": { @@ -154,7 +154,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -273,7 +273,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Dr HPC V2 based passive checks scan results", "fieldConfig": { @@ -705,7 +705,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -723,7 +723,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -738,7 +738,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -753,7 +753,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -768,7 +768,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -783,7 +783,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -798,7 +798,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -813,7 +813,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -828,7 +828,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -843,7 +843,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -858,7 +858,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -873,7 +873,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -888,7 +888,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -903,7 +903,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -918,7 +918,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -937,7 +937,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -952,7 +952,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -967,7 +967,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -982,7 +982,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -997,7 +997,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1012,7 +1012,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1027,7 +1027,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1042,7 +1042,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1057,7 +1057,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1072,7 +1072,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1087,7 +1087,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1102,7 +1102,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1117,7 +1117,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1132,7 +1132,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1147,7 +1147,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1162,7 +1162,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1177,7 +1177,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1192,7 +1192,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1207,7 +1207,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1222,7 +1222,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1237,7 +1237,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1612,7 +1612,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Active checks performance health check results", "fieldConfig": { @@ -1867,7 +1867,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -1885,7 +1885,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1900,7 +1900,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1915,7 +1915,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1930,7 +1930,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1945,7 +1945,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1960,7 +1960,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1975,7 +1975,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1990,7 +1990,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -2005,7 +2005,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -2020,7 +2020,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -2248,7 +2248,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "HBM BW", "fieldConfig": { @@ -2300,7 +2300,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "builder", @@ -2321,7 +2321,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Flops utilizations by GPU and by Node", "fieldConfig": { @@ -2373,7 +2373,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -2394,7 +2394,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "RDMA Bandwidth by node", "fieldConfig": { @@ -2446,7 +2446,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "builder", "expr": "avg(oci_lens_rdma_np_cnp_sent{hostname=~\"$hostname\"}) by (hostname)", @@ -2475,7 +2475,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2564,7 +2564,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_DEV_GPU_TEMP{Hostname=~\"$hostname\"} OR gpu_junction_temperature{hostname=~\"$hostname\"}", @@ -2581,7 +2581,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2639,7 +2639,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_POWER_USAGE{Hostname=~\"$hostname\"} OR gpu_power_usage{hostname=~\"$hostname\"})", @@ -2656,7 +2656,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2714,7 +2714,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_GPU_TEMP{Hostname=~\"$hostname\"} OR gpu_junction_temperature{hostname=~\"$hostname\"}) ", @@ -2730,7 +2730,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2821,7 +2821,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_GPU_UTIL{Hostname=~\"$hostname\"} OR gpu_gfx_activity{hostname=~\"$hostname\"})", @@ -2837,7 +2837,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2926,7 +2926,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_DEV_POWER_USAGE{Hostname=~\"$hostname\"} OR gpu_power_usage{hostname=~\"$hostname\"}", @@ -2942,7 +2942,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3033,7 +3033,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_PROF_PIPE_TENSOR_ACTIVE{Hostname=~\"$hostname\"} OR gpu_prof_tensor_active_percent{hostname=~\"$hostname\"}", @@ -3063,7 +3063,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3145,7 +3145,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "((node_filesystem_size_bytes{device!~\"rootfs\",instance=~\"${hostname:regex}\"} - node_filesystem_avail_bytes{device!~\"rootfs\",instance=~\"${hostname:regex}\"}) / node_filesystem_size_bytes{ device!~\"rootfs\",instance=~\"${hostname:regex}\"}) * 100", @@ -3160,7 +3160,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3242,7 +3242,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "builder", @@ -3267,7 +3267,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Monitors hardware sensor temperatures and critical thresholds as exposed by Linux hwmon. Includes CPU, GPU, and motherboard sensors where available", "fieldConfig": { @@ -3374,7 +3374,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_celsius * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{instance=~\"${hostname:regex}\"}", @@ -3389,7 +3389,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_alarm_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3405,7 +3405,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_celsius * on(chip, instance) group_left(chip_name) node_hwmon_chip_names", @@ -3421,7 +3421,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_hyst_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3437,7 +3437,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_max_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3457,7 +3457,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3564,7 +3564,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": true, @@ -3584,7 +3584,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3666,7 +3666,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "sum(irate(node_cpu_seconds_total{ mode=\"system\",instance=~\"${hostname:regex}\"}[2m])) / scalar(count(count(node_cpu_seconds_total{instance=~\"${hostname:regex}\"}) by (cpu)))", @@ -3717,12 +3717,8 @@ { "allowCustomValue": false, "current": { - "text": [ - "recipe-llamastack-app-chatbot3-9d176edd" - ], - "value": [ - "recipe-llamastack-app-chatbot3-9d176edd" - ] + "text": "All", + "value": ["$__all"] }, "definition": "label_values(oci_lens_pod_node_info{namespace=~\"$k8snamespace\"},workload)", "description": "Choose the Kubernetes deployments/Job ", @@ -3749,7 +3745,7 @@ }, "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "definition": "label_values(oci_lens_pod_node_info{workload=~\"$k8sworkload\"},hostname)", "description": "OCI Host Names Mapped to K8s Node IP", diff --git a/grafana/resourcepools-to-gpuhealth-mapping-dashboard.json b/grafana_dashboards/resourcepools-to-gpuhealth-mapping-dashboard.json similarity index 95% rename from grafana/resourcepools-to-gpuhealth-mapping-dashboard.json rename to grafana_dashboards/resourcepools-to-gpuhealth-mapping-dashboard.json index d0129d5..512eb6e 100644 --- a/grafana/resourcepools-to-gpuhealth-mapping-dashboard.json +++ b/grafana_dashboards/resourcepools-to-gpuhealth-mapping-dashboard.json @@ -71,7 +71,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "All details of the host", "fieldConfig": { @@ -144,7 +144,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -263,7 +263,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -694,7 +694,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -712,7 +712,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -727,7 +727,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -742,7 +742,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -757,7 +757,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -772,7 +772,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -787,7 +787,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -802,7 +802,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -817,7 +817,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -832,7 +832,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -847,7 +847,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -862,7 +862,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -877,7 +877,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -892,7 +892,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -907,7 +907,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -926,7 +926,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -941,7 +941,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -956,7 +956,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -971,7 +971,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -986,7 +986,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1001,7 +1001,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1016,7 +1016,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1031,7 +1031,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1046,7 +1046,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1061,7 +1061,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1076,7 +1076,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1091,7 +1091,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1106,7 +1106,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1121,7 +1121,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1136,7 +1136,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1151,7 +1151,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1166,7 +1166,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1181,7 +1181,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1196,7 +1196,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1211,7 +1211,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1226,7 +1226,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1601,7 +1601,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "GPU & Host Performance Summary", "fieldConfig": { @@ -1856,7 +1856,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -1874,7 +1874,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1889,7 +1889,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1904,7 +1904,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1919,7 +1919,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1934,7 +1934,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1949,7 +1949,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1964,7 +1964,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1979,7 +1979,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -1994,7 +1994,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -2009,7 +2009,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": false, @@ -2233,7 +2233,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "HBM BW", "fieldConfig": { @@ -2285,7 +2285,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "builder", @@ -2306,7 +2306,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Flops utilizations by GPU and by Node", "fieldConfig": { @@ -2358,7 +2358,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "code", @@ -2379,7 +2379,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "RDMA Bandwidth by node", "fieldConfig": { @@ -2431,7 +2431,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "builder", "expr": "avg(oci_lens_rdma_np_cnp_sent{hostname=~\"$hostname\"}) by (hostname)", @@ -2460,7 +2460,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2549,7 +2549,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_DEV_GPU_TEMP{Hostname=~\"$hostname\"} OR gpu_junction_temperature{hostname=~\"$hostname\"}", @@ -2566,7 +2566,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2624,7 +2624,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_POWER_USAGE{Hostname=~\"$hostname\"} OR gpu_power_usage{hostname=~\"$hostname\"})", @@ -2641,7 +2641,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2699,7 +2699,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_GPU_TEMP{Hostname=~\"$hostname\"} OR gpu_junction_temperature{hostname=~\"$hostname\"}) ", @@ -2715,7 +2715,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2806,7 +2806,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "avg(DCGM_FI_DEV_GPU_UTIL{Hostname=~\"$hostname\"} OR gpu_gfx_activity{hostname=~\"$hostname\"})", @@ -2822,7 +2822,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -2911,7 +2911,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_DEV_POWER_USAGE{Hostname=~\"$hostname\"} OR gpu_power_usage{hostname=~\"$hostname\"}", @@ -2927,7 +2927,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3018,7 +3018,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "DCGM_FI_PROF_PIPE_TENSOR_ACTIVE{Hostname=~\"$hostname\"} OR gpu_prof_tensor_active_percent{hostname=~\"$hostname\"}", @@ -3048,7 +3048,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3130,7 +3130,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "((node_filesystem_size_bytes{device!~\"rootfs\",instance=~\"${hostname:regex}\"} - node_filesystem_avail_bytes{device!~\"rootfs\",instance=~\"${hostname:regex}\"}) / node_filesystem_size_bytes{ device!~\"rootfs\",instance=~\"${hostname:regex}\"}) * 100", @@ -3145,7 +3145,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3227,7 +3227,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "disableTextWrap": false, "editorMode": "builder", @@ -3252,7 +3252,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "description": "Monitors hardware sensor temperatures and critical thresholds as exposed by Linux hwmon. Includes CPU, GPU, and motherboard sensors where available", "fieldConfig": { @@ -3359,7 +3359,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_celsius * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{instance=~\"${hostname:regex}\"}", @@ -3374,7 +3374,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_alarm_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3390,7 +3390,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_celsius * on(chip, instance) group_left(chip_name) node_hwmon_chip_names", @@ -3406,7 +3406,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_crit_hyst_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3422,7 +3422,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "node_hwmon_temp_max_celsius{job=\"$job\"} * on(chip, instance) group_left(chip_name) node_hwmon_chip_names{job=\"$job\"}", @@ -3442,7 +3442,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3549,7 +3549,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "exemplar": true, @@ -3569,7 +3569,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "fieldConfig": { "defaults": { @@ -3651,7 +3651,7 @@ { "datasource": { "type": "prometheus", - "uid": "PBFA97CFB590B2093" + "uid": "{{DATASOURCE_PROMETHEUS}}" }, "editorMode": "code", "expr": "sum(irate(node_cpu_seconds_total{ mode=\"system\",instance=~\"${hostname:regex}\"}[2m])) / scalar(count(count(node_cpu_seconds_total{instance=~\"${hostname:regex}\"}) by (cpu)))", @@ -3681,7 +3681,7 @@ }, "datasource": { "type": "yesoreyeram-infinity-datasource", - "uid": "PD0067CAD9A63E081" + "uid": "{{DATASOURCE_INFINITY}}" }, "definition": "", "description": "Monitor resources by OCI Region.", @@ -3700,13 +3700,13 @@ "root_selector": "", "source": "url", "type": "json", - "url": "http://api.132.226.55.39.nip.io/monitoring-rings/750719b634775b87e80784dc08ee6b41/instances/", + "url": "{{INFINITY_DATASOURCE_BASE_URL}}/monitoring-rings/{{MONITORING_RING_ID}}/instances/", "url_options": { "data": "", "headers": [ { "key": "Authorization", - "value": "Token ad37cf7d9b520d27c4a06eae5a3c15a06e911bc0" + "value": "Token {{INFINITY_DATASOURCE_AUTH_TOKEN}}" } ], "method": "GET", @@ -3737,7 +3737,7 @@ }, "datasource": { "type": "yesoreyeram-infinity-datasource", - "uid": "PD0067CAD9A63E081" + "uid": "{{DATASOURCE_INFINITY}}" }, "definition": "", "description": "Filter by GPU Types", @@ -3756,13 +3756,13 @@ "root_selector": "", "source": "url", "type": "json", - "url": "http://api.132.226.55.39.nip.io/monitoring-rings/750719b634775b87e80784dc08ee6b41/instances/", + "url": "{{INFINITY_DATASOURCE_BASE_URL}}/monitoring-rings/{{MONITORING_RING_ID}}/instances/", "url_options": { "data": "", "headers": [ { "key": "Authorization", - "value": "Token ad37cf7d9b520d27c4a06eae5a3c15a06e911bc0" + "value": "Token {{INFINITY_DATASOURCE_AUTH_TOKEN}}" } ], "method": "GET", @@ -3799,7 +3799,7 @@ }, "datasource": { "type": "yesoreyeram-infinity-datasource", - "uid": "PD0067CAD9A63E081" + "uid": "{{DATASOURCE_INFINITY}}" }, "definition": "", "description": "OCI Host Names", @@ -3818,13 +3818,13 @@ "root_selector": "", "source": "url", "type": "json", - "url": "http://api.132.226.55.39.nip.io/monitoring-rings/750719b634775b87e80784dc08ee6b41/instances/", + "url": "{{INFINITY_DATASOURCE_BASE_URL}}/monitoring-rings/{{MONITORING_RING_ID}}/instances/", "url_options": { "data": "", "headers": [ { "key": "Authorization", - "value": "Token ad37cf7d9b520d27c4a06eae5a3c15a06e911bc0" + "value": "Token {{INFINITY_DATASOURCE_AUTH_TOKEN}}" } ], "method": "GET",