2020-08-04 20:09:52 -04:00
|
|
|
# Dashboard header: display name, ordering priority and the template
# variables that the panel queries reference.
dashboard: "K8s pod health"
priority: 2
templating:
  variables:
    # `pod` is substituted into the panel queries as {{pod}}.
    # NOTE(review): presumably the selectable values are the `pod` label
    # values of series matching `series_selector` - confirm against the
    # dashboard schema.
    pod:
      label: "Pod name"
      type: metric_label_values
      options:
        series_selector: "container_memory_working_set_bytes"
        label: "pod"
|
|
|
|
|
2019-12-17 07:08:11 -05:00
|
|
|
panel_groups:
# CPU panels: one series per container of the pod selected via {{pod}}.
- group: "CPU metrics"
  panels:
  - title: "CPU usage"
    type: "line-chart"
    y_label: "Cores per container"
    metrics:
    - id: pod_cpu_usage_seconds_total
      # 5m rate of consumed CPU seconds, summed per container; series
      # whose container label is "POD" are filtered out.
      query_range: >-
        sum(
          rate(container_cpu_usage_seconds_total{pod="{{pod}}",container!="POD"}[5m])
        )
        by (container)
      unit: "cores"
      label: container

  - title: "CPU throttling"
    type: "line-chart"
    y_label: "Cores per container"
    metrics:
    - id: pod_cpu_cfs_throttle
      # 5m rate of CFS-throttled seconds, summed per container.
      # NOTE(review): this is throttled time per second rather than a
      # core count, and unlike the usage panel the selector does not
      # exclude container="POD" - confirm both are intentional.
      query_range: >-
        sum(
          rate(container_cpu_cfs_throttled_seconds_total{pod="{{pod}}"}[5m])
        )
        by (container)
      unit: "cores"
      label: container
|
|
|
|
|
2019-12-17 07:08:11 -05:00
|
|
|
# Memory panel: working-set bytes per container of the selected pod.
- group: "Memory metrics"
  panels:
  - title: "Memory usage working set"
    type: "line-chart"
    y_label: "Working set memory"
    metrics:
    - id: pod_memory_working_set
      # Instant gauge (no rate), summed per container; series whose
      # container label is "POD" are filtered out.
      query_range: >-
        sum(
          container_memory_working_set_bytes{pod="{{pod}}",container!="POD"}
        ) by (container)
      unit: "bytes"
      label: container
|
|
|
|
|
2019-12-17 07:08:11 -05:00
|
|
|
# Network panels: receive/transmit throughput aggregated per pod.
- group: "Network metrics"
  panels:
  - title: "Network Receive (In)"
    type: "line-chart"
    y_label: "Received (bytes/sec)"
    metrics:
    - id: pod_network_receive
      # 5m rate of received bytes, summed over the pod's series.
      query_range: >-
        sum(
          rate(
            container_network_receive_bytes_total{pod="{{pod}}"}[5m]
          )
        ) by (pod)
      # rate() yields a per-second value, so the unit matches the
      # y_label and the disk throughput panels.
      unit: "bytes / sec"
      label: pod

  - title: "Network Transmit (Out)"
    type: "line-chart"
    y_label: "Transmitted (bytes/sec)"
    metrics:
    - id: pod_network_transmit
      # 5m rate of transmitted bytes, summed over the pod's series.
      query_range: >-
        sum(
          rate(
            container_network_transmit_bytes_total{pod="{{pod}}"}[5m]
          )
        ) by (pod)
      # rate() yields a per-second value, so the unit matches the
      # y_label and the disk throughput panels.
      unit: "bytes / sec"
      label: pod
|
2020-08-07 11:10:17 -04:00
|
|
|
|
2019-12-17 07:08:11 -05:00
|
|
|
# Disk panels: filesystem read/write throughput, one series per
# (container, device) pair of the selected pod.
- group: "Disk metrics"
  panels:
  - title: "Disk Reads"
    type: "line-chart"
    y_label: "Disk reads (bytes/sec)"
    metrics:
    - id: pod_disk_reads
      # 5m rate of bytes read; series whose container label is "POD"
      # are filtered out.
      query_range: >-
        sum(
          rate(
            container_fs_reads_bytes_total{pod="{{pod}}", container!="POD"}[5m]
          )
        ) by (container,device)
      unit: "bytes / sec"
      # Legend text is built from the two grouping labels.
      label: "{{container}} {{device}}"

  - title: "Disk Writes"
    type: "line-chart"
    y_label: "Disk writes (bytes/sec)"
    metrics:
    - id: pod_disk_writes
      # 5m rate of bytes written; series whose container label is "POD"
      # are filtered out.
      query_range: >-
        sum(
          rate(
            container_fs_writes_bytes_total{pod="{{pod}}", container!="POD"}[5m]
          )
        ) by (container,device)
      unit: "bytes / sec"
      # Legend text is built from the two grouping labels.
      label: "{{container}} {{device}}"
|