blob: 083261a5574ca2c1d2afe1ecb9a34eff6e2bb344 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
|
panel_groups:
- group: 'Usage Variation'
panels:
- type: anomaly-chart
title: "Memory Usage Rate Anomalies"
y_label: "Memory Usage Rate"
metrics:
- id: container_memory_usage_bytes
query_range: avg(sum(rate(container_memory_usage_bytes[15m]))) /1024
label: "Memory Usage Rate"
unit: "kB"
- id: container_memory_usage_bytes_upper
query_range: 80000
label: "Memory Usage Rate Lower Limit"
unit: "kB"
- id: container_memory_usage_bytes_lower
query_range: 50000
label: "Memory Usage Rate Upper Limit"
unit: "kB"
- group: System metrics (Kubernetes)
panels:
- title: 'Container CPU Usage by Environment (seconds)'
type: 'heatmap'
metrics:
- id: container_cpu_usage_by_env
query_range: 'sum(rate(container_cpu_usage_seconds_total{environment=~"coredns|production|kube|kube-controller"}[1h])) by (environment)'
step: 3600
- title: 'Number of GitLab Runner requests by status'
type: 'heatmap'
metrics:
- id: number_of_runner_requests_by_status
query_range: 'sum(rate(gitlab_runner_api_request_statuses_total[60m])) by (status)'
step: 3600
- title: '95 percentile of request durations per handler (seconds)'
type: 'heatmap'
metrics:
- id: 95_percentile_of_request_durations_per_handler
query_range: 'histogram_quantile(0.95, sum(rate(prometheus_http_request_duration_seconds_bucket[1h])) by (handler,le))'
step: 3600
|