diff options
Diffstat (limited to 'docs')
-rw-r--r-- | docs/TIME.md | 2 | ||||
-rw-r--r-- | docs/example-16-compatibility-rules-new-to-old.yml | 6 | ||||
-rw-r--r-- | docs/node-mixin/alerts/alerts.libsonnet | 38 |
3 files changed, 45 insertions, 1 deletions
diff --git a/docs/TIME.md b/docs/TIME.md index f48c080..18773e0 100644 --- a/docs/TIME.md +++ b/docs/TIME.md | |||
@@ -4,7 +4,7 @@ | |||
4 | 4 | ||
5 | This collector is intended for usage with local NTPD like [ntp.org](http://ntp.org/), [chrony](https://chrony.tuxfamily.org/comparison.html) or [OpenNTPD](http://www.openntpd.org/). | 5 | This collector is intended for usage with local NTPD like [ntp.org](http://ntp.org/), [chrony](https://chrony.tuxfamily.org/comparison.html) or [OpenNTPD](http://www.openntpd.org/). |
6 | 6 | ||
7 | Note, some chrony packages have `local stratum 10` configuration value making chrony a valid server when it it is unsynchronised. This configuration makes one of `node_ntp_sanity` heuristics unreliable. | 7 | Note, some chrony packages have `local stratum 10` configuration value making chrony a valid server when it is unsynchronised. This configuration makes one of `node_ntp_sanity` heuristics unreliable. |
8 | 8 | ||
9 | Note, OpenNTPD does not listen for SNTP queries by default, you should add `listen on 127.0.0.1` configuration line to use this collector with OpenNTPD. | 9 | Note, OpenNTPD does not listen for SNTP queries by default, you should add `listen on 127.0.0.1` configuration line to use this collector with OpenNTPD. |
10 | 10 | ||
diff --git a/docs/example-16-compatibility-rules-new-to-old.yml b/docs/example-16-compatibility-rules-new-to-old.yml index 6d630cc..54aaa27 100644 --- a/docs/example-16-compatibility-rules-new-to-old.yml +++ b/docs/example-16-compatibility-rules-new-to-old.yml | |||
@@ -11,6 +11,8 @@ groups: | |||
11 | rules: | 11 | rules: |
12 | - expr: node_boot_time_seconds | 12 | - expr: node_boot_time_seconds |
13 | record: node_boot_time | 13 | record: node_boot_time |
14 | - expr: node_time_seconds | ||
15 | record: node_time | ||
14 | - expr: node_context_switches_total | 16 | - expr: node_context_switches_total |
15 | record: node_context_switches | 17 | record: node_context_switches |
16 | - expr: node_forks_total | 18 | - expr: node_forks_total |
@@ -117,6 +119,10 @@ groups: | |||
117 | record: node_memory_PageTables | 119 | record: node_memory_PageTables |
118 | - expr: node_memory_Shmem_bytes | 120 | - expr: node_memory_Shmem_bytes |
119 | record: node_memory_Shmem | 121 | record: node_memory_Shmem |
122 | - expr: node_memory_ShmemHugePages_bytes | ||
123 | record: node_memory_ShmemHugePages | ||
124 | - expr: node_memory_ShmemPmdMapped_bytes | ||
125 | record: node_memory_ShmemPmdMapped | ||
120 | - expr: node_memory_Slab_bytes | 126 | - expr: node_memory_Slab_bytes |
121 | record: node_memory_Slab | 127 | record: node_memory_Slab |
122 | - expr: node_memory_SReclaimable_bytes | 128 | - expr: node_memory_SReclaimable_bytes |
diff --git a/docs/node-mixin/alerts/alerts.libsonnet b/docs/node-mixin/alerts/alerts.libsonnet index caef02d..9ef18d5 100644 --- a/docs/node-mixin/alerts/alerts.libsonnet +++ b/docs/node-mixin/alerts/alerts.libsonnet | |||
@@ -210,6 +210,44 @@ | |||
210 | severity: 'warning', | 210 | severity: 'warning', |
211 | }, | 211 | }, |
212 | }, | 212 | }, |
213 | { | ||
214 | alert: 'NodeClockSkewDetected', | ||
215 | expr: ||| | ||
216 | ( | ||
217 | node_timex_offset_seconds > 0.05 | ||
218 | and | ||
219 | deriv(node_timex_offset_seconds[5m]) >= 0 | ||
220 | ) | ||
221 | or | ||
222 | ( | ||
223 | node_timex_offset_seconds < -0.05 | ||
224 | and | ||
225 | deriv(node_timex_offset_seconds[5m]) <= 0 | ||
226 | ) | ||
227 | ||| % $._config, | ||
228 | 'for': '10m', | ||
229 | labels: { | ||
230 | severity: 'warning', | ||
231 | }, | ||
232 | annotations: { | ||
233 | summary: 'Clock skew detected.', | ||
234 | message: 'Clock on {{ $labels.instance }} is out of sync by more than 0.05s. Ensure NTP is configured correctly on this host.', | ||
235 | }, | ||
236 | }, | ||
237 | { | ||
238 | alert: 'NodeClockNotSynchronising', | ||
239 | expr: ||| | ||
240 | min_over_time(node_timex_sync_status[5m]) == 0 | ||
241 | ||| % $._config, | ||
242 | 'for': '10m', | ||
243 | labels: { | ||
244 | severity: 'warning', | ||
245 | }, | ||
246 | annotations: { | ||
247 | summary: 'Clock not synchronising.', | ||
248 | message: 'Clock on {{ $labels.instance }} is not synchronising. Ensure NTP is configured on this host.', | ||
249 | }, | ||
250 | }, | ||
213 | ], | 251 | ], |
214 | }, | 252 | }, |
215 | ], | 253 | ], |