MOON

File: //proc/self/root/opt/netdata/netdata-configs/orig/health.d/audit.conf
# Alerts for the Linux audit subsystem.
# Monitors audit backlog utilization relative to failure mode,
# and detects audit event loss.

# Alert when audit backlog is filling up AND failure mode is panic (2).
# This combination means the system will kernel panic if the backlog overflows.
# Only fires when failure=2 (panic mode) — for other failure modes,
# audit_lost_events covers actual event loss.

 template: audit_backlog_utilization
       on: audit.backlog_utilization
    class: Utilization
     type: System
component: Audit
   lookup: max -1m unaligned of utilization
    units: %
    every: 10s
     warn: $this > 50 AND $audit.failure.panic == 1
     crit: $this > 80 AND $audit.failure.panic == 1
    delay: down 5m multiplier 1.5 max 1h
  summary: Audit backlog utilization (kernel panic risk)
     info: Linux audit backlog is filling up while failure mode is set to panic — kernel panic is imminent if backlog overflows
       to: sysadmin

# Alert when audit events are being lost (dropped).
# This indicates the audit subsystem cannot keep up with event volume.

 template: audit_lost_events
       on: audit.lost
    class: Errors
     type: System
component: Audit
   lookup: max -1m unaligned of lost
    units: events/s
    every: 10s
     warn: $this > 0
    delay: down 5m multiplier 1.5 max 1h
  summary: Audit subsystem losing events
     info: Linux audit subsystem is losing events (backlog overflow, rate limiting, or memory pressure)
       to: sysadmin