X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=12b945e0d4bee15bd7b6d64a29a74eeb1b506a38;hb=3704c766924ef12163e012f66af870816489198f;hp=99e8f9ef250123a0e1e1e86f622c48c5fcc43e51;hpb=50d24797b2a095b2043643d6a9a4b230eba71d20;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 99e8f9e..12b945e 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -93,10 +93,6 @@ servers: address: 185.17.185.190 parents: gw-ubcece hostgroups: layer3-infrastructure - gw-linaro: - address: 64.28.108.36 - parents: gw-ubcece - hostgroups: layer3-infrastructure gw-manda: address: 82.195.78.118 parents: gw-ubcece @@ -174,18 +170,17 @@ servers: schumann: address: 212.227.126.54 parents: gw-1und1-sec - hostgroups: computers, service, stretch + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hassrvfs, pe1950 wieck: address: 195.20.242.89 parents: gw-1und1-sec - hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula, pe1950 # }}} # {{{ gw-accumu pettersson: address: 130.239.18.123 parents: gw-accumu - hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, jessie, autofs, sw-raid - ## No need to update to Stretch, casulana replaces it. It should eventually die. + hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, stretch, autofs, sw-raid mirror-accumu: address: 130.242.6.199 parents: gw-accumu2 @@ -370,7 +365,7 @@ servers: parents: gw-bytemark hostgroups: computers, hassrvfs, kvmdomains, stretch, postgres96-hosts, systemd-timesyncd ganeti-bytemark: - address: 82.195.75.111 + address: 5.153.231.1 parents: gw-bytemark hostgroups: notacomputer coccia: @@ -384,7 +379,7 @@ servers: philp: address: 5.153.231.13 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd, broken_https_default_vhost rainier: address: 5.153.231.16 parents: ganeti-bytemark @@ -408,7 +403,7 @@ servers: donizetti: address: 5.153.231.20 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, jessie, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, systemd-timesyncd moszumanska: address: 5.153.231.21 parents: ganeti-bytemark @@ -422,11 +417,11 @@ servers: ticharich: address: 5.153.231.23 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, jessie, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd + hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd petrova: address: 5.153.231.25 parents: ganeti-bytemark - hostgroups: computers, kvmdomains, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd olin: address: 5.153.231.26 parents: ganeti-bytemark @@ -458,23 +453,11 @@ servers: gideon: address: 5.153.231.34 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd lindsay: address: 5.153.231.36 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, systemd-timesyncd - mirror-bytemark: - address: 5.153.231.37 - parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, hassrvfs - mirror-bytemark-debian: - address: 5.153.231.45 - hostgroups: secondary-IPs - parents: mirror-bytemark - mirror-bytemark-security: - address: 5.153.231.46 - hostgroups: secondary-IPs - parents: mirror-bytemark sor: address: 5.153.231.38 parents: ganeti-bytemark @@ -503,7 +486,7 @@ servers: casulana: address: 5.153.231.41 parents: gw-bytemark - hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses + hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses, apache2-hosts # }}} # {{{ gw-c3sl santoro: @@ -588,17 +571,9 @@ servers: hostgroups: computers, service, dl360, stretch, drbd-hosts ganeti-csail: address: 128.31.0.49 - parents: gw-bytemark + parents: gw-csail hostgroups: notacomputer - falla: - address: 128.31.0.65 - parents: ganeti-csail - hostgroups: computers, freebsd, hassrvfs, porterbox, jessie, jessie-freebsd - fischer: - address: 128.31.0.35 - parents: ganeti-csail - hostgroups: computers, freebsd, hassrvfs, porterbox, jessie mirror-csail: address: 128.31.0.62 parents: ganeti-csail @@ -660,7 +635,7 @@ servers: cgi-grnet-01: address: 194.177.211.202 parents: gw-grnet - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https, xinetd-hosts, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, xinetd-hosts, systemd-timesyncd x86-grnet-01: address: 194.177.211.203 parents: ganeti-grnet @@ -724,25 +699,19 @@ servers: lw07: address: 185.17.185.187 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, postgres94-hosts, apache2-hosts + hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, postgres94-hosts, apache2-hosts lw08: address: 185.17.185.189 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, apache2-hosts - # }}} - # {{{ gw-linaro - arm-linaro-01: - address: 64.28.108.83 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, buildd, stretch, broken_mq - arm-linaro-03: - address: 64.28.108.85 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, buildd, stretch, broken_mq - asachi: - address: 64.28.108.84 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, porterbox, stretch, broken_mq + hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, apache2-hosts + lw09: + address: 185.17.185.181 + parents: gw-leaseweb + hostgroups: computers, service, stretch, dl180 + lw10: + address: 185.17.185.182 + parents: gw-leaseweb + hostgroups: computers, service, stretch, dl180 # }}} # {{{ gw-karlsruhe zemlinsky: @@ -755,11 +724,11 @@ servers: czerny: address: 82.195.75.109 parents: gw-manda - hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts + hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts, manyprocesses clementi: address: 82.195.75.103 parents: gw-manda - hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts + hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts, manyprocesses bendel: address: 82.195.75.100 parents: ganeti3 @@ -768,16 +737,6 @@ servers: address: 82.195.75.110 parents: ganeti3 hostgroups: computers, service, kvmdomains, stretch, hassrvfs, spamd, heavy-exim, highload - fils: - address: 82.195.75.89 - parents: ganeti3 - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph - fayrfax: - address: 82.195.75.82 - parents: ganeti3 - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph vento: address: 82.195.75.98 parents: ganeti3 @@ -821,7 +780,7 @@ servers: vogler: address: 82.195.75.92 parents: ganeti3 - hostgroups: computers, service, kvmdomains, jessie + hostgroups: computers, service, kvmdomains, stretch wolkenstein: address: 82.195.75.65 parents: ganeti3 @@ -858,11 +817,6 @@ servers: hostgroups: computers, buildd, hassrvfs, stretch, incomingmailrelayed # }}} # {{{ gw-osuosl - busoni: - address: 140.211.166.202 - parents: gw-osuosl - hostgroups: computers, service, dl360, hassrvfs, jessie, hasvarlogfs, apache2-hosts, no-bacula, apache-https - byrd: address: 140.211.166.200 parents: gw-osuosl @@ -884,10 +838,6 @@ servers: address: 140.211.166.197 parents: pieta hostgroups: computers, hassrvfs, buildd, jessie - pizzetti: - address: 140.211.166.198 - parents: pieta - hostgroups: computers, jessie, hassrvfs, porterbox partch: address: 140.211.15.152 parents: gw-osuosl @@ -897,7 +847,7 @@ servers: sallinen: address: 193.62.202.26 parents: gw-sanger - hostgroups: computers, service, stretch, dl380, nfs-client, autofs + hostgroups: computers, service, stretch, dl380, nfs-client, autofs, postgres96-hosts sibelius: address: 193.62.202.28 parents: gw-sanger @@ -939,66 +889,6 @@ servers: parents: gw-skroutz1, gw-skroutz2 hostgroups: computers, stretch, service, sw-raid, hassrvfs, apache2-hosts # }}} - # {{{ gw-ubcece - sw-ubcece: - hostgroups: layer2-infrastructure - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - sw-ubcece-mcld: - hostgroups: layer2-infrastructure - parents: sw-ubcece - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - sw-ubcece-kais: - hostgroups: layer2-infrastructure - parents: sw-ubcece - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - spontini: - address: 206.12.19.14 - parents: sw-ubcece-mcld - hostgroups: computers, buildd, hasbootfs, hassrvfs, sparc, wheezy - contacts: lfilipoz - ubc-bl7: - address: 206.12.19.217 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl6: - address: 206.12.19.216 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl2: - address: 206.12.19.212 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl3: - address: 206.12.19.213 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl4: - address: 206.12.19.214 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl8: - address: 206.12.19.218 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - # MSA 2000 (2012i) - giustini: - address: 192.168.2.6 - parents: sw-ubcece-kais - hostgroups: notacomputer - # unless we implement runfrom for host alive checks - pingable: false - check_command: dsa_check_always_ok -# locke: -# address: 206.12.19.120 -# parents: sw-ubcece-kais -# hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa - # }}} # {{{ ubc-gateway ubc-enc2bl01: address: 209.87.16.1 @@ -1025,16 +915,6 @@ servers: address: 209.87.16.21 parents: ubc-gateway hostgroups: computers, buildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd - finzi: - address: 209.87.16.22 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph - fano: - address: 209.87.16.23 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph elgar: address: 209.87.16.24 parents: ubc-gateway @@ -1090,7 +970,7 @@ servers: tye: address: 209.87.16.37 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, heavy-exim, apache2-hosts, apache-https, nfs-client, autofs, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, heavy-exim, apache2-hosts, apache-https, nfs-client, autofs, hassrvfs, systemd-timesyncd ullmann: address: 209.87.16.38 parents: ubc-gateway @@ -1111,11 +991,11 @@ servers: godard: address: 209.87.16.44 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts, manyprocesses debussy: address: 209.87.16.46 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https, broken_https_default_vhost # }}} # {{{ gw-umn #saens: @@ -1214,10 +1094,6 @@ hostgroups: extinfo-icon_image: base/debian.png extinfo-icon_image_alt: Debian GNU/Linux extinfo-notes_url: https://db.debian.org/machines.cgi?host=%s - layer2-infrastructure: - alias: Layer 2 Devices - extinfo-icon_image: base/switch40.png - extinfo-icon_image_alt: switch layer3-infrastructure: alias: Layer 3 Devices extinfo-icon_image: base/switch40.png @@ -1225,10 +1101,6 @@ hostgroups: notacomputer: alias: Systems that are not really systems. Yeah :) private: 1 - freebsd: - alias: freebsd - private: 1 - extinfo-icon_image_alt: Debian GNU/kFreeBSD armhf: alias: armhf private: 1 @@ -1272,13 +1144,14 @@ hostgroups: aacraid: alias: Hosts with Adaptec AACraid private: 1 + pe1950: + alias: Dell PowerEdge 1950 hosts + private: 1 wheezy: alias: Hosts running wheezy jessie: alias: Hosts running jessie - jessie-freebsd: - alias: kFreebsd hosts running jessie stretch: alias: Hosts running stretch @@ -1508,7 +1381,7 @@ services: name: disk usage on /var/lib/postgresql servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/lib/postgresql" - hosts: sibelius, busoni, buxtehude, lw07, fasolo + hosts: sibelius, buxtehude, lw07, fasolo - name: disk usage on /var/log servicegroups: diskspace @@ -1530,24 +1403,44 @@ services: nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-1 + name: disk usage on /srv/farm-snapshot/farm-2017-0 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-0" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-1 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-1" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-2 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-2" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-3 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-3" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-4 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-1" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-4" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-2 + name: disk usage on /srv/farm-snapshot/farm-2017-5 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-5" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-3 + name: disk usage on /srv/farm-snapshot/farm-2017-6 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-3" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-6" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-4 + name: disk usage on /srv/farm-snapshot/farm-2017-7 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-4" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-7" hosts: sibelius - name: disk usage on /srv/ftp-master.debian.org @@ -1632,14 +1525,6 @@ services: name: processes - total hostgroups: manyprocesses nrpe: "/usr/lib/nagios/plugins/check_procs 1500 1700" - - - name: swap usage - percent - nrpe: "/usr/lib/nagios/plugins/check_swap -w 20% -c 10%" - hostgroups: computers - - - name: swap usage - mb - nrpe: "/usr/lib/nagios/plugins/check_swap -w 20000 -c 5000" - hostgroups: computers - name: free memory - mb nrpe: "/usr/lib/nagios/plugins/dsa-check-memory -m mb" @@ -1654,15 +1539,10 @@ services: hostgroups: computers excludehosts: zelenka, zandonai excludehostgroups: jessie, stretch - - - name: process - getty - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/getty" - hostgroups: jessie-freebsd - name: process - getty nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/agetty" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: processes - zombies @@ -1673,7 +1553,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-entropy" event_handler: dsa_event_handler_restart_ekey hostgroups: computers - excludehostgroups: freebsd - name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" @@ -1727,12 +1606,7 @@ services: servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - bacula-fd - servicegroups: backup - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" - hostgroups: freebsd + excludehostgroups: alioth - name: network backup status - draghi @@ -1769,9 +1643,8 @@ services: - name: upgraded libraries servicegroups: security - nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs" + nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs --ignore-younger=1h" hostgroups: computers - excludehostgroups: freebsd check_interval: 60 retry_interval: 15 notification_interval: 10080 @@ -1779,26 +1652,23 @@ services: name: installed firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/ferm.conf" hostgroups: computers - excludehostgroups: freebsd - name: puppetized firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/conf.d/defs.conf" hostgroups: computers - excludehostgroups: freebsd - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers - excludehostgroups: freebsd, sparc, jessie, stretch + excludehostgroups: sparc, jessie, stretch - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u ulog -C ulogd -a '/usr/sbin/ulogd --daemon --uid ulog'" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" - hostgroups: freebsd, sparc + hostgroups: sparc #### - name: process - samhain @@ -1826,16 +1696,11 @@ services: name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers - excludehostgroups: freebsd, jessie, stretch - - - name: process - syslog-ng - nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" - hostgroups: freebsd + excludehostgroups: jessie, stretch - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -F'" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: remote logging on lotti @@ -1893,11 +1758,6 @@ services: name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" hostgroups: computers - excludehostgroups: freebsd - - - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" - hostgroups: freebsd - name: network service - munin-node check: check_tcp!4949 @@ -1921,7 +1781,7 @@ services: name: system time synced nrpe: "/usr/lib/nagios/plugins/dsa-check-timedatectl -s" hostgroups: computers - excludehostgroups: systemd-timesyncd, freebsd, wheezy + excludehostgroups: systemd-timesyncd, wheezy servicegroups: time - name: system time synced @@ -1937,10 +1797,7 @@ services: - name: process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C irqbalance -a '/usr/sbin/irqbalance'" - #hosts: casulana hostgroups: computers - #excludehostgroups: single-cpu, freebsd - excludehostgroups: freebsd excludehosts: harris, smetana ### - @@ -1952,11 +1809,7 @@ services: name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C ud-replicated -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - ud-replicated - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C python2.7 -a '/usr/bin/python /usr/bin/ud-replicated'" - hostgroups: freebsd + excludehostgroups: alioth ### - name: process - monit @@ -2003,16 +1856,11 @@ services: name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers - excludehostgroups: freebsd, jessie, stretch + excludehostgroups: jessie, stretch - name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C systemd-udevd -a '/lib/systemd/systemd-udevd'" hostgroups: jessie, stretch - excludehostgroups: freebsd - - - name: unexpected process - udev - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" - hostgroups: freebsd ### - name: process - acpid @@ -2039,19 +1887,13 @@ services: name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" hostgroups: wheezy, jessie, stretch - excludehostgroups: freebsd, alioth + excludehostgroups: alioth - name: process - stunnel4 - puppet-ekeyd is crazy nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-stunnel-sanity" hostgroups: computers - excludehostgroups: freebsd, alioth - excludehosts: czerny, grnet-node01, storace, ubc-bl2 - ### - - - name: process - rngd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rngd -a '/usr/sbin/rngd -r /dev/hwrng'" - hostgroups: kvmdomains - excludehostgroups: stretch + excludehostgroups: alioth + excludehosts: czerny, grnet-node01, storace # }}} # {{{ anti-services - @@ -2152,12 +1994,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-controller-ok --ignore-controller='P700m'" check_interval: 120 hostgroups: bm-bl - - - name: HW - hpacucli status - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-battery" - check_interval: 120 - hosts: busoni ### # - # name: HW - edac status @@ -2208,12 +2044,10 @@ services: servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All" hostgroups: drbd-hosts - excludehosts: ubc-bl2, ubc-bl3, ubc-bl6, ubc-bl7, ubc-bl8 - - name: RAID - DRBD - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All --ok-no-devices" - hosts: ubc-bl2, ubc-bl3, ubc-bl6, ubc-bl7, ubc-bl8 + name: HW - OpenManage status + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-openmanage" + hostgroups: pe1950 # }}} # }}} # {{{ ### mail stuff @@ -2223,7 +2057,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" hostgroups: computers excludehostgroups: postfix-hosts, mail-relay - excludehosts: master, busoni, quantz, buxtehude + excludehosts: master, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" @@ -2233,11 +2067,11 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1: -C exim4" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, busoni, quantz, buxtehude + excludehosts: master, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:300 -c 1:500 -C exim4 -a '/usr/sbin/exim4'" - hosts: master, busoni, quantz, buxtehude + hosts: master, quantz, buxtehude - name: mail queue nrpe: "/usr/lib/nagios/plugins/check_mailq -M exim -w 1000 -c 2000" @@ -2283,17 +2117,17 @@ services: excludehostgroups: jessie, stretch - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 5 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 5 --helper-home-dir'" hostgroups: spamd excludehosts: picconi excludehostgroups: wheezy - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 20 --min-spare=5 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 20 --min-spare=5 --helper-home-dir'" hosts: picconi - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 10 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 10 --helper-home-dir'" hosts: bendel - name: process - spamd - child @@ -2307,7 +2141,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers excludehostgroups: spamd - excludehosts: bendel, busoni + excludehosts: bendel - name: unwanted process - greylistd @@ -2478,7 +2312,7 @@ services: name: network service - http check: check_http hostgroups: apache2-hosts - excludehosts: klecker + excludehosts: klecker, casulana depends: process - apache2 - master - name: network service - http @@ -2567,18 +2401,11 @@ services: hosts: storace, backuphost # }}} # {{{ buildd - - - name: process - buildd - servicegroups: buildd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" - hosts: fano, finzi, fils, fayrfax - contact_groups: buildd - name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" hostgroups: buildd - excludehosts: fano, finzi, fils, fayrfax contact_groups: buildd - name: processes - zombie schroot @@ -2878,10 +2705,6 @@ services: name: DNS SOA sync - 144-28.118.59.86.in-addr.arpa check: "dsa_check_soas_add!denis.debian.org!144-28.118.59.86.in-addr.arpa" hosts: global - - - name: DNS SOA sync - alioth.debian.org - check: "dsa_check_soas_add!denis.debian.org!alioth.debian.org" - hosts: global - name: DNS SOA sync - debconf.net check: "dsa_check_soas_add!denis.debian.org!debconf.net" @@ -2925,25 +2748,6 @@ services: runfrom: denis # }}} # {{{ storage - - - name: ping alive check - remotecheck: "/usr/lib/nagios/plugins/check_ping -H $HOSTADDRESS$ -w 50,10% -c 200,30%" - runfrom: ubc-bl8 - hosts: giustini - check_interval: 5 - max_check_attempts: 4 - retry_interval: 1 - - - name: Overall Unit Status - remotecheck: "/usr/lib/nagios/plugins/check_snmp -H $HOSTADDRESS$ -C public -P 2c -o connUnitStatus -n -c 3 -w 3" - runfrom: ubc-bl8 - hosts: giustini - - - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=11298 $HOSTADDRESS$ public" - runfrom: ubc-bl8 - hosts: giustini - ### - name: process - multipathd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:15 -c 1: -u root -C multipathd -a '/sbin/multipathd'" @@ -3007,9 +2811,8 @@ services: # {{{ misc - name: system - all services running - nrpe: "/usr/bin/sudo /bin/systemctl is-system-running" + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-systemd-services" hostgroups: jessie, stretch - excludehostgroups: freebsd ### - name: process - slapd @@ -3059,6 +2862,11 @@ services: check: dsa_check_cert!5061 check_interval: 60 hosts: vogler + - + name: freeradius process + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u freerad -C freeradius -a '/usr/sbin/freeradius -xx'" + check_interval: 60 + hosts: vogler #### - name: puppetmaster cert @@ -3078,3 +2886,5 @@ services: # }}} # vim: set ts=2 sw=2 et ai si fdm=marker: + +