X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=a432e4e729a08aa8841efcc3b3a67075efe12a5f;hb=e313f7d1d139ad3de5ae8d99a49f33244fc3aacb;hp=7ea069c6240bd3060c7e15950d60283cbd80d08c;hpb=4826f01dd77fbcbd97be4109401ca156f3673c14;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 7ea069c..a432e4e 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -170,17 +170,19 @@ servers: schumann: address: 212.227.126.54 parents: gw-1und1-sec - hostgroups: computers, service, stretch + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hassrvfs, pe1950 wieck: address: 195.20.242.89 parents: gw-1und1-sec - hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula, pe1950 # }}} # {{{ gw-accumu pettersson: address: 130.239.18.123 parents: gw-accumu hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, stretch, autofs, sw-raid + contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa + contact_groups: "" mirror-accumu: address: 130.242.6.199 parents: gw-accumu2 @@ -379,7 +381,7 @@ servers: philp: address: 5.153.231.13 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd, broken_https_default_vhost rainier: address: 5.153.231.16 parents: ganeti-bytemark @@ -458,18 +460,6 @@ servers: address: 5.153.231.36 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, systemd-timesyncd - mirror-bytemark: - address: 5.153.231.37 - parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, 
apache2-hosts, hassrvfs - mirror-bytemark-debian: - address: 5.153.231.45 - hostgroups: secondary-IPs - parents: mirror-bytemark - mirror-bytemark-security: - address: 5.153.231.46 - hostgroups: secondary-IPs - parents: mirror-bytemark sor: address: 5.153.231.38 parents: ganeti-bytemark @@ -498,7 +488,9 @@ servers: casulana: address: 5.153.231.41 parents: gw-bytemark - hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses + hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses, apache2-hosts + contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa + contact_groups: "" # }}} # {{{ gw-c3sl santoro: @@ -583,7 +575,7 @@ servers: hostgroups: computers, service, dl360, stretch, drbd-hosts ganeti-csail: address: 128.31.0.49 - parents: gw-bytemark + parents: gw-csail hostgroups: notacomputer mirror-csail: @@ -720,6 +712,10 @@ servers: address: 185.17.185.181 parents: gw-leaseweb hostgroups: computers, service, stretch, dl180 + lw10: + address: 185.17.185.182 + parents: gw-leaseweb + hostgroups: computers, service, stretch, dl180 # }}} # {{{ gw-karlsruhe zemlinsky: @@ -923,16 +919,6 @@ servers: address: 209.87.16.21 parents: ubc-gateway hostgroups: computers, buildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd - finzi: - address: 209.87.16.22 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph - fano: - address: 209.87.16.23 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph elgar: address: 209.87.16.24 parents: ubc-gateway @@ -1009,7 +995,7 @@ servers: godard: address: 209.87.16.44 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts, manyprocesses debussy: 
address: 209.87.16.46 parents: ubc-gateway @@ -1109,20 +1095,11 @@ hostgroups: computers: alias: computers private: 1 - extinfo-icon_image: base/debian.png - extinfo-icon_image_alt: Debian GNU/Linux - extinfo-notes_url: https://db.debian.org/machines.cgi?host=%s layer3-infrastructure: alias: Layer 3 Devices - extinfo-icon_image: base/switch40.png - extinfo-icon_image_alt: router notacomputer: alias: Systems that are not really systems. Yeah :) private: 1 - freebsd: - alias: freebsd - private: 1 - extinfo-icon_image_alt: Debian GNU/kFreeBSD armhf: alias: armhf private: 1 @@ -1166,6 +1143,9 @@ hostgroups: aacraid: alias: Hosts with Adaptec AACraid private: 1 + pe1950: + alias: Dell PowerEdge 1950 hosts + private: 1 wheezy: alias: Hosts running wheezy @@ -1367,6 +1347,12 @@ services: check_interval: 5 max_check_attempts: 4 retry_interval: 1 + - + name: network - v6 gw + nrpe: "/usr/lib/nagios/plugins/dsa-check-ipv6-default-gw" + hostgroups: computers + check_interval: 60 + excludehostgroups: alioth # }}} # {{{ ### disk usage - @@ -1424,42 +1410,42 @@ services: - name: disk usage on /srv/farm-snapshot/farm-2017-0 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-0" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-0" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-1 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-1" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-1" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-2 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-2" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-2" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-3 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 
/srv/farm-snapshot/farm-2017-3" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-3" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-4 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-4" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-4" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-5 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-5" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-5" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-6 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-6" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-6" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-2017-7 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-7" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-7" hosts: sibelius - name: disk usage on /srv/ftp-master.debian.org @@ -1469,37 +1455,47 @@ services: - name: disk usage on /storage/snapshot-farm-1 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-1" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-1" hosts: lw01 - name: disk usage on /storage/snapshot-farm-2 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-2" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-2" hosts: lw02 - name: disk usage on /storage/snapshot-farm-3 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-3" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-3" hosts: lw03 - name: disk usage on /storage/snapshot-farm-4 
servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-4" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-4" hosts: lw04 + - + name: disk usage on /storage/snapshot-farm-09 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-09" + hosts: lw09 + - + name: disk usage on /storage/snapshot-farm-10 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-10" + hosts: lw10 - name: disk usage on /srv/morgue.debian.org/ servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 95 90 /srv/morgue.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/morgue.debian.org" hosts: lw03 - name: disk usage on /srv/QNAP-big/ servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-big" + nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv/QNAP-big" hosts: storace - name: disk usage on /srv/QNAP-tiny servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-tiny" + nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/QNAP-tiny" hosts: storace # }}} # {{{ ### system @@ -1562,7 +1558,6 @@ services: name: process - getty nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/agetty" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: processes - zombies @@ -1573,7 +1568,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-entropy" event_handler: dsa_event_handler_restart_ekey hostgroups: computers - excludehostgroups: freebsd - name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" @@ -1627,12 +1621,7 @@ services: servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - bacula-fd - 
servicegroups: backup - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" - hostgroups: freebsd + excludehostgroups: alioth - name: network backup status - draghi @@ -1669,9 +1658,8 @@ services: - name: upgraded libraries servicegroups: security - nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs" + nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs --ignore-younger=1h" hostgroups: computers - excludehostgroups: freebsd check_interval: 60 retry_interval: 15 notification_interval: 10080 @@ -1679,26 +1667,23 @@ services: name: installed firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/ferm.conf" hostgroups: computers - excludehostgroups: freebsd - name: puppetized firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/conf.d/defs.conf" hostgroups: computers - excludehostgroups: freebsd - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers - excludehostgroups: freebsd, sparc, jessie, stretch + excludehostgroups: sparc, jessie, stretch - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u ulog -C ulogd -a '/usr/sbin/ulogd --daemon --uid ulog'" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" - hostgroups: freebsd, sparc + hostgroups: sparc #### - name: process - samhain @@ -1726,16 +1711,11 @@ services: name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers - excludehostgroups: freebsd, jessie, stretch - - - name: process - syslog-ng - nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" - hostgroups: freebsd + excludehostgroups: jessie, stretch 
- name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -F'" hostgroups: jessie, stretch - excludehostgroups: freebsd - name: remote logging on lotti @@ -1793,11 +1773,6 @@ services: name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" hostgroups: computers - excludehostgroups: freebsd - - - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" - hostgroups: freebsd - name: network service - munin-node check: check_tcp!4949 @@ -1821,7 +1796,7 @@ services: name: system time synced nrpe: "/usr/lib/nagios/plugins/dsa-check-timedatectl -s" hostgroups: computers - excludehostgroups: systemd-timesyncd, freebsd, wheezy + excludehostgroups: systemd-timesyncd, wheezy servicegroups: time - name: system time synced @@ -1838,7 +1813,6 @@ services: name: process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C irqbalance -a '/usr/sbin/irqbalance'" hostgroups: computers - excludehostgroups: freebsd excludehosts: harris, smetana ### - @@ -1850,11 +1824,7 @@ services: name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C ud-replicated -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - ud-replicated - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C python2.7 -a '/usr/bin/python /usr/bin/ud-replicated'" - hostgroups: freebsd + excludehostgroups: alioth ### - name: process - monit @@ -1901,16 +1871,11 @@ services: name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers - excludehostgroups: freebsd, jessie, stretch + excludehostgroups: jessie, stretch - name: process - udevd nrpe: 
"/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C systemd-udevd -a '/lib/systemd/systemd-udevd'" hostgroups: jessie, stretch - excludehostgroups: freebsd - - - name: unexpected process - udev - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" - hostgroups: freebsd ### - name: process - acpid @@ -1937,12 +1902,12 @@ services: name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" hostgroups: wheezy, jessie, stretch - excludehostgroups: freebsd, alioth + excludehostgroups: alioth - name: process - stunnel4 - puppet-ekeyd is crazy nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-stunnel-sanity" hostgroups: computers - excludehostgroups: freebsd, alioth + excludehostgroups: alioth excludehosts: czerny, grnet-node01, storace # }}} # {{{ anti-services @@ -2094,6 +2059,10 @@ services: servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All" hostgroups: drbd-hosts + - + name: HW - OpenManage status + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-openmanage" + hostgroups: pe1950 # }}} # }}} # {{{ ### mail stuff @@ -2358,7 +2327,7 @@ services: name: network service - http check: check_http hostgroups: apache2-hosts - excludehosts: klecker + excludehosts: klecker, casulana depends: process - apache2 - master - name: network service - http @@ -2447,18 +2416,11 @@ services: hosts: storace, backuphost # }}} # {{{ buildd - - - name: process - buildd - servicegroups: buildd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" - hosts: fano, finzi - contact_groups: buildd - name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" hostgroups: buildd - excludehosts: fano, finzi contact_groups: buildd - name: processes - zombie schroot @@ -2758,10 +2720,6 @@ services: name: DNS SOA sync - 
144-28.118.59.86.in-addr.arpa check: "dsa_check_soas_add!denis.debian.org!144-28.118.59.86.in-addr.arpa" hosts: global - - - name: DNS SOA sync - alioth.debian.org - check: "dsa_check_soas_add!denis.debian.org!alioth.debian.org" - hosts: global - name: DNS SOA sync - debconf.net check: "dsa_check_soas_add!denis.debian.org!debconf.net" @@ -2868,9 +2826,8 @@ services: # {{{ misc - name: system - all services running - nrpe: "/usr/bin/sudo /bin/systemctl is-system-running" + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-systemd-services" hostgroups: jessie, stretch - excludehostgroups: freebsd ### - name: process - slapd @@ -2920,6 +2877,11 @@ services: check: dsa_check_cert!5061 check_interval: 60 hosts: vogler + - + name: freeradius process + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u freerad -C freeradius -a '/usr/sbin/freeradius -xx'" + check_interval: 60 + hosts: vogler #### - name: puppetmaster cert