X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=0df6e497a3468a1b4eafb9c9e2eed4d933366ee9;hb=3fd2d79b557757398275242cebc72a71209b410d;hp=6ae71b824f661c1347ba65ac9587bfde5a0047a2;hpb=aeb6cbda8a77f88c91e4f35af91c84ab70012037;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 6ae71b8..24ce505 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -85,18 +85,10 @@ servers: address: 72.52.94.70 parents: gw-ubcece hostgroups: layer3-infrastructure - gw-karlsruhe: - address: 129.143.59.214 - parents: gw-ubcece - hostgroups: layer3-infrastructure gw-leaseweb: address: 185.17.185.190 parents: gw-ubcece hostgroups: layer3-infrastructure - gw-linaro: - address: 64.28.108.36 - parents: gw-ubcece - hostgroups: layer3-infrastructure gw-manda: address: 82.195.78.118 parents: gw-ubcece @@ -147,7 +139,7 @@ servers: parents: gw-ubcece hostgroups: layer3-infrastructure gw-unicamp: - address: 177.220.10.129 + address: 143.106.167.113 parents: gw-ubcece hostgroups: layer3-infrastructure gw-utwente: @@ -174,22 +166,23 @@ servers: schumann: address: 212.227.126.54 parents: gw-1und1-sec - hostgroups: computers, service, stretch + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hassrvfs, pe1950 wieck: address: 195.20.242.89 parents: gw-1und1-sec - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, stretch, security_mirror, hasvarlogfs, no-bacula, pe1950 # }}} # {{{ gw-accumu pettersson: address: 130.239.18.123 parents: gw-accumu - hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, jessie, autofs, sw-raid - ## No need to update to Stretch, casulana replaces it. It should eventually die. + hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, stretch, autofs, sw-raid + contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa + contact_groups: "" mirror-accumu: address: 130.242.6.199 parents: gw-accumu2 - hostgroups: computers, service, stretch, apache2-hosts, hassrvfs, rsyncd-hosts, xinetd-hosts + hostgroups: computers, service, stretch, apache2-hosts, hassrvfs, rsyncd-hosts # }}} # {{{ gw-aql eller: @@ -245,15 +238,15 @@ servers: arm-arm-01: address: 217.140.96.58 parents: gw-arm - hostgroups: computers, hassrvfs, buildd, stretch, broken_mq + hostgroups: computers, hassrvfs, buildd, stretch, broken_mq, sw-raid arm-arm-03: address: 217.140.96.60 parents: gw-arm - hostgroups: computers, hassrvfs, buildd, stretch, broken_mq + hostgroups: computers, hassrvfs, buildd, stretch, broken_mq, sw-raid arm-arm-04: address: 217.140.96.61 parents: gw-arm - hostgroups: computers, hassrvfs, buildd, stretch, broken_mq + hostgroups: computers, hassrvfs, buildd, stretch, broken_mq, sw-raid harris: address: 217.140.96.66 parents: gw-arm @@ -271,7 +264,7 @@ servers: fasolo: address: 138.16.160.17 parents: gw-brown - hostgroups: computers, service, apache2-hosts, apache-https, dl380, rsyncd-systemd-hosts, stretch, hassrvfs, postgres96-hosts, manyprocesses + hostgroups: computers, service, apache2-hosts, apache-https, dl380, rsyncd-hosts, stretch, hassrvfs, postgres96-hosts, manyprocesses # }}} # {{{ gw-bytemark bm-bl1: @@ -338,11 +331,11 @@ servers: milanollo2: address: 5.153.231.9 parents: milanollo - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts picconi: address: 5.153.231.3 parents: gw-bytemark - hostgroups: computers, service, kvmdomains, jessie, apache2-hosts, nfs-client, autofs, heavy-exim, spamd, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, nfs-client, autofs, heavy-exim, spamd, apache-https, systemd-timesyncd senfter: address: 5.153.231.4 parents: gw-bytemark @@ -368,9 +361,9 @@ servers: bmdb1: address: 5.153.231.10 parents: gw-bytemark - hostgroups: computers, hassrvfs, kvmdomains, stretch, postgres94-hosts, postgres96-hosts, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, stretch, postgres96-hosts, systemd-timesyncd ganeti-bytemark: - address: 82.195.75.111 + address: 5.153.231.1 parents: gw-bytemark hostgroups: notacomputer coccia: @@ -384,7 +377,7 @@ servers: philp: address: 5.153.231.13 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd, broken_https_default_vhost rainier: address: 5.153.231.16 parents: ganeti-bytemark @@ -396,7 +389,7 @@ servers: delfin: address: 5.153.231.17 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, jessie, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd wuiet: address: 5.153.231.18 parents: ganeti-bytemark @@ -408,25 +401,19 @@ servers: donizetti: address: 5.153.231.20 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, jessie, nfs-client, autofs, systemd-timesyncd - moszumanska: - address: 5.153.231.21 - parents: ganeti-bytemark - contact_groups: alioth-admins - hostgroups: computers, general, wheezy, postgres91-hosts, apache2-hosts, acpid-hosts, apache-https, brokensamhain, no-bacula, bind9-hosts, xinetd-hosts, alioth, heavy-exim, spamd - no-servicegroups: true + hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, systemd-timesyncd dillon: address: 5.153.231.22 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, jessie, nfs-client, autofs, hassrvfs, systemd-timesyncd + hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, hassrvfs, systemd-timesyncd ticharich: address: 5.153.231.23 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, jessie, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd + hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd petrova: address: 5.153.231.25 parents: ganeti-bytemark - hostgroups: computers, kvmdomains, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd olin: address: 5.153.231.26 parents: ganeti-bytemark @@ -438,7 +425,7 @@ servers: quantz: address: 5.153.231.28 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, nfs-client, heavy-exim, apache2-hosts, autofs, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, nfs-client, heavy-exim, apache2-hosts, autofs, apache-https, systemd-timesyncd respighi: address: 5.153.231.29 parents: ganeti-bytemark @@ -450,35 +437,23 @@ servers: x86-bm-01: address: 5.153.231.32 parents: ganeti-bytemark - hostgroups: computers, kvmdomains, stretch, no-bacula, systemd-timesyncd + hostgroups: computers, pybuildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd tate: address: 5.153.231.33 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd gideon: address: 5.153.231.34 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd lindsay: address: 5.153.231.36 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, systemd-timesyncd - mirror-bytemark: - address: 5.153.231.37 - parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, systemd-timesyncd, apache2-hosts, hassrvfs - mirror-bytemark-debian: - address: 5.153.231.45 - hostgroups: secondary-IPs - parents: mirror-bytemark - mirror-bytemark-security: - address: 5.153.231.46 - hostgroups: secondary-IPs - parents: mirror-bytemark sor: address: 5.153.231.38 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, autofs, nfs-client, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, autofs, nfs-client, systemd-timesyncd jerea: address: 5.153.231.39 parents: ganeti-bytemark @@ -486,30 +461,32 @@ servers: mekeel: address: 5.153.231.40 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, nfs-client, autofs, systemd-timesyncd pinel: address: 5.153.231.42 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, nfs-client, autofs, heavy-exim, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, nfs-client, autofs, heavy-exim, systemd-timesyncd rusca: address: 5.153.231.43 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd manziarly: address: 5.153.231.44 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd casulana: address: 5.153.231.41 parents: gw-bytemark - hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses + hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses, apache2-hosts + contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa + contact_groups: "" # }}} # {{{ gw-c3sl santoro: address: 200.17.202.197 parents: gw-c3sl - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, hassrvfs, stretch, high-RTT, security_mirror, no-bacula, apache-https + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, hassrvfs, stretch, high-RTT, security_mirror, no-bacula, apache-https contacts: faw # }}} # {{{ gw-cecsit @@ -520,11 +497,11 @@ servers: mirror-anu2: address: 150.203.164.60 parents: mirror-anu - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts mirror-anu3: address: 150.203.164.61 parents: mirror-anu - hostgroups: secondary-IPs, security_mirror + hostgroups: secondary-IPs, security_mirror, rsyncd-hosts mirror-anu4: address: 150.203.164.62 parents: mirror-anu @@ -534,11 +511,11 @@ servers: conova-node01: address: 217.196.149.227 parents: gw-conova - hostgroups: computers, stretch, service, sw-raid + hostgroups: computers, stretch, service, sw-raid, drbd-hosts conova-node02: address: 217.196.149.228 parents: gw-conova - hostgroups: computers, stretch, service, sw-raid + hostgroups: computers, stretch, service, sw-raid, drbd-hosts ganeti-conova: address: 217.196.149.235 parents: gw-conova @@ -546,22 +523,22 @@ servers: mirror-conova: address: 217.196.149.229 parents: gw-conova - hostgroups: computers, stretch, service, apache2-hosts, apache-https + hostgroups: computers, stretch, service, apache2-hosts mirror-conova-debian: address: 217.196.149.232 hostgroups: secondary-IPs parents: mirror-conova mirror-conova-security: address: 217.196.149.233 - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts, security_mirror parents: mirror-conova mirror-conova-archive: address: 217.196.149.234 - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts parents: mirror-conova mirror-conova-syncproxy4-eu: address: 217.196.149.237 - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts, https-service parents: mirror-conova arm-conova-01: @@ -576,6 +553,11 @@ servers: address: 217.196.149.236 parents: ganeti-conova hostgroups: computers, hassrvfs, porterbox, stretch + + schmelzer: + address: 185.69.161.161 + parents: gw-conova + hostgroups: computers, service, stretch, r540, manyprocesses, apache2-hosts, rsyncd-hosts, apache-https, systemd-timesyncd # }}} # {{{ gw-csail csail-node01: @@ -588,21 +570,13 @@ servers: hostgroups: computers, service, dl360, stretch, drbd-hosts ganeti-csail: address: 128.31.0.49 - parents: gw-bytemark + parents: gw-csail hostgroups: notacomputer - falla: - address: 128.31.0.65 - parents: ganeti-csail - hostgroups: computers, freebsd, hassrvfs, porterbox, jessie, jessie-freebsd - fischer: - address: 128.31.0.35 - parents: ganeti-csail - hostgroups: computers, freebsd, hassrvfs, porterbox, jessie mirror-csail: address: 128.31.0.62 parents: ganeti-csail - hostgroups: computers, service, hassrvfs, kvmdomains, stretch, apache2-hosts, rsyncd-systemd-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, hassrvfs, kvmdomains, stretch, apache2-hosts, rsyncd-hosts, apache-https, systemd-timesyncd x86-csail-01: address: 128.31.0.50 parents: ganeti-csail @@ -614,11 +588,11 @@ servers: soriano: address: 128.31.0.67 parents: ganeti-csail - hostgroups: computers, service, kvmdomains, hassrvfs, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, hassrvfs, stretch, apache2-hosts, apache-https, systemd-timesyncd pkgmirror-csail: address: 128.31.0.51 parents: ganeti-csail - hostgroups: computers, service, kvmdomains, jessie, apache2-hosts, no-bacula, apache-https, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, no-bacula, apache-https, hassrvfs, systemd-timesyncd, varnish-hosts usper: address: 128.31.0.69 parents: ganeti-csail @@ -634,7 +608,7 @@ servers: sechter: address: 128.61.240.73 parents: gw-gatech - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, sw-raid, hasbootfs, hassrvfs, stretch, security_mirror + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, sw-raid, hasbootfs, hassrvfs, stretch, security_mirror # }}} # {{{ gw-grnet ganeti-grnet: @@ -660,11 +634,11 @@ servers: cgi-grnet-01: address: 194.177.211.202 parents: gw-grnet - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https, xinetd-hosts, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, xinetd-hosts, systemd-timesyncd x86-grnet-01: address: 194.177.211.203 parents: ganeti-grnet - hostgroups: computers, buildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd + hostgroups: computers, pybuildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd vittoria: address: 194.177.211.205 parents: ganeti-grnet @@ -676,11 +650,11 @@ servers: porta: address: 194.177.211.207 parents: ganeti-grnet - hostgroups: computers, service, hassrvfs, kvmdomains, stretch, rsyncd-systemd-hosts, systemd-timesyncd + hostgroups: computers, service, hassrvfs, kvmdomains, stretch, rsyncd-hosts, systemd-timesyncd melartin: address: 194.177.211.208 parents: ganeti-grnet - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, postgres96-hosts + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, postgres96-hosts, hassrvfs static-master-grnet-01: address: 194.177.211.209 parents: ganeti-grnet @@ -690,11 +664,11 @@ servers: mirror-isc: address: 149.20.4.13 parents: gw-isc - hostgroups: computers, service, apache2-hosts, apache-https, dl360, hassrvfs, xinetd-hosts, stretch, security_mirror + hostgroups: computers, service, apache2-hosts, apache-https, dl360, hassrvfs, xinetd-hosts, stretch mirror-isc2: address: 149.20.4.14 parents: mirror-isc - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts, security_mirror mirror-isc3: address: 149.20.4.15 parents: mirror-isc @@ -702,94 +676,80 @@ servers: mirror-isc-syncproxy: address: 149.20.4.16 parents: mirror-isc - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts # }}} # {{{ gw-leaseweb lw01: address: 185.17.185.177 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-server, rsyncd-systemd-hosts + hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts lw02: address: 185.17.185.178 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-server, rsyncd-systemd-hosts + hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts lw03: address: 185.17.185.179 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-server, rsyncd-systemd-hosts + hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts lw04: address: 185.17.185.180 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-server, rsyncd-systemd-hosts + hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts lw07: address: 185.17.185.187 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, postgres94-hosts, apache2-hosts + hostgroups: computers, service, stretch, dl180, nfs-client, autofs, hassrvfs, postgres96-hosts, apache2-hosts, haproxy-hosts, haproxy-https-host, varnish-hosts + lw07-2: + address: 185.17.185.185 + parents: lw07 + hostgroups: secondary-IPs, https-service + lw08: address: 185.17.185.189 parents: gw-leaseweb - hostgroups: computers, service, jessie, dl180, nfs-client, autofs, hassrvfs, apache2-hosts - # }}} - # {{{ gw-linaro - arm-linaro-01: - address: 64.28.108.83 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, buildd, stretch, broken_mq - arm-linaro-03: - address: 64.28.108.85 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, buildd, stretch, broken_mq - asachi: - address: 64.28.108.84 - parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, porterbox, stretch, broken_mq - # }}} - # {{{ gw-karlsruhe - zemlinsky: - address: 129.143.160.6 - parents: gw-karlsruhe - hostgroups: computers, buildd, stretch - contacts: pkern + hostgroups: computers, service, stretch, dl180, nfs-client, autofs, hassrvfs, apache2-hosts + lw09: + address: 185.17.185.181 + parents: gw-leaseweb + hostgroups: computers, service, stretch, dl180 + lw10: + address: 185.17.185.182 + parents: gw-leaseweb + hostgroups: computers, service, stretch, dl180 # }}} # {{{ gw-manda czerny: address: 82.195.75.109 parents: gw-manda - hostgroups: computers, service, dl380, acpid-hosts, jessie, drbd-hosts + hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts, manyprocesses clementi: address: 82.195.75.103 parents: gw-manda - hostgroups: computers, service, dl380, acpid-hosts, jessie, drbd-hosts + hostgroups: computers, service, dl380, acpid-hosts, stretch, drbd-hosts, manyprocesses + manda-node03: + address: 82.195.75.69 + parents: gw-manda + hostgroups: computers, service, stretch, r540, drbd-hosts, manyprocesses + manda-node04: + address: 82.195.75.70 + parents: gw-manda + hostgroups: computers, service, stretch, r540, drbd-hosts, manyprocesses bendel: address: 82.195.75.100 parents: ganeti3 - hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, jessie, postfix-hosts, heavy-postfix, apache-https, amavis-hosts, hasvarlogfs + hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, stretch, postfix-hosts, heavy-postfix, apache-https, amavis-hosts, hasvarlogfs master: address: 82.195.75.110 parents: ganeti3 - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, spamd, heavy-exim, highload - fils: - address: 82.195.75.89 - parents: ganeti3 - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph - fayrfax: - address: 82.195.75.82 - parents: ganeti3 - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, spamd, heavy-exim, highload vento: address: 82.195.75.98 parents: ganeti3 hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, heavy-exim - lully: - address: 82.195.75.99 - parents: ganeti3 - hostgroups: computers, service, hasbootfs, kvmdomains, stretch, hasvarlogfs draghi: address: 82.195.75.106 parents: ganeti3 - hostgroups: computers, service, hasbootfs, hassrvfs, apache2-hosts, spamd, heavy-exim, kvmdomains, xinetd-hosts, apache-https, stretch + hostgroups: computers, service, hassrvfs, apache2-hosts, spamd, heavy-exim, kvmdomains, xinetd-hosts, apache-https, stretch geo1: address: 82.195.75.105 parents: ganeti3 @@ -797,11 +757,11 @@ servers: handel: address: 82.195.75.104 parents: ganeti3 - hostgroups: computers, service, kvmdomains, apache2-hosts, stretch, postgres96-hosts + hostgroups: computers, service, kvmdomains, apache2-hosts, stretch, postgres96-hosts, hassrvfs kaufmann: address: 82.195.75.107 parents: ganeti3 - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, kvmdomains, stretch, apache-https + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, kvmdomains, stretch, apache-https ganeti3: address: 82.195.75.111 parents: gw-manda @@ -809,7 +769,7 @@ servers: wilder: address: 82.195.75.112 parents: ganeti3 - hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, jessie, apache-https, rsyncd-systemd-hosts + hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, stretch, apache-https, rsyncd-hosts mailly: address: 82.195.75.114 parents: ganeti3 @@ -821,11 +781,11 @@ servers: vogler: address: 82.195.75.92 parents: ganeti3 - hostgroups: computers, service, kvmdomains, jessie + hostgroups: computers, service, kvmdomains, stretch wolkenstein: address: 82.195.75.65 parents: ganeti3 - hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, apache2-hosts, jessie, apache-https + hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, apache2-hosts, stretch, apache-https mips-manda-01: address: 82.195.75.66 parents: gw-manda @@ -845,7 +805,7 @@ servers: seger: address: 82.195.75.93 parents: ganeti3 - hostgroups: computers, service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-systemd-hosts, uploadqueue, kvmdomains, apache-https, postgres94-hosts, jessie + hostgroups: computers, service, apache2-hosts, hassrvfs, rsyncd-hosts, kvmdomains, apache-https, postgres96-hosts, stretch suchon: address: 82.195.75.68 parents: ganeti3 @@ -855,14 +815,9 @@ servers: zani: address: 148.100.88.22 parents: gw-marist - hostgroups: computers, buildd, hassrvfs, stretch, incomingmailrelayed + hostgroups: computers, pybuildd, hassrvfs, stretch, incomingmailrelayed # }}} # {{{ gw-osuosl - busoni: - address: 140.211.166.202 - parents: gw-osuosl - hostgroups: computers, service, dl360, hassrvfs, jessie, hasvarlogfs, apache2-hosts, no-bacula, apache-https - byrd: address: 140.211.166.200 parents: gw-osuosl @@ -870,7 +825,16 @@ servers: beach: address: 140.211.166.201 parents: byrd - hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, hassrvfs, rsyncd-systemd-hosts, apache-https + hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, hassrvfs, rsyncd-hosts, apache-https + + pijper: + address: 140.211.166.194 + parents: gw-osuosl + hostgroups: computers, stretch, service, manyprocesses + loghost-osuosl-01: + address: 140.211.166.202 + parents: pijper + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd pieta: address: 140.211.166.195 @@ -878,46 +842,33 @@ servers: hostgroups: computers, stretch, service, manyprocesses ppc64el-osuosl-01: address: 140.211.166.196 - parents: pieta + parents: pijper hostgroups: computers, hassrvfs, buildd, stretch - powerpc-osuosl-01: - address: 140.211.166.197 - parents: pieta - hostgroups: computers, hassrvfs, buildd, jessie - pizzetti: - address: 140.211.166.198 - parents: pieta - hostgroups: computers, jessie, hassrvfs, porterbox - partch: - address: 140.211.15.152 - parents: gw-osuosl - hostgroups: computers, jessie, hassrvfs, porterbox, sw-raid # }}} # {{{ gw-sanger sallinen: address: 193.62.202.26 parents: gw-sanger - hostgroups: computers, service, stretch, dl380, nfs-client, autofs + hostgroups: computers, service, stretch, dl380, nfs-client, autofs, postgres96-hosts, apache2-hosts, haproxy-hosts, haproxy-https-host, varnish-hosts + sallinen-2: + address: 193.62.202.27 + parents: sallinen + hostgroups: secondary-IPs, https-service sibelius: address: 193.62.202.28 parents: gw-sanger - hostgroups: computers, postgres94-hosts, service, apache2-hosts, sw-raid, jessie, rsyncd-systemd-hosts, hasvarlogfs, multipath-hosts, nfs-server - contacts: tjrc1, dave - smetana: - address: 193.62.202.29 - parents: gw-sanger - hostgroups: computers, sw-raid, sparc, wheezy, no-bacula + hostgroups: computers, service, apache2-hosts, sw-raid, jessie, rsyncd-hosts, hasvarlogfs, multipath-hosts, nfs-server, varnish-hosts contacts: tjrc1, dave # }}} # {{{ gw-scanplus lobos: address: 212.211.132.250 parents: gw-scanplus-lobos - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, dl380, hassrvfs, stretch, security_mirror + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hassrvfs, stretch, security_mirror villa: address: 212.211.132.32 parents: gw-scanplus-villa - hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, dl360, hassrvfs, stretch, security_mirror + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl360, hassrvfs, stretch, security_mirror # }}} # {{{ gw-sil eberlin: @@ -939,66 +890,6 @@ servers: parents: gw-skroutz1, gw-skroutz2 hostgroups: computers, stretch, service, sw-raid, hassrvfs, apache2-hosts # }}} - # {{{ gw-ubcece - sw-ubcece: - hostgroups: layer2-infrastructure - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - sw-ubcece-mcld: - hostgroups: layer2-infrastructure - parents: sw-ubcece - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - sw-ubcece-kais: - hostgroups: layer2-infrastructure - parents: sw-ubcece - contacts: lfilipoz - pingable: false - check_command: dsa_check_always_ok - spontini: - address: 206.12.19.14 - parents: sw-ubcece-mcld - hostgroups: computers, buildd, hasbootfs, hassrvfs, sparc, wheezy - contacts: lfilipoz - ubc-bl7: - address: 206.12.19.217 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl6: - address: 206.12.19.216 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl2: - address: 206.12.19.212 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl3: - address: 206.12.19.213 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl4: - address: 206.12.19.214 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - ubc-bl8: - address: 206.12.19.218 - parents: sw-ubcece-kais - hostgroups: computers, bl460, acpid-hosts, service, jessie, drbd-hosts, multipath-hosts - # MSA 2000 (2012i) - giustini: - address: 192.168.2.6 - parents: sw-ubcece-kais - hostgroups: notacomputer - # unless we implement runfrom for host alive checks - pingable: false - check_command: dsa_check_always_ok -# locke: -# address: 206.12.19.120 -# parents: sw-ubcece-kais -# hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa - # }}} # {{{ ubc-gateway ubc-enc2bl01: address: 209.87.16.1 @@ -1020,29 +911,19 @@ servers: rachmaninoff: address: 209.87.16.20 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd x86-ubc-01: address: 209.87.16.21 parents: ubc-gateway hostgroups: computers, buildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd - finzi: - address: 209.87.16.22 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph - fano: - address: 209.87.16.23 - parents: ubc-gateway - hostgroups: computers, freebsd, jessie, buildd, hassrvfs - contacts: christoph elgar: address: 209.87.16.24 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd gombert: address: 209.87.16.25 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd nono: address: 209.87.16.26 parents: ubc-gateway @@ -1058,11 +939,11 @@ servers: menotti: address: 209.87.16.29 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd danzi: address: 209.87.16.30 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, postgres94-hosts, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, postgres96-hosts, systemd-timesyncd geo2: address: 209.87.16.31 parents: ubc-gateway @@ -1078,7 +959,7 @@ servers: sonntag: address: 209.87.16.34 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, nfs-client, autofs, systemd-timesyncd tchaikovsky: address: 209.87.16.35 parents: ubc-gateway @@ -1090,7 +971,7 @@ servers: tye: address: 209.87.16.37 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, jessie, heavy-exim, apache2-hosts, apache-https, nfs-client, autofs, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, stretch, heavy-exim, apache2-hosts, apache-https, nfs-client, autofs, hassrvfs, systemd-timesyncd ullmann: address: 209.87.16.38 parents: ubc-gateway @@ -1111,25 +992,33 @@ servers: godard: address: 209.87.16.44 parents: ubc-gateway - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts + hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts, crazymanyprocesses + debussy: + address: 209.87.16.46 + parents: ubc-gateway + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https, broken_https_default_vhost + grabbe: + address: 209.87.16.48 + parents: ubc-gateway + hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https # }}} # {{{ gw-umn #saens: # address: 128.101.240.212 # parents: gw-umn - # hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula + # hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula mirror-umn: address: 128.101.240.212 parents: gw-umn - hostgroups: computers, service, apache2-hosts, apache-https, dl360, hassrvfs, stretch, security_mirror + hostgroups: computers, service, apache2-hosts, apache-https, dl360, hassrvfs, stretch mirror-umn2: address: 128.101.240.215 parents: mirror-umn - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts, security_mirror mirror-umn3: address: 128.101.240.216 parents: mirror-umn - hostgroups: secondary-IPs + hostgroups: secondary-IPs, rsyncd-hosts mirror-umn4: address: 128.101.240.217 parents: mirror-umn @@ -1137,19 +1026,15 @@ servers: # }}} # {{{ gw-unicamp prokofiev: - address: 177.220.10.140 + address: 143.106.167.124 parents: gw-unicamp hostgroups: computers, stretch, service, manyprocesses - powerpc-unicamp-01: - address: 177.220.10.141 - parents: prokofiev - hostgroups: computers, hassrvfs, buildd, jessie ppc64el-unicamp-01: - address: 177.220.10.142 + address: 143.106.167.121 parents: prokofiev hostgroups: computers, hassrvfs, buildd, stretch plummer: - address: 177.220.10.143 + address: 143.106.167.122 parents: prokofiev hostgroups: computers, porterbox, hassrvfs, stretch # }}} @@ -1157,7 +1042,7 @@ servers: klecker: address: 130.89.148.10 parents: gw-utwente - hostgroups: computers, service, apache2-hosts, apache-https, rsyncd-systemd-hosts, dl380, jessie, incomingmailrelayed2025, hassrvfs + hostgroups: computers, service, apache2-hosts, apache-https, rsyncd-hosts, dl380, stretch, incomingmailrelayed2025, hassrvfs klecker-ftp: address: 130.89.148.12 parents: klecker @@ -1170,6 +1055,10 @@ servers: address: 130.89.148.14 parents: klecker hostgroups: secondary-IPs + smit: + address: 130.89.148.78 + parents: gw-utwente + hostgroups: computers, service, stretch, r540, manyprocesses, incomingmailrelayed2025 # }}} # {{{ gw-ynic henze: @@ -1199,7 +1088,7 @@ servers: setoguchi: address: 133.242.99.74 parents: gw-sakura - hostgroups: computers, service, stretch, no-bacula, hassrvfs, apache2-hosts, rsyncd-systemd-hosts, security_mirror + hostgroups: computers, service, stretch, no-bacula, hassrvfs, apache2-hosts, rsyncd-hosts, security_mirror # }}} # {{{ ############################# host groups ############################# @@ -1207,30 +1096,14 @@ hostgroups: computers: alias: computers private: 1 - extinfo-icon_image: base/debian.png - extinfo-icon_image_alt: Debian GNU/Linux - extinfo-notes_url: https://db.debian.org/machines.cgi?host=%s - layer2-infrastructure: - alias: Layer 2 Devices - extinfo-icon_image: base/switch40.png - extinfo-icon_image_alt: switch layer3-infrastructure: alias: Layer 3 Devices - extinfo-icon_image: base/switch40.png - extinfo-icon_image_alt: router notacomputer: alias: Systems that are not really systems. Yeah :) private: 1 - freebsd: - alias: freebsd - private: 1 - extinfo-icon_image_alt: Debian GNU/kFreeBSD armhf: alias: armhf private: 1 - sparc: - alias: sparc - private: 1 porterbox: alias: developer accessible porter machines @@ -1238,6 +1111,8 @@ hostgroups: alias: machines running services buildd: alias: buildd systems + pybuildd: + alias: buildd systems running pybuildd general: alias: general purpose developer accessible machines @@ -1268,13 +1143,15 @@ hostgroups: aacraid: alias: Hosts with Adaptec AACraid private: 1 + pe1950: + alias: Dell PowerEdge 1950 hosts + private: 1 + r540: + alias: Dell PowerEdge R540 hosts + private: 1 - wheezy: - alias: Hosts running wheezy jessie: alias: Hosts running jessie - jessie-freebsd: - alias: kFreebsd hosts running jessie stretch: alias: Hosts running stretch @@ -1311,20 +1188,11 @@ hostgroups: alias: hosts running amavis private: 1 rsyncd-hosts: - alias: hosts providing rsync services via xinetd - private: 1 - rsyncd-systemd-hosts: - alias: hosts providing rsync services via systemd + alias: hosts providing rsync services private: 1 xinetd-hosts: alias: hosts providing services via xinetd private: 1 - postgres91-hosts: - alias: hosts running postgres91 - private: 1 - postgres94-hosts: - alias: hosts running postgres94 - private: 1 postgres96-hosts: alias: hosts running postgres96 private: 1 @@ -1346,11 +1214,25 @@ hostgroups: apache-https: alias: hosts with https services private: 1 + https-service: + alias: https service for secondary addresses + private: 1 broken_https_default_vhost: alias: https default vhost does not say 200 OK private: 1 manyprocesses: alias: hosts with lots and lots of (kernel) processes + crazymanyprocesses: + alias: hosts with stupidly lots of processes + varnish-hosts: + alias: hosts running varnish + private: 1 + haproxy-hosts: + alias: hosts running haproxy + private: 1 + haproxy-https-host: + alias: "host providing https on the standard port via haproxy" + private: 1 no-bacula: alias: hosts which are not being backed up with bacula @@ -1402,9 +1284,6 @@ hostgroups: high-RTT: alias: machines with high round trip times private: 1 - alioth: - alias: machines that just are just awkward - private: 1 #openstack-compute: # alias: nodes that run OpenStack compute # private: 1 @@ -1471,6 +1350,11 @@ services: check_interval: 5 max_check_attempts: 4 retry_interval: 1 + - + name: network - v6 gw + nrpe: "/usr/lib/nagios/plugins/dsa-check-ipv6-default-gw" + hostgroups: computers + check_interval: 60 # }}} # {{{ ### disk usage - @@ -1504,7 +1388,7 @@ services: name: disk usage on /var/lib/postgresql servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/lib/postgresql" - hosts: sibelius, busoni, buxtehude, lw07, fasolo + hosts: sibelius, buxtehude, lw07, fasolo - name: disk usage on /var/log servicegroups: diskspace @@ -1526,24 +1410,44 @@ services: nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-1 + name: disk usage on /srv/farm-snapshot/farm-2017-0 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-0" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-1 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-1" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-2 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-2" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-3 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-1" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-3" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-2 + name: disk usage on /srv/farm-snapshot/farm-2017-4 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-4" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-3 + name: disk usage on /srv/farm-snapshot/farm-2017-5 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-3" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-5" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-4 + name: disk usage on /srv/farm-snapshot/farm-2017-6 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-4" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-6" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2017-7 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-7" hosts: sibelius - name: disk usage on /srv/ftp-master.debian.org @@ -1553,37 +1457,79 @@ services: - name: disk usage on /storage/snapshot-farm-1 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-1" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-1" hosts: lw01 - name: disk usage on /storage/snapshot-farm-2 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-2" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-2" hosts: lw02 - name: disk usage on /storage/snapshot-farm-3 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-3" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-3" hosts: lw03 - name: disk usage on /storage/snapshot-farm-4 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-4" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-4" hosts: lw04 + - + name: disk usage on /storage/snapshot-farm-90 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-09" + hosts: lw09 + - + name: disk usage on /storage/snapshot-farm-10 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-10" + hosts: lw10 + + - + name: disk usage on nfs farm 1 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-1" + hosts: lw07 + - + name: disk usage on nfs farm 2 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-2" + hosts: lw07 + - + name: disk usage on nfs farm 3 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-3" + hosts: lw07 + - + name: disk usage on nfs farm 4 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-4" + hosts: lw07 + - + name: disk usage on nfs farm 09 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-09" + hosts: lw07 + - + name: disk usage on nfs farm 10 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /auto.dsa/snapshot-10" + hosts: lw07 + - name: disk usage on /srv/morgue.debian.org/ servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 95 90 /srv/morgue.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/morgue.debian.org" hosts: lw03 - name: disk usage on /srv/QNAP-big/ servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-big" + nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv/QNAP-big" hosts: storace - name: disk usage on /srv/QNAP-tiny servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-tiny" + nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/QNAP-tiny" hosts: storace # }}} # {{{ ### system @@ -1593,7 +1539,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-config" hostgroups: computers check_interval: 60 - excludehostgroups: alioth - name: setup - local hostname etc-hosts nrpe: 'if getent ahosts `hostname` | grep -q 127.0; then echo "Warning: local hostname resolves to 127/8 address"; exit 1; else echo "OK: Hostname resolves to non-127/8 address."; exit 0; fi' @@ -1623,19 +1568,15 @@ services: name: processes - total nrpe: "/usr/lib/nagios/plugins/check_procs 620 700" hostgroups: computers - excludehostgroups: manyprocesses + excludehostgroups: manyprocesses, crazymanyprocesses - name: processes - total hostgroups: manyprocesses nrpe: "/usr/lib/nagios/plugins/check_procs 1500 1700" - - name: swap usage - percent - nrpe: "/usr/lib/nagios/plugins/check_swap -w 20% -c 10%" - hostgroups: computers - - - name: swap usage - mb - nrpe: "/usr/lib/nagios/plugins/check_swap -w 20000 -c 5000" - hostgroups: computers + name: processes - total + hostgroups: crazymanyprocesses + nrpe: "/usr/lib/nagios/plugins/check_procs 15000 25000" - name: free memory - mb nrpe: "/usr/lib/nagios/plugins/dsa-check-memory -m mb" @@ -1644,21 +1585,10 @@ services: name: free memory - percent nrpe: "/usr/lib/nagios/plugins/dsa-check-memory -m pct" hostgroups: computers - - - name: process - getty - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C getty -a /sbin/getty" - hostgroups: computers - excludehosts: zelenka, zandonai - excludehostgroups: jessie, stretch - - - name: process - getty - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/getty" - hostgroups: jessie-freebsd - name: process - getty nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/agetty" - hostgroups: jessie, stretch - excludehostgroups: freebsd + hostgroups: computers - name: processes - zombies @@ -1669,7 +1599,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-entropy" event_handler: dsa_event_handler_restart_ekey hostgroups: computers - excludehostgroups: freebsd - name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" @@ -1701,7 +1630,7 @@ services: remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula $HOSTNAME$.debian.org" runfrom: dinis hostgroups: computers - excludehostgroups: buildd, porterbox, no-bacula + excludehostgroups: buildd, pybuildd, porterbox, no-bacula check_interval: 60 retry_interval: 15 - @@ -1710,7 +1639,7 @@ services: remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula -w 1080 -c 1560 $HOSTNAME$.debian.org F" runfrom: dinis hostgroups: computers - excludehostgroups: buildd, porterbox, no-bacula + excludehostgroups: buildd, pybuildd, porterbox, no-bacula check_interval: 60 retry_interval: 15 - @@ -1723,12 +1652,6 @@ services: servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - bacula-fd - servicegroups: backup - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" - hostgroups: freebsd - name: network backup status - draghi @@ -1765,9 +1688,8 @@ services: - name: upgraded libraries servicegroups: security - nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs" + nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs --ignore-younger=1h" hostgroups: computers - excludehostgroups: freebsd check_interval: 60 retry_interval: 15 notification_interval: 10080 @@ -1775,26 +1697,14 @@ services: name: installed firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/ferm.conf" hostgroups: computers - excludehostgroups: freebsd - name: puppetized firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/conf.d/defs.conf" hostgroups: computers - excludehostgroups: freebsd - - - name: process - ulogd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" - hostgroups: computers - excludehostgroups: freebsd, sparc, jessie, stretch - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u ulog -C ulogd -a '/usr/sbin/ulogd --daemon --uid ulog'" - hostgroups: jessie, stretch - excludehostgroups: freebsd - - - name: unexpected process - ulogd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" - hostgroups: freebsd, sparc + hostgroups: computers #### - name: process - samhain @@ -1818,39 +1728,26 @@ services: excludehostgroups: brokensamhain # }}} # {{{ logging - - - name: process - syslog-ng - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" - hostgroups: computers - excludehostgroups: freebsd, jessie, stretch - - - name: process - syslog-ng - nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" - hostgroups: freebsd - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -F'" - hostgroups: jessie, stretch - excludehostgroups: freebsd + hostgroups: computers - name: remote logging on lotti remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" runfrom: lotti hostgroups: computers - excludehostgroups: alioth - - name: remote logging on lully + name: remote logging on loghost-grnet-01 remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" - runfrom: lully + runfrom: loghost-grnet-01 hostgroups: computers - excludehostgroups: alioth - - name: remote logging on loghost-grnet-01 + name: remote logging on loghost-osuosl-01 remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" - runfrom: loghost-grnet-01 + runfrom: loghost-osuosl-01 hostgroups: computers - excludehostgroups: alioth # }}} # {{{ base service - @@ -1889,11 +1786,6 @@ services: name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" hostgroups: computers - excludehostgroups: freebsd - - - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" - hostgroups: freebsd - name: network service - munin-node check: check_tcp!4949 @@ -1917,7 +1809,7 @@ services: name: system time synced nrpe: "/usr/lib/nagios/plugins/dsa-check-timedatectl -s" hostgroups: computers - excludehostgroups: systemd-timesyncd, freebsd, wheezy + excludehostgroups: systemd-timesyncd servicegroups: time - name: system time synced @@ -1933,11 +1825,8 @@ services: - name: process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C irqbalance -a '/usr/sbin/irqbalance'" - #hosts: casulana hostgroups: computers - #excludehostgroups: single-cpu, freebsd - excludehostgroups: freebsd - excludehosts: harris, smetana + excludehosts: harris ### - name: process - cron @@ -1948,17 +1837,6 @@ services: name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C ud-replicated -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: computers - excludehostgroups: freebsd, alioth - - - name: process - ud-replicated - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C python2.7 -a '/usr/bin/python /usr/bin/ud-replicated'" - hostgroups: freebsd - ### - - - name: process - monit - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: computers - excludehostgroups: alioth, jessie, stretch ### - name: MQ connection on rainier @@ -1968,7 +1846,7 @@ services: hostgroups: computers check_interval: 60 retry_interval: 15 - excludehostgroups: alioth, broken_mq + excludehostgroups: broken_mq - name: MQ connection on rapoport servicegroups: MQ @@ -1977,7 +1855,7 @@ services: hostgroups: computers check_interval: 60 retry_interval: 15 - excludehostgroups: alioth, broken_mq + excludehostgroups: broken_mq ### - name: local resolver @@ -1988,33 +1866,21 @@ services: name: process - unbound nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u unbound -C unbound -a '/usr/sbin/unbound'" hostgroups: computers - excludehostgroups: alioth - ### - - name: process - uptimed - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C uptimed -a '/usr/sbin/uptimed'" + name: unbound trust anchors + nrpe: "/usr/lib/nagios/plugins/dsa-check-unbound-anchors" hostgroups: computers + check_interval: 60 ### - - name: process - udevd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" + name: process - uptimed + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C uptimed -a '/usr/sbin/uptimed'" hostgroups: computers - excludehostgroups: freebsd, jessie, stretch - name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C systemd-udevd -a '/lib/systemd/systemd-udevd'" - hostgroups: jessie, stretch - excludehostgroups: freebsd - - - name: unexpected process - udev - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" - hostgroups: freebsd + hostgroups: computers ### - - - name: process - acpid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C acpid -a '/usr/sbin/acpid'" - hostgroups: acpid-hosts - excludehostgroups: jessie, stretch - name: unexpected process - acpid nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C acpid" @@ -2034,20 +1900,12 @@ services: - name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" - hostgroups: wheezy, jessie, stretch - excludehostgroups: freebsd, alioth + hostgroups: computers - name: process - stunnel4 - puppet-ekeyd is crazy nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-stunnel-sanity" hostgroups: computers - excludehostgroups: freebsd, alioth - excludehosts: czerny, grnet-node01, storace, ubc-bl2 - ### - - - name: process - rngd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rngd -a '/usr/sbin/rngd -r /dev/hwrng'" - hostgroups: kvmdomains - excludehostgroups: stretch + excludehosts: czerny, grnet-node01, storace # }}} # {{{ anti-services - @@ -2100,30 +1958,18 @@ services: name: "sso CRL" nrpe: "if [ -e /var/lib/dsa/sso/ca.crl ]; then /usr/lib/nagios/plugins/dsa-check-crl-expire -w 129600 -c 86400 /var/lib/dsa/sso/ca.crl; else echo 'No sso/ca.crl on this host.'; fi" hostgroups: computers - - - name: SSL certs - puppet - hosts: global - remotecheck: "/usr/lib/nagios/plugins/dsa-check-cert-expire-dir /etc/puppet/modules/ssl/files/servicecerts" - runfrom: handel - name: SSL certs - LE hosts: global - remotecheck: "/usr/lib/nagios/plugins/dsa-check-cert-expire-dir /etc/puppet/modules/ssl/files/from-letsencrypt" + remotecheck: "/usr/lib/nagios/plugins/dsa-check-cert-expire-dir /srv/puppet.debian.org/from-letsencrypt" runfrom: handel # }}} # {{{ HW health/raid - - - name: process - mdadm monitor - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" - hostgroups: sw-raid - excludehostgroups: jessie, stretch - name: process - mdadm monitor servicegroups: raid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --scan'" hostgroups: sw-raid - excludehostgroups: wheezy - name: RAID - sw raid servicegroups: raid @@ -2148,12 +1994,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-controller-ok --ignore-controller='P700m'" check_interval: 120 hostgroups: bm-bl - - - name: HW - hpacucli status - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-battery" - check_interval: 120 - hosts: busoni ### # - # name: HW - edac status @@ -2204,12 +2044,15 @@ services: servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All" hostgroups: drbd-hosts - excludehosts: ubc-bl2, ubc-bl3, ubc-bl6, ubc-bl7, ubc-bl8 - - name: RAID - DRBD - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All --ok-no-devices" - hosts: ubc-bl2, ubc-bl3, ubc-bl6, ubc-bl7, ubc-bl8 + name: HW - OpenManage status + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-openmanage" + hostgroups: pe1950, r540 + excludehosts: wieck, schumann + - + name: HW - OpenManage status + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-openmanage -b bp=0 -b bat_charge=0:0" + hosts: wieck, schumann # }}} # }}} # {{{ ### mail stuff @@ -2219,7 +2062,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" hostgroups: computers excludehostgroups: postfix-hosts, mail-relay - excludehosts: master, busoni, quantz, buxtehude + excludehosts: master, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" @@ -2229,15 +2072,24 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1: -C exim4" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, busoni, quantz, buxtehude + excludehosts: master, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:300 -c 1:500 -C exim4 -a '/usr/sbin/exim4'" - hosts: master, busoni, quantz, buxtehude + hosts: master, quantz, buxtehude - name: mail queue nrpe: "/usr/lib/nagios/plugins/check_mailq -M exim -w 1000 -c 2000" hostgroups: heavy-exim + - + name: process - fail2ban + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -C fail2ban-server" + hostgroups: heavy-exim, heavy-postfix + - + name: unwanted process - fail2ban + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C fail2ban-server" + hostgroups: computers + excludehostgroups: heavy-exim, heavy-postfix # }}} # {{{ clamav - @@ -2249,16 +2101,10 @@ services: nrpe: "/usr/lib/nagios/plugins/check_clamd -H /var/run/clamav/clamd.ctl" hostgroups: heavy-exim, heavy-postfix depends: process - clamav - clamd - - - name: process - clamav - freshclam - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --quiet'" - hostgroups: heavy-exim, heavy-postfix - excludehostgroups: jessie, stretch - name: process - clamav - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --foreground=true'" hostgroups: heavy-exim, heavy-postfix - excludehostgroups: wheezy - name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" @@ -2273,23 +2119,16 @@ services: # {{{ anti-spam - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" - hostgroups: spamd - excludehosts: picconi - excludehostgroups: jessie, stretch - - - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 5 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 5 --helper-home-dir'" hostgroups: spamd excludehosts: picconi - excludehostgroups: wheezy - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 20 --min-spare=5 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 20 --min-spare=5 --helper-home-dir'" hosts: picconi - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 10 --helper-home-dir'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamd.pid --create-prefs --max-children 10 --helper-home-dir'" hosts: bendel - name: process - spamd - child @@ -2303,7 +2142,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers excludehostgroups: spamd - excludehosts: bendel, busoni + excludehosts: bendel - name: unwanted process - greylistd @@ -2311,16 +2150,10 @@ services: hostgroups: computers ### - - - name: process - postgrey - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --unix=/var/run/postgrey/socket --retry-window=4 --auto-whitelist-clients=10 --exim'" - hostgroups: heavy-exim - excludehostgroups: jessie, stretch - name: process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a 'postgrey --pidfile=/var/run/postgrey.pid --daemonize --unix=/var/run/postgrey/socket --retry-window=4 --auto-whitelist-clients=10 --exim'" hostgroups: heavy-exim - excludehostgroups: wheezy - name: process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a 'postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" @@ -2351,62 +2184,42 @@ services: - name: process - weightd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u polw -a 'policyd-weight (master)'" - hostgroups: heavy-postfix, alioth + hostgroups: heavy-postfix - name: process - weightd - cache nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u polw -a 'policyd-weight (cache)'" - hostgroups: heavy-postfix, alioth + hostgroups: heavy-postfix depends: process - weightd - master - name: process - weightd - child nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:50 -c 1: -u polw -a 'policyd-weight (child)'" - hostgroups: heavy-postfix, alioth + hostgroups: heavy-postfix depends: process - weightd - master ### - name: unwanted process - policyd-weight nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C policyd-weight" hostgroups: computers - excludehostgroups: heavy-postfix, alioth + excludehostgroups: heavy-postfix # }}} # {{{ postfix ### - - - name: process - postfix - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C master -a '/usr/lib/postfix/master'" - hostgroups: postfix-hosts - excludehostgroups: stretch - name: process - postfix - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C master -a '/usr/lib/postfix/sbin/master'" hostgroups: postfix-hosts - excludehostgroups: jessie - - - name: process - postfix - qmgr - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C qmgr -a 'qmgr -l -t fifo -u'" - hostgroups: postfix-hosts - depends: process - postfix - master - excludehostgroups: stretch - name: process - postfix - qmgr nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C qmgr -a 'qmgr -l -t unix -u'" hostgroups: postfix-hosts depends: process - postfix - master - excludehostgroups: jessie - - - name: process - postfix - pickup - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C pickup -a 'pickup -l -t fifo -u -c'" - hostgroups: postfix-hosts - depends: process - postfix - master - excludehostgroups: stretch - name: process - postfix - pickup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C pickup -a 'pickup -l -t unix -u -c'" hostgroups: postfix-hosts depends: process - postfix - master - excludehostgroups: jessie - name: process - postfix - anvil @@ -2494,7 +2307,7 @@ services: name: network service - http check: check_http hostgroups: apache2-hosts - excludehosts: klecker + excludehosts: klecker, casulana depends: process - apache2 - master - name: network service - http @@ -2518,6 +2331,12 @@ services: excludehostgroups: broken_https_default_vhost depends: "process - apache2 - master" check_interval: 120 + - + name: network service - https + check: check_https + hostgroups: https-service + excludehostgroups: broken_https_default_vhost + check_interval: 120 - name: network service - https check: dsa_check_https_want_auth @@ -2533,53 +2352,69 @@ services: - name: network service - https cert check: dsa_check_cert!443 - hostgroups: apache-https + hostgroups: apache-https, https-service, haproxy-https-host depends: network service - https check_interval: 60 - name: unwanted network service - https check: dsa_check_port_closed!443 hostgroups: apache2-hosts - excludehostgroups: apache-https + excludehostgroups: apache-https, haproxy-https-host check_interval: 60 - # }}} - # {{{ FTP + + ### - - name: network service - ftp - check: check_ftp - hostgroups: uploadqueue, security_mirror - excludehosts: klecker, mirror-isc, mirror-umn + name: process - haproxy - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -a '/usr/sbin/haproxy-systemd-wrapper'" + hostgroups: haproxy-hosts - - name: network service - ftp - check: check_ftp - hosts: klecker-ftp + name: process - haproxy - worker + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1:15 -u haproxy -a '/usr/sbin/haproxy '" + hostgroups: haproxy-hosts + depends: process - haproxy - master - - name: network service - ftp - check: check_ftp - hosts: mirror-umn2 + name: network service - https + check: check_https + hostgroups: haproxy-https-host + depends: "process - haproxy - master" + check_interval: 120 + + - + name: unwanted process - haproxy + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C haproxy" + hostgroups: computers + excludehostgroups: haproxy-hosts + + ### + - + name: process - varnish + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1:15 -u vcache -a '/usr/sbin/varnishd -j unix,user=vcache -F -a '" + hostgroups: varnish-hosts + excludehostgroups: jessie + - + name: unwanted process - varnish + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C varnishd" + hostgroups: computers + excludehostgroups: varnish-hosts + + + # }}} + # {{{ FTP - name: network service - ftp check: check_ftp - hosts: mirror-isc2 + hostgroups: uploadqueue # }}} # {{{ postgres - name: unwanted process - postgresql nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres" hostgroups: computers - excludehostgroups: postgres91-hosts, postgres94-hosts, postgres96-hosts + excludehostgroups: postgres96-hosts - name: unwanted process - postgresql 9.0 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres -a '9.0/bin/postgres'" hostgroups: computers - - - name: process - postgresql91 - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.1/bin/postgres'" - hostgroups: postgres91-hosts - - - name: process - postgresql94 - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.4/bin/postgres'" - hostgroups: postgres94-hosts - name: process - postgresql96 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.6/bin/postgres'" @@ -2593,29 +2428,23 @@ services: - name: process - buildd servicegroups: buildd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" - hosts: fano, finzi, fils, fayrfax + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" + hostgroups: buildd contact_groups: buildd - name: process - buildd servicegroups: buildd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" - hostgroups: buildd - excludehosts: fano, finzi, fils, fayrfax + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C python3 -a 'buildd.py'" + hostgroups: pybuildd contact_groups: buildd - name: processes - zombie schroot nrpe: "(/usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0 > /dev/null || /usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0) && /usr/lib/nagios/plugins/check_procs -a schroot -s ZNs -c 0" - hostgroups: buildd + hostgroups: buildd, pybuildd contact_groups: +buildd check_interval: 5 max_check_attempts: 24 retry_interval: 5 - - - name: processes - lvcreate - nrpe: "/usr/lib/nagios/plugins/check_procs -m 'ELAPSED' -c 500 -C lvcreate -u root -a 'lvcreate'" - hostgroups: buildd - contact_groups: +buildd # }}} # {{{ NFS Stuff - @@ -2868,6 +2697,16 @@ services: check: "dsa_check_staticsync!miniconf10.debconf.org" hosts: global servicegroups: mirror + - + name: mirror static sync - wiki + check: "dsa_check_staticsync!wiki.debconf.org" + hosts: global + servicegroups: mirror + - + name: mirror static sync - www + check: "dsa_check_staticsync!www.debconf.org" + hosts: global + servicegroups: mirror # }}} # {{{ DNS - @@ -2901,10 +2740,6 @@ services: name: DNS SOA sync - 144-28.118.59.86.in-addr.arpa check: "dsa_check_soas_add!denis.debian.org!144-28.118.59.86.in-addr.arpa" hosts: global - - - name: DNS SOA sync - alioth.debian.org - check: "dsa_check_soas_add!denis.debian.org!alioth.debian.org" - hosts: global - name: DNS SOA sync - debconf.net check: "dsa_check_soas_add!denis.debian.org!debconf.net" @@ -2948,25 +2783,6 @@ services: runfrom: denis # }}} # {{{ storage - - - name: ping alive check - remotecheck: "/usr/lib/nagios/plugins/check_ping -H $HOSTADDRESS$ -w 50,10% -c 200,30%" - runfrom: ubc-bl8 - hosts: giustini - check_interval: 5 - max_check_attempts: 4 - retry_interval: 1 - - - name: Overall Unit Status - remotecheck: "/usr/lib/nagios/plugins/check_snmp -H $HOSTADDRESS$ -C public -P 2c -o connUnitStatus -n -c 3 -w 3" - runfrom: ubc-bl8 - hosts: giustini - - - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=11298 $HOSTADDRESS$ public" - runfrom: ubc-bl8 - hosts: giustini - ### - name: process - multipathd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:15 -c 1: -u root -C multipathd -a '/sbin/multipathd'" @@ -3030,9 +2846,8 @@ services: # {{{ misc - name: system - all services running - nrpe: "/usr/bin/sudo /bin/systemctl is-system-running" - hostgroups: jessie, stretch - excludehostgroups: freebsd + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-systemd-services" + hostgroups: computers ### - name: process - slapd @@ -3051,31 +2866,10 @@ services: hosts: draghi depends: process - xinetd ### - - - name: network service - rsync - check: check_tcp!873 - hostgroups: rsyncd-systemd-hosts - name: network service - rsync check: check_tcp!873 hostgroups: rsyncd-hosts - depends: process - xinetd - - - name: network service - rsync - check: check_tcp!873 - hosts: milanollo2 - - - name: network service - rsync - check: check_tcp!873 - hosts: mirror-isc2, mirror-isc-syncproxy - - - name: network service - rsync - check: check_tcp!873 - hosts: mirror-umn2, mirror-umn3 - - - name: network service - rsync - check: check_tcp!873 - hosts: mirror-anu2, mirror-anu3 ### - name: process - icinga @@ -3103,6 +2897,11 @@ services: check: dsa_check_cert!5061 check_interval: 60 hosts: vogler + - + name: freeradius process + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u freerad -C freeradius -a '/usr/sbin/freeradius -xx'" + check_interval: 60 + hosts: vogler #### - name: puppetmaster cert @@ -3115,10 +2914,42 @@ services: name: puppet - agent check nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/puppet-agent" hostgroups: computers - excludehosts: moszumanska check_interval: 60 retry_interval: 15 + #### + - + name: ping peer on mgmt network + nrpe: "/usr/lib/nagios/plugins/check_ping -H 172.29.184.12 -w 50,10% -c 200,30%" + hosts: conova-node01 + check_interval: 5 + max_check_attempts: 4 + retry_interval: 1 + - + name: ping peer on mgmt network + nrpe: "/usr/lib/nagios/plugins/check_ping -H 172.29.184.11 -w 50,10% -c 200,30%" + hosts: conova-node02 + check_interval: 5 + max_check_attempts: 4 + retry_interval: 1 + + - + name: ping peer on mgmt network + nrpe: "/usr/lib/nagios/plugins/check_ping -H 172.29.182.14 -w 50,10% -c 200,30%" + hosts: manda-node03 + check_interval: 5 + max_check_attempts: 4 + retry_interval: 1 + - + name: ping peer on mgmt network + nrpe: "/usr/lib/nagios/plugins/check_ping -H 172.29.182.13 -w 50,10% -c 200,30%" + hosts: manda-node04 + check_interval: 5 + max_check_attempts: 4 + retry_interval: 1 + # }}} # }}} # }}} # vim: set ts=2 sw=2 et ai si fdm=marker: + +