X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=cf8594ce7261ac8aa44d7a12df977cd95d5267a0;hb=40389fe7ad8028bedd698e6d804e9474e1156594;hp=4ca3344dbb1f26d5a6fad25dad6745f95fd515fc;hpb=4dd94be5ec29b8e4eab807fd6de7552a764cfbf7;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 4ca3344..cf8594c 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -212,7 +212,7 @@ servers: pettersson: address: 130.239.18.123 parents: gw-accumu - hostgroups: computers, hasbootfs, aacraid, nfs-client, acpid-hosts, service, apache2-hosts, wheezy, autofs, sw-raid + hostgroups: computers, hasbootfs, aacraid, nfs-client, acpid-hosts, service, apache2-hosts, jessie, autofs, sw-raid praetorius: address: 130.239.18.121 parents: gw-accumu @@ -222,7 +222,7 @@ servers: mips-aql-01: address: 141.170.6.149 parents: gw-aql - hostgroups: computers, buildd, wheezy, nfs-client + hostgroups: computers, buildd, jessie, nfs-client mips-aql-02: address: 141.170.6.150 parents: gw-aql @@ -248,15 +248,19 @@ servers: arnold: address: 217.140.96.57 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie, broken_mq arm-arm-01: address: 217.140.96.58 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie, broken_mq arm-arm-02: address: 217.140.96.59 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie, broken_mq + arm-arm-03: + address: 217.140.96.60 + parents: gw-arm + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie, broken_mq harris: address: 217.140.96.66 parents: gw-arm @@ -268,7 +272,7 @@ servers: hoiby: address: 217.140.96.71 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd, broken_mq + hostgroups: computers, hasbootfs, hassrvfs, armhf, jessie, buildd, broken_mq ia64-arm-01: address: 217.140.96.61 parents: gw-arm @@ -403,7 +407,7 @@ servers: dinis: address: 5.153.231.19 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, wheezy + hostgroups: computers, general, kvmdomains, wheezy, hassrvfs donizetti: address: 5.153.231.20 parents: ganeti-bytemark @@ -433,7 +437,7 @@ servers: barriere: address: 5.153.231.27 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, porterbox + hostgroups: computers, service, kvmdomains, jessie, hassrvfs, porterbox quantz: address: 5.153.231.28 parents: ganeti-bytemark @@ -461,20 +465,24 @@ servers: lindsay: address: 5.153.231.36 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie + hostgroups: computers, service, kvmdomains, jessie, autofs, nfs-client fede: address: 5.153.231.37 - hostgroups: computers, service, kvmdomains, wheezy, hassrvfs + hostgroups: computers, service, kvmdomains, jessie, hassrvfs sor: address: 5.153.231.38 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, autofs, nfs-client + jerea: + address: 5.153.231.39 + parents: ganeti-bytemark + hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts # }}} # {{{ gw-c3sl santoro: address: 200.17.202.197 parents: gw-c3sl - hostgroups: computers, service, apache2-hosts, rsyncd-hosts, xinetd-hosts, hassrvfs, wheezy, high-RTT, security_mirror, no-bacula, apache-https + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, xinetd-hosts, hassrvfs, jessie, high-RTT, security_mirror, no-bacula, apache-https contacts: faw # }}} # {{{ gw-carnet @@ -504,10 +512,6 @@ servers: hostgroups: computers, buildd, hassrvfs, sw-raid, wheezy, sparc # }}} # {{{ gw-csail - senfl: - address: 128.31.0.51 - parents: gw-csail - hostgroups: computers, service, dl360, acpid-hosts, hassrvfs, apache2-hosts, rsyncd-hosts, xinetd-hosts, squeeze, apache-https steffani: address: 128.31.0.36 parents: gw-csail @@ -542,6 +546,10 @@ servers: address: 128.31.0.50 parents: ganeti-csail hostgroups: computers, buildd, hassrvfs, kvmdomains, wheezy + httpredir-csail-01: + address: 128.31.0.66 + parents: ganeti-csail + hostgroups: computers, service, kvmdomains, jessie, apache2-hosts # }}} # {{{ gw-dgi storace: @@ -583,7 +591,11 @@ servers: cgi-grnet-01: address: 194.177.211.202 parents: gw-grnet - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts + hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https + x86-grnet-01: + address: 194.177.211.203 + parents: ganeti-grnet + hostgroups: computers, buildd, hassrvfs, kvmdomains, jessie # }}} # {{{ gw-isc schein: @@ -694,7 +706,7 @@ servers: geo1: address: 82.195.75.105 parents: ganeti3 - hostgroups: computers, service, bind9-hosts, kvmdomains, wheezy + hostgroups: computers, service, bind9-hosts, kvmdomains, jessie handel: address: 82.195.75.104 parents: ganeti3 @@ -706,7 +718,7 @@ servers: stockhausen: address: 82.195.75.108 parents: ganeti3 - hostgroups: computers, service, kvmdomains, jessie, acpid-hosts, jetty-hosts + hostgroups: computers, service, kvmdomains, jessie, acpid-hosts ganeti3: address: 82.195.75.111 parents: gw-man-da @@ -744,7 +756,7 @@ servers: zani: address: 148.100.88.22 parents: gw-marist - hostgroups: computers, buildd, hassrvfs, wheezy, incomingmailrelayed, ping-suckers + hostgroups: computers, buildd, hassrvfs, jessie, incomingmailrelayed # }}} # {{{ gw-osuosl busoni: @@ -758,7 +770,7 @@ servers: buxtehude: address: 140.211.166.26 parents: byrd - hostgroups: computers, service, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres91-hosts, wheezy, hasvarlogfs, apache-https + hostgroups: computers, service, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres91-hosts, wheezy, hasvarlogfs, apache-https, spamd # malo TODO mayer: address: 140.211.166.78 @@ -779,7 +791,7 @@ servers: partch: address: 140.211.15.152 parents: gw-osuosl - hostgroups: computers, wheezy, hassrvfs, porterbox, sw-raid + hostgroups: computers, jessie, hassrvfs, porterbox, sw-raid rietz: address: 140.211.166.43 parents: gw-osuosl @@ -903,7 +915,7 @@ servers: # MSA 2000 (2012i) giustini: address: 192.168.2.6 - parents: dijkstra + parents: sw-ubcece-kais hostgroups: notacomputer # unless we implement runfrom for host alive checks pingable: false @@ -930,14 +942,6 @@ servers: address: 206.12.19.15 parents: sw-ubcece-kais hostgroups: computers, buildd, wheezy - rossini: - address: 206.12.19.19 - parents: sw-ubcece-kais - hostgroups: computers, dl585, acpid-hosts, service, wheezy - salieri: - address: 206.12.19.20 - parents: sw-ubcece-kais - hostgroups: computers, dl585, acpid-hosts, service, wheezy traetta: address: 206.12.19.21 parents: sw-ubcece-kais @@ -948,11 +952,11 @@ servers: # hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa lotti: address: 206.12.19.121 - parents: sw-ubcece-kais + parents: ganeti2 hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hassrvfs nono: address: 206.12.19.123 - parents: traetta + parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, heavy-exim, xinetd-hosts, apache2-hosts, apache-https, broken_https_default_vhost reger: address: 206.12.19.124 @@ -964,7 +968,7 @@ servers: hostgroups: computers, service, kvmdomains, wheezy, postgres91-hosts, xinetd-hosts glinka: address: 206.12.19.126 - parents: traetta + parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-client, autofs, xinetd-hosts tye: address: 206.12.19.129 @@ -972,7 +976,7 @@ servers: hostgroups: computers, service, kvmdomains, wheezy, heavy-exim, apache2-hosts, nfs-client, autofs, hassrvfs elgar: address: 206.12.19.130 - parents: salieri + parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy gombert: address: 206.12.19.132 @@ -980,7 +984,7 @@ servers: hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts jenkins: address: 206.12.19.133 - parents: salieri + parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy blavet: address: 206.12.19.134 @@ -988,16 +992,12 @@ servers: hostgroups: computers, service, kvmdomains, wheezy, xinetd-hosts, nfs-client, autofs diabelli: address: 206.12.19.136 - parents: traetta + parents: ganeti2 hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, apache2-hosts, apache-https, broken_https_default_vhost bizet: address: 206.12.19.137 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, no-bacula - lilburn: - address: 206.12.19.138 - parents: ganeti2 - hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, nfs-client, autofs popov: address: 206.12.19.119 parents: ganeti2 @@ -1043,11 +1043,15 @@ servers: powerpc-unicamp-01: address: 143.106.167.149 parents: prokofiev - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie ppc64el-unicamp-01: address: 143.106.167.135 parents: prokofiev hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie + plummer: + address: 143.106.167.146 + parents: prokofiev + hostgroups: computers, porterbox, hassrvfs, jessie # }}} # {{{ gw-utwente klecker: @@ -1071,7 +1075,7 @@ servers: henze: address: 144.32.168.74 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd + hostgroups: computers, hasbootfs, hassrvfs, armhf, jessie, buildd hasse: address: 144.32.168.75 parents: gw-ynic @@ -1191,8 +1195,6 @@ hostgroups: alias: Hosts with LSI Logic MegaRAID private: 1 - squeeze: - alias: Hosts running squeeze wheezy: alias: Hosts running wheezy jessie: @@ -1222,9 +1224,6 @@ hostgroups: apache2-hosts: alias: hosts running apache2 private: 1 - jetty-hosts: - alias: hosts running jetty - private: 1 bind9-hosts: alias: hosts running bind9 private: 1 @@ -1316,9 +1315,6 @@ hostgroups: high-RTT: alias: machines with high round trip times private: 1 - ping-suckers: - alias: machines that just suck at icmp - private: 1 alioth: alias: machines that just are just awkward private: 1 @@ -1368,7 +1364,7 @@ services: name: PING check: "check_ping!350.0,20%!600.0,40%" hostgroups: pingable - excludehostgroups: layer3-infrastructure, high-RTT, ping-suckers + excludehostgroups: layer3-infrastructure, high-RTT normal_check_interval: 5 max_check_attempts: 4 retry_check_interval: 1 @@ -1379,13 +1375,6 @@ services: normal_check_interval: 5 max_check_attempts: 4 retry_check_interval: 1 - - - name: PING - check: "check_ping!600.0,90%!900.0,95%" - hostgroups: ping-suckers - normal_check_interval: 5 - max_check_attempts: 4 - retry_check_interval: 1 - name: PING check: "check_ping!2000.0,60%!3000.0,80%" @@ -1673,7 +1662,8 @@ services: - name: upgraded libraries servicegroups: security - nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs" + nrpe: "sudo /usr/local/sbin/dsa-check-libs" + #nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-libs" hostgroups: computers excludehostgroups: freebsd normal_check_interval: 60 @@ -1832,21 +1822,17 @@ services: name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C ud-replicated -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: computers - excludehostgroups: squeeze, freebsd, alioth + excludehostgroups: freebsd, alioth - name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C python2.7 -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: freebsd ### - - - name: process - monit - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/sbin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: squeeze - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" hostgroups: computers - excludehostgroups: squeeze, alioth, jessie + excludehostgroups: alioth, jessie ### - name: MQ connection on rainier @@ -1909,7 +1895,7 @@ services: ### - name: process - xinetd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xinetd -a '/usr/sbin/xinetd -pidfile /var/run/xinetd.pid -stayalive'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xinetd -a '/usr/sbin/xinetd '" hostgroups: xinetd-hosts - name: unwanted process - xinetd @@ -1920,8 +1906,14 @@ services: - name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" - hostgroups: squeeze, wheezy, jessie + hostgroups: wheezy, jessie + excludehostgroups: freebsd, alioth + - + name: process - stunnel4 - puppet-ekeyd is crazy + nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-stunnel-sanity" + hostgroups: computers excludehostgroups: freebsd, alioth + excludehosts: czerny, grnet-node01, storace # }}} # {{{ anti-services - @@ -1961,6 +1953,14 @@ services: name: "host SSL cert" nrpe: "if [ -e /etc/ssl/certs/thishost.pem ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/certs/thishost.pem; else echo 'No thishost.pem on this host.'; fi" hostgroups: computers + - + name: "host SSL cert - debian server" + nrpe: "if [ -e /etc/ssl/debian/certs/thishost-server.crt ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/debian/certs/thishost-server.crt; else echo 'No thishost-server.crt on this host.'; fi" + hostgroups: computers + - + name: "host SSL cert - debian client" + nrpe: "if [ -e /etc/ssl/debian/certs/thishost.crt ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/debian/certs/thishost.crt; else echo 'No thishost.crt on this host.'; fi" + hostgroups: computers # }}} # {{{ HW health/raid - @@ -2024,13 +2024,13 @@ services: # nrpe: "/usr/lib/nagios/plugins/dsa-check-edac" # normal_check_interval: 120 #hostgroups: computers - #excludehosts: villa, lobos, senfl, schein + #excludehosts: villa, lobos, schein - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460, dl585, bm-bl - excludehosts: villa, lobos, senfl, schein, storace + excludehosts: villa, lobos, schein, storace - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --ps-no-redundant" @@ -2045,7 +2045,7 @@ services: name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --fan-no-redundant" normal_check_interval: 120 - hosts: senfl, schein + hosts: schein - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --fan-ignore-not-present" @@ -2150,21 +2150,12 @@ services: hostgroups: spamd depends: process - spamd - master # - - - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u debbugs -C spamd -a '/usr/sbin/spamd -d '" - hosts: buxtehude - - - name: process - spamd - child - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u debbugs -C spamd -a 'spamd child'" - hosts: buxtehude - # - name: unwanted process - spamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers excludehostgroups: spamd - excludehosts: bendel, busoni, buxtehude + excludehosts: bendel, busoni - name: unwanted process - greylistd @@ -2686,16 +2677,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:30 -c 1: -u nagios -C icinga -a '/usr/sbin/icinga -d /etc/icinga/icinga.cfg'" hosts: tchaikovsky ### - - - name: process - jetty - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -a 'jsvc.exec'" - hostgroups: jetty-hosts - - - name: process - jetty - worker - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1:100 -u jetty -a 'jsvc.exec -user jetty'" - hostgroups: jetty-hosts - depends: process - jetty - master - ### - name: process - debianqueued nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u dak-unpriv -C debianqueued"