X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=1dbbed880b0712734456a4f27e4af9074b1a118c;hb=6142049d989c16a0bdecc04180e7b512daa7ae19;hp=d3811141d43aabc067add34c2f254979ab6f9358;hpb=599730ff7bf45786acaf1373500f3ab7504ea599;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index d381114..1dbbed8 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -31,9 +31,9 @@ servers: parents: gw-ubcece hostgroups: layer3-infrastructure contacts: joerg - gw-1und1-sec: - address: 212.227.126.33 - parents: gw-ubcece +# gw-1und1-sec: +# address: 212.227.126.33 +# parents: gw-ubcece hostgroups: layer3-infrastructure gw-accumu: address: 130.239.18.97 @@ -177,7 +177,8 @@ servers: # {{{ gw-1und1-sec schumann: address: 212.227.126.54 - parents: gw-1und1-sec + parents: gw-ubcece + #parents: gw-1und1-sec hostgroups: computers, acpid-hosts, service, squeeze chopin: address: 195.20.242.124 @@ -190,10 +191,11 @@ servers: soler: address: 195.20.242.126 parents: schumann - hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, squeeze + hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, squeeze, apache-https wieck: address: 195.20.242.89 - parents: gw-1und1-sec + parents: gw-ubcece + #parents: gw-1und1-sec hostgroups: computers, service, apache2-hosts, rsyncd-hosts, acpid-hosts, xinetd-hosts, squeeze, security_mirror, hasvarlogfs # }}} # {{{ gw-accumu @@ -210,35 +212,31 @@ servers: abel: address: 217.140.96.56 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, porterbox, squeeze + hostgroups: computers, hasbootfs, hassrvfs, porterbox, squeeze, deadslow alain: address: 217.140.96.58 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow alwyn: address: 217.140.96.59 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow antheil: address: 217.140.96.60 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow arne: address: 217.140.96.61 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, squeeze + hostgroups: computers, hasbootfs, hassrvfs, squeeze, deadslow arnold: address: 217.140.96.57 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow harris: address: 217.140.96.66 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, porterbox - hartmann: - address: 217.140.96.67 - parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd + hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, porterbox, deadslow hasse: address: 217.140.96.68 parents: gw-arm @@ -319,7 +317,7 @@ servers: argento: address: 93.94.130.160 parents: gw-dgi - hostgroups: computers, buildd, sw-raid, hassrvfs, squeeze + hostgroups: computers, sw-raid, hassrvfs, wheezy contacts: bzed widor: address: 93.94.130.161 @@ -340,11 +338,6 @@ servers: address: 192.25.206.62 parents: gw-ftcollins hostgroups: computers, buildd, hassrvfs, sw-raid, acpid-hosts, squeeze - penalosa: - address: 192.25.206.68 - parents: gw-ftcollins - hostgroups: computers, buildd, hasbootfs, lenny - contacts: dannf samosa: address: 192.25.206.57 parents: gw-ftcollins @@ -378,11 +371,6 @@ servers: parents: rautavaara hostgroups: computers, freebsd, squeeze, buildd, hassrvfs #, mptraid - field: - address: 194.177.211.210 - parents: rautavaara - hostgroups: computers, freebsd, squeeze, buildd, hassrvfs - #, mptraid grieg: address: 194.177.211.200 parents: gw-grnet @@ -403,10 +391,6 @@ servers: address: 194.177.211.199 parents: gw-grnet hostgroups: computers, acpid-hosts, megaraid, service, squeeze - scelsi: - address: 194.177.211.208 - parents: gw-grnet - hostgroups: computers, acpid-hosts, mptraid, service, squeeze vitry: address: 194.177.211.206 parents: gw-grnet @@ -503,6 +487,15 @@ servers: address: 82.195.75.107 parents: unger hostgroups: computers, service, hasbootfs, apache2-hosts, rsyncd-hosts, kvmdomains, xinetd-hosts, squeeze + ganeti3: + address: 82.195.75.111 + parents: gw-man-da + hostgroups: notacomputer + wilder: + address: 82.195.75.112 + parents: ganeti3 + hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, wheezy, acpid-hosts + # lamb: # address: 82.195.75.101 # parents: unger @@ -518,7 +511,7 @@ servers: busoni: address: 140.211.15.34 parents: gw-osuosl - hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres84-hosts, squeeze, hasvarlogfs + hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, heavy-exim, squeeze, hasvarlogfs byrd: address: 140.211.166.20 parents: gw-osuosl @@ -608,7 +601,7 @@ servers: lindberg: address: 86.59.118.149 parents: gw-sil - hostgroups: computers, acpid-hosts, service, apache2-hosts, squeeze, megactl + hostgroups: computers, acpid-hosts, service, squeeze, megactl # which raid? merikanto: address: 86.59.118.147 @@ -753,7 +746,7 @@ servers: lucatelli: address: 206.12.19.15 parents: sw-ubcece-kais - hostgroups: computers, buildd, squeeze + hostgroups: computers, buildd, squeeze, deadslow rossini: address: 206.12.19.19 parents: sw-ubcece-kais @@ -833,7 +826,7 @@ servers: bizet: address: 206.12.19.137 parents: traetta - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs, rsyncd-hosts, heavy-exim, xinetd-hosts, apache2-hosts, uploadqueue + hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hassrvfs lilburn: address: 206.12.19.138 parents: dijkstra @@ -857,7 +850,16 @@ servers: menotti: address: 206.12.19.143 parents: ganeti2 - hostgroups: computers, service, kvmdomains, squeeze, hassrvfs, apache2-hosts, apache-https + hostgroups: computers, service, kvmdomains, squeeze, hassrvfs, apache2-hosts + #, apache-https + coincy: + address: 206.12.19.144 + parents: ganeti2 + hostgroups: computers, service, kvmdomains, squeeze, hassrvfs + stanley: + address: 206.12.19.145 + parents: ganeti2 + hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts # }}} # {{{ gw-ugent ancina: @@ -873,22 +875,6 @@ servers: hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, squeeze, security_mirror # }}} # {{{ gw-utwente - kassia: - address: 130.89.149.224 - parents: gw-utwente - hostgroups: computers, service, dl360, acpid-hosts, incomingmailrelayed, xinetd-hosts, squeeze - kassia-sec: - address: 130.89.149.225 - parents: kassia - hostgroups: secondary-IPs - kassia-ftp: - address: 130.89.149.226 - parents: kassia - hostgroups: secondary-IPs - kassia-volatile: - address: 130.89.149.227 - parents: kassia - hostgroups: secondary-IPs klecker: address: 130.89.148.10 parents: gw-utwente @@ -1023,9 +1009,6 @@ hostgroups: wheezy: alias: Hosts running wheezy - lenny: - alias: Hosts running lenny - kvmdomains: alias: Hosts that are KVM domains private: 1 @@ -1241,12 +1224,12 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /" hostgroups: computers - excludehosts: kassia, spohr + excludehosts: spohr - name: disk usage on / servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 90 93 /" - hosts: kassia, spohr + hosts: spohr - name: disk usage on /boot servicegroups: diskspace @@ -1267,12 +1250,12 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv" hostgroups: hassrvfs - excludehosts: ries, beach + excludehosts: stabile, beach - name: disk usage on /srv servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv" - hosts: ries, beach + hosts: stabile, beach - name: disk usage on /tmp servicegroups: diskspace @@ -1297,7 +1280,7 @@ services: name: disk usage on /var/lib/postgresql servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/lib/postgresql" - hosts: samosa, stabile, sibelius, busoni, buxtehude + hosts: stabile, sibelius, busoni, buxtehude - name: disk usage on /var/log servicegroups: diskspace @@ -1564,7 +1547,7 @@ services: - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" - hostgroups: armhf + hostgroups: wheezy - name: network service - munin-node check: check_tcp!4949 @@ -1583,7 +1566,7 @@ services: hostgroups: computers depends: process - ntpd excludehosts: ancina - excludehostgroups: ntpsuckers + excludehostgroups: ntpsuckers, deadslow servicegroups: time # - @@ -1601,7 +1584,7 @@ services: ### - name: process - cron - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C cron -a /usr/sbin/cron" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C cron -a /usr/sbin/cron" hostgroups: computers ### @@ -1676,19 +1659,20 @@ services: name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" hostgroups: computers - excludehostgroups: heavy-exim, heavy-postfix + excludehostgroups: heavy-exim, heavy-postfix, deadslow excludehosts: wagner - name: unwanted process - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers - excludehostgroups: heavy-exim, heavy-postfix + excludehostgroups: heavy-exim, heavy-postfix, deadslow excludehosts: wagner - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hostgroups: spamd excludehosts: powell, wagner + excludehostgroups: deadslow - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 20 --min-spare=5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" @@ -1717,7 +1701,7 @@ services: name: unwanted process - spamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers - excludehostgroups: spamd + excludehostgroups: spamd, deadslow excludehosts: bendel, busoni, wagner, buxtehude ### @@ -1730,6 +1714,7 @@ services: name: unwanted process - greylistd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C greylistd" hostgroups: computers + excludehostgroups: deadslow ### - @@ -1745,7 +1730,7 @@ services: name: unwanted process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C postgrey" hostgroups: computers - excludehostgroups: heavy-postfix, heavy-exim + excludehostgroups: heavy-postfix, heavy-exim, deadslow ### - name: process - amavis - master @@ -1761,7 +1746,7 @@ services: name: unwanted process - amavis nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C amavisd-new" hostgroups: computers - excludehostgroups: amavis-hosts + excludehostgroups: amavis-hosts, deadslow ### - name: process - weightd - master @@ -1782,7 +1767,7 @@ services: name: unwanted process - policyd-weight nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C policyd-weight" hostgroups: computers - excludehostgroups: heavy-postfix + excludehostgroups: heavy-postfix, deadslow @@ -1881,6 +1866,11 @@ services: hostgroups: computers excludehosts: vasks, wagner excludehostgroups: freebsd + - + name: system - filesystem check + nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" + excludehosts: wagner, vasks + hostgroups: computers ### - name: local resolver @@ -1904,6 +1894,7 @@ services: name: unwanted process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C irqbalance" hostgroups: computers + excludehostgroups: deadslow #### ### @@ -1919,25 +1910,28 @@ services: name: unwanted process - gkrellmd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C gkrellmd" hostgroups: computers + excludehostgroups: deadslow - name: unwanted process - portmap nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C portmap" hostgroups: computers - excludehostgroups: nfs-client, nfs-server + excludehostgroups: nfs-client, nfs-server, deadslow - name: unwanted process - rpc.statd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C rpc.statd" hostgroups: computers - excludehostgroups: nfs-client, nfs-server + excludehostgroups: nfs-client, nfs-server, deadslow - name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers excludehosts: grieg, abel, alwyn, vasks + excludehostgroups: deadslow - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" hostgroups: computers + excludehostgroups: deadslow #### - @@ -1978,7 +1972,7 @@ services: - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: armhf + hostgroups: wheezy - name: RAID - arrayprobe servicegroups: raid @@ -1996,7 +1990,13 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460 - excludehosts: kassia + excludehosts: schein + - + name: HW - hpacucli status + servicegroups: raid + nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-battery" + normal_check_interval: 120 + hosts: schein - name: HW - hpacucli enclosure status servicegroups: raid @@ -2009,12 +2009,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --ignore-transfer-speed=1I:1:1 --ignore-transfer-speed=1I:1:2" normal_check_interval: 120 hostgroups: dl585 - - - name: HW - hpacucli status - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --ignore-transfer-speed=1I:1:2 --ignore-transfer-speed=1I:1:3 --ignore-transfer-speed=1I:1:4 --ignore-transfer-speed=2I:1:5 --ignore-transfer-speed=2I:1:6" - normal_check_interval: 120 - hosts: kassia ### - name: HW - hpasmcli status @@ -2138,7 +2132,7 @@ services: name: unwanted process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C xinetd" hostgroups: computers - excludehostgroups: xinetd-hosts + excludehostgroups: xinetd-hosts, deadslow ### - name: network service - finger @@ -2162,22 +2156,12 @@ services: check: check_tcp!873 hosts: merikanto2 depends: merikanto:process - xinetd - #- - # name: network service - rsync - # check: check_tcp!873 - # hosts: kassia-sec - # depends: kassia:process - xinetd -# - -# name: network service - rsync -# check: check_tcp!873 -# hosts: merikanto2 -# depends: merikanto:process - xinetd ### - - name: process - nagios3 + name: process - icinga # there is always one extra process per check currently running.. - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:30 -c 1: -u nagios -C nagios3 -a '/usr/sbin/nagios3 -d /etc/nagios3/nagios.cfg'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:30 -c 1: -u nagios -C icinga -a '/usr/sbin/icinga -d /etc/icinga/icinga.cfg'" hosts: tchaikovsky ### @@ -2194,7 +2178,7 @@ services: name: unwanted process - apache2 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C apache2" hostgroups: computers - excludehostgroups: apache2-hosts + excludehostgroups: apache2-hosts, deadslow - name: network service - http @@ -2239,7 +2223,7 @@ services: name: unwanted network service - https check: dsa_check_port_closed!443 hostgroups: apache2-hosts - excludehostgroups: apache-https + excludehostgroups: apache-https, deadslow # ravel does ssh on port 443 excludehosts: ravel normal_check_interval: 60 @@ -2258,7 +2242,7 @@ services: name: unwanted process - named nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C named" hostgroups: computers - excludehostgroups: bind9-hosts + excludehostgroups: bind9-hosts, deadslow #### - @@ -2303,7 +2287,7 @@ services: name: unwanted process - postresql nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres" hostgroups: computers - excludehostgroups: postgres90-hosts, postgres84-hosts, postgres91-hosts + excludehostgroups: postgres90-hosts, postgres84-hosts, postgres91-hosts, deadslow - name: process - postresql91 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:4 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.1/bin/postgres'" @@ -2320,15 +2304,6 @@ services: name: postgresql backups nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg" hosts: beethoven - #### - - - name: process - stunnel4 - postgres-udd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/postgres-udd-server.conf'" - hosts: samosa - - - name: udd stunnel - master cert - nrpe: "/usr/lib/nagios/plugins/check_http -H localhost -p 8080 -S -C 14 -t 45" - hosts: samosa #### #### - @@ -2389,14 +2364,14 @@ services: name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" - hosts: fano, fasch, field, finzi, fils + hosts: fano, fasch, finzi, fils contact_groups: buildd - name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" hostgroups: buildd - excludehosts: fano, fasch, field, finzi, fils + excludehosts: fano, fasch, finzi, fils contact_groups: buildd #### - @@ -2447,7 +2422,7 @@ services: name: unwanted process - automount nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C automount" hostgroups: computers - excludehostgroups: autofs + excludehostgroups: autofs, deadslow ############ MISC OTHER Stuff ############ #####