X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=7a6ce31950e39afd9dcf46dc4fa14b3f92d31e3e;hb=7a3d44e17da3ed689de02cda809e07da55a713b1;hp=4e066f7bc23782060511ed5b22719c486c80f978;hpb=17f0593ebb23dbe123bb29274a7c49b1738e6d66;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 4e066f7..7a6ce31 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -31,9 +31,9 @@ servers: parents: gw-ubcece hostgroups: layer3-infrastructure contacts: joerg - gw-1und1-sec: - address: 212.227.126.33 - parents: gw-ubcece +# gw-1und1-sec: +# address: 212.227.126.33 +# parents: gw-ubcece hostgroups: layer3-infrastructure gw-accumu: address: 130.239.18.97 @@ -177,12 +177,13 @@ servers: # {{{ gw-1und1-sec schumann: address: 212.227.126.54 - parents: gw-1und1-sec + parents: gw-ubcece + #parents: gw-1und1-sec hostgroups: computers, acpid-hosts, service, squeeze chopin: address: 195.20.242.124 parents: schumann - hostgroups: computers, service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-hosts, uploadqueue, kvmdomains, heavy-exim, xinetd-hosts, apache-https, postgres90-hosts, squeeze + hostgroups: computers, service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-hosts, uploadqueue, kvmdomains, heavy-exim, xinetd-hosts, apache-https, postgres91-hosts, squeeze geo3: address: 195.20.242.125 parents: schumann @@ -190,10 +191,11 @@ servers: soler: address: 195.20.242.126 parents: schumann - hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, squeeze + hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, squeeze, apache-https wieck: address: 195.20.242.89 - parents: gw-1und1-sec + parents: gw-ubcece + #parents: gw-1und1-sec hostgroups: computers, service, apache2-hosts, rsyncd-hosts, acpid-hosts, xinetd-hosts, squeeze, security_mirror, hasvarlogfs # }}} # {{{ gw-accumu @@ -210,47 +212,43 @@ servers: abel: address: 217.140.96.56 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, porterbox, squeeze + hostgroups: computers, hasbootfs, hassrvfs, porterbox, squeeze, deadslow alain: address: 217.140.96.58 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow alwyn: address: 217.140.96.59 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow antheil: address: 217.140.96.60 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow arne: address: 217.140.96.61 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, squeeze + hostgroups: computers, hasbootfs, hassrvfs, squeeze, deadslow arnold: address: 217.140.96.57 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze + hostgroups: computers, hasbootfs, hassrvfs, buildd, squeeze, deadslow harris: address: 217.140.96.66 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, porterbox - hartmann: - address: 217.140.96.67 - parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd + hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, porterbox, deadslow hasse: address: 217.140.96.68 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd + hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, deadslow henze: address: 217.140.96.70 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd + hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, deadslow hoiby: address: 217.140.96.71 parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd, deadslow # }}} # {{{ gw-brainfood master: @@ -319,7 +317,7 @@ servers: argento: address: 93.94.130.160 parents: gw-dgi - hostgroups: computers, buildd, sw-raid, hassrvfs, squeeze + hostgroups: computers, sw-raid, hassrvfs, wheezy contacts: bzed widor: address: 93.94.130.161 @@ -340,11 +338,6 @@ servers: address: 192.25.206.62 parents: gw-ftcollins hostgroups: computers, buildd, hassrvfs, sw-raid, acpid-hosts, squeeze - penalosa: - address: 192.25.206.68 - parents: gw-ftcollins - hostgroups: computers, buildd, hasbootfs, lenny - contacts: dannf samosa: address: 192.25.206.57 parents: gw-ftcollins @@ -378,11 +371,6 @@ servers: parents: rautavaara hostgroups: computers, freebsd, squeeze, buildd, hassrvfs #, mptraid - field: - address: 194.177.211.210 - parents: rautavaara - hostgroups: computers, freebsd, squeeze, buildd, hassrvfs - #, mptraid grieg: address: 194.177.211.200 parents: gw-grnet @@ -403,10 +391,6 @@ servers: address: 194.177.211.199 parents: gw-grnet hostgroups: computers, acpid-hosts, megaraid, service, squeeze - scelsi: - address: 194.177.211.208 - parents: gw-grnet - hostgroups: computers, acpid-hosts, mptraid, service, squeeze vitry: address: 194.177.211.206 parents: gw-grnet @@ -518,7 +502,7 @@ servers: busoni: address: 140.211.15.34 parents: gw-osuosl - hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres84-hosts, squeeze, hasvarlogfs + hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, heavy-exim, squeeze, hasvarlogfs byrd: address: 140.211.166.20 parents: gw-osuosl @@ -608,7 +592,7 @@ servers: lindberg: address: 86.59.118.149 parents: gw-sil - hostgroups: computers, acpid-hosts, service, apache2-hosts, squeeze, megactl + hostgroups: computers, acpid-hosts, service, squeeze, megactl # which raid? merikanto: address: 86.59.118.147 @@ -753,7 +737,7 @@ servers: lucatelli: address: 206.12.19.15 parents: sw-ubcece-kais - hostgroups: computers, buildd, squeeze + hostgroups: computers, buildd, squeeze, deadslow rossini: address: 206.12.19.19 parents: sw-ubcece-kais @@ -833,7 +817,7 @@ servers: bizet: address: 206.12.19.137 parents: traetta - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs, rsyncd-hosts, heavy-exim, xinetd-hosts, apache2-hosts, uploadqueue + hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hassrvfs lilburn: address: 206.12.19.138 parents: dijkstra @@ -858,6 +842,14 @@ servers: address: 206.12.19.143 parents: ganeti2 hostgroups: computers, service, kvmdomains, squeeze, hassrvfs, apache2-hosts, apache-https + coincy: + address: 206.12.19.144 + parents: ganeti2 + hostgroups: computers, service, kvmdomains, squeeze, hassrvfs + stanley: + address: 206.12.19.145 + parents: ganeti2 + hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts # }}} # {{{ gw-ugent ancina: @@ -873,22 +865,6 @@ servers: hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, squeeze, security_mirror # }}} # {{{ gw-utwente - kassia: - address: 130.89.149.224 - parents: gw-utwente - hostgroups: computers, service, dl360, acpid-hosts, incomingmailrelayed, xinetd-hosts, squeeze - kassia-sec: - address: 130.89.149.225 - parents: kassia - hostgroups: secondary-IPs - kassia-ftp: - address: 130.89.149.226 - parents: kassia - hostgroups: secondary-IPs - kassia-volatile: - address: 130.89.149.227 - parents: kassia - hostgroups: secondary-IPs klecker: address: 130.89.148.10 parents: gw-utwente @@ -902,15 +878,15 @@ servers: hildegard: address: 144.32.168.74 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow howells: address: 144.32.168.75 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow hummel: address: 144.32.168.76 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow porpora: address: 144.32.168.78 parents: gw-ynic @@ -954,6 +930,8 @@ hostgroups: notacomputer: alias: Systems that are not really systems. Yeah :) private: 1 + deadslow: + alias: Systems too slow to run any real checks freebsd: alias: freebsd private: 1 @@ -1021,9 +999,6 @@ hostgroups: wheezy: alias: Hosts running wheezy - lenny: - alias: Hosts running lenny - kvmdomains: alias: Hosts that are KVM domains private: 1 @@ -1239,12 +1214,12 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /" hostgroups: computers - excludehosts: kassia, spohr + excludehosts: spohr - name: disk usage on / servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 90 93 /" - hosts: kassia, spohr + hosts: spohr - name: disk usage on /boot servicegroups: diskspace @@ -1562,7 +1537,7 @@ services: - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" - hostgroups: armhf + hostgroups: wheezy - name: network service - munin-node check: check_tcp!4949 @@ -1581,7 +1556,7 @@ services: hostgroups: computers depends: process - ntpd excludehosts: ancina - excludehostgroups: ntpsuckers + excludehostgroups: ntpsuckers, deadslow servicegroups: time # - @@ -1674,19 +1649,20 @@ services: name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" hostgroups: computers - excludehostgroups: heavy-exim, heavy-postfix + excludehostgroups: heavy-exim, heavy-postfix, deadslow excludehosts: wagner - name: unwanted process - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers - excludehostgroups: heavy-exim, heavy-postfix + excludehostgroups: heavy-exim, heavy-postfix, deadslow excludehosts: wagner - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hostgroups: spamd excludehosts: powell, wagner + excludehostgroups: deadslow - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 20 --min-spare=5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" @@ -1715,7 +1691,7 @@ services: name: unwanted process - spamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers - excludehostgroups: spamd + excludehostgroups: spamd, deadslow excludehosts: bendel, busoni, wagner, buxtehude ### @@ -1728,6 +1704,7 @@ services: name: unwanted process - greylistd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C greylistd" hostgroups: computers + excludehostgroups: deadslow ### - @@ -1743,7 +1720,7 @@ services: name: unwanted process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C postgrey" hostgroups: computers - excludehostgroups: heavy-postfix, heavy-exim + excludehostgroups: heavy-postfix, heavy-exim, deadslow ### - name: process - amavis - master @@ -1759,7 +1736,7 @@ services: name: unwanted process - amavis nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C amavisd-new" hostgroups: computers - excludehostgroups: amavis-hosts + excludehostgroups: amavis-hosts, deadslow ### - name: process - weightd - master @@ -1780,7 +1757,7 @@ services: name: unwanted process - policyd-weight nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C policyd-weight" hostgroups: computers - excludehostgroups: heavy-postfix + excludehostgroups: heavy-postfix, deadslow @@ -1902,6 +1879,7 @@ services: name: unwanted process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C irqbalance" hostgroups: computers + excludehostgroups: deadslow #### ### @@ -1917,25 +1895,28 @@ services: name: unwanted process - gkrellmd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C gkrellmd" hostgroups: computers + excludehostgroups: deadslow - name: unwanted process - portmap nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C portmap" hostgroups: computers - excludehostgroups: nfs-client, nfs-server + excludehostgroups: nfs-client, nfs-server, deadslow - name: unwanted process - rpc.statd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C rpc.statd" hostgroups: computers - excludehostgroups: nfs-client, nfs-server + excludehostgroups: nfs-client, nfs-server, deadslow - name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers excludehosts: grieg, abel, alwyn, vasks + excludehostgroups: deadslow - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" hostgroups: computers + excludehostgroups: deadslow #### - @@ -1976,7 +1957,7 @@ services: - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: armhf + hostgroups: wheezy - name: RAID - arrayprobe servicegroups: raid @@ -1994,7 +1975,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460 - excludehosts: kassia - name: HW - hpacucli enclosure status servicegroups: raid @@ -2007,12 +1987,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --ignore-transfer-speed=1I:1:1 --ignore-transfer-speed=1I:1:2" normal_check_interval: 120 hostgroups: dl585 - - - name: HW - hpacucli status - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --ignore-transfer-speed=1I:1:2 --ignore-transfer-speed=1I:1:3 --ignore-transfer-speed=1I:1:4 --ignore-transfer-speed=2I:1:5 --ignore-transfer-speed=2I:1:6" - normal_check_interval: 120 - hosts: kassia ### - name: HW - hpasmcli status @@ -2069,8 +2043,8 @@ services: hostgroups: megactl ### - - name: RAID - DRDB - normal_check_interval: 120 + name: RAID - DRBD + servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All" hostgroups: drbd-hosts ### @@ -2136,7 +2110,7 @@ services: name: unwanted process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C xinetd" hostgroups: computers - excludehostgroups: xinetd-hosts + excludehostgroups: xinetd-hosts, deadslow ### - name: network service - finger @@ -2160,16 +2134,6 @@ services: check: check_tcp!873 hosts: merikanto2 depends: merikanto:process - xinetd - #- - # name: network service - rsync - # check: check_tcp!873 - # hosts: kassia-sec - # depends: kassia:process - xinetd -# - -# name: network service - rsync -# check: check_tcp!873 -# hosts: merikanto2 -# depends: merikanto:process - xinetd ### - @@ -2192,7 +2156,7 @@ services: name: unwanted process - apache2 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C apache2" hostgroups: computers - excludehostgroups: apache2-hosts + excludehostgroups: apache2-hosts, deadslow - name: network service - http @@ -2237,7 +2201,7 @@ services: name: unwanted network service - https check: dsa_check_port_closed!443 hostgroups: apache2-hosts - excludehostgroups: apache-https + excludehostgroups: apache-https, deadslow # ravel does ssh on port 443 excludehosts: ravel normal_check_interval: 60 @@ -2256,7 +2220,7 @@ services: name: unwanted process - named nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C named" hostgroups: computers - excludehostgroups: bind9-hosts + excludehostgroups: bind9-hosts, deadslow #### - @@ -2301,7 +2265,7 @@ services: name: unwanted process - postresql nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres" hostgroups: computers - excludehostgroups: postgres90-hosts, postgres84-hosts, postgres91-hosts + excludehostgroups: postgres90-hosts, postgres84-hosts, postgres91-hosts, deadslow - name: process - postresql91 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:4 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.1/bin/postgres'" @@ -2387,14 +2351,14 @@ services: name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" - hosts: fano, fasch, field, finzi, fils + hosts: fano, fasch, finzi, fils contact_groups: buildd - name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" hostgroups: buildd - excludehosts: fano, fasch, field, finzi, fils + excludehosts: fano, fasch, finzi, fils contact_groups: buildd #### - @@ -2445,7 +2409,7 @@ services: name: unwanted process - automount nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C automount" hostgroups: computers - excludehostgroups: autofs + excludehostgroups: autofs, deadslow ############ MISC OTHER Stuff ############ #####