X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=7fda455407ba1a8b6c9d01c54256703a3d919621;hb=3522d31197e74bed3de85cd608fe69cfb6c79761;hp=de7ae0595f85d578c10266ae3c480c0af95be0e5;hpb=9c5d578009b8c435067773c52f6d0bba8f12bb8d;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index de7ae05..7fda455 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -77,17 +77,21 @@ servers: parents: gw-ubcece hostgroups: layer3-infrastructure gw-karlsruhe: - address: 129.143.166.229 + address: 129.143.57.177 parents: gw-ubcece hostgroups: layer3-infrastructure gw-man-da: address: 82.195.75.126 parents: gw-ubcece hostgroups: layer3-infrastructure - gw-marist: + gw-marist0: address: 148.100.96.1 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-marist: + address: 148.100.88.1 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-osuosl: address: 140.211.166.1 parents: gw-ubcece @@ -113,12 +117,6 @@ servers: address: 86.59.118.145 parents: gw-ubcece hostgroups: layer3-infrastructure - gw-telegraaf2: - address: 217.196.40.15 - parents: gw-ubcece - hostgroups: layer3-infrastructure - contact_groups: +alioth-admins - no-servicegroups: true gw-ubcece: address: 206.12.19.254 hostgroups: layer3-infrastructure @@ -327,6 +325,10 @@ servers: address: 5.153.231.13 parents: gw-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, apache2-hosts + petrova: + address: 5.153.231.25 + parents: gw-bytemark + hostgroups: computers, kvmdomains, wheezy, apache2-hosts couper: address: 5.153.231.14 parents: gw-bytemark @@ -354,11 +356,19 @@ servers: donizetti: address: 5.153.231.20 parents: gw-bytemark - hostgroups: computers, general, kvmdomains, wheezy - dillo: + hostgroups: computers, general, kvmdomains, wheezy, nfs-client, autofs + dillon: address: 5.153.231.22 parents: gw-bytemark - hostgroups: computers, general, kvmdomains, wheezy + hostgroups: computers, general, kvmdomains, wheezy, nfs-client, autofs + ticharich: + address: 5.153.231.23 + parents: gw-bytemark + hostgroups: computers, general, kvmdomains, wheezy, nfs-client, autofs, apache2-hosts, apache-https, service + diamond: + address: 5.153.231.24 + parents: gw-bytemark + hostgroups: computers, service, kvmdomains, wheezy, bind9-hosts, no-bacula # }}} # {{{ gw-c3sl santoro: @@ -483,7 +493,7 @@ servers: bendel: address: 82.195.75.100 parents: ganeti3 - hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, squeeze, postfix-hosts, heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs + hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, wheezy, postfix-hosts, heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs master: address: 82.195.75.110 parents: ganeti3 @@ -514,10 +524,6 @@ servers: address: 82.195.75.102 parents: gw-man-da hostgroups: computers, service, dl360, acpid-hosts, wheezy - diamond: - address: 82.195.75.108 - parents: ganeti3 - hostgroups: computers, service, kvmdomains, wheezy, bind9-hosts, no-bacula draghi: address: 82.195.75.106 parents: ganeti3 @@ -534,6 +540,10 @@ servers: address: 82.195.75.107 parents: ganeti3 hostgroups: computers, service, apache2-hosts, rsyncd-hosts, kvmdomains, xinetd-hosts, wheezy + stockhausen: + address: 82.195.75.108 + parents: ganeti3 + hostgroups: computers, service, kvmdomains, wheezy, acpid-hosts, jetty-hosts ganeti3: address: 82.195.75.111 parents: gw-man-da @@ -541,7 +551,7 @@ servers: wilder: address: 82.195.75.112 parents: ganeti3 - hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, wheezy, acpid-hosts, apache2-hosts, apache-https, rsyncd-hosts, xinetd-hosts + hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, wheezy, acpid-hosts, apache-https, rsyncd-hosts, xinetd-hosts vieuxtemps: address: 82.195.75.113 parents: ganeti3 @@ -550,12 +560,20 @@ servers: address: 82.195.75.114 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, spamd, heavy-exim, mail-relay + denis: + address: 82.195.75.91 + parents: ganeti3 + hostgroups: computers, service, kvmdomains, wheezy, bind9-hosts # }}} # {{{ gw-marist zappa: address: 148.100.96.103 - parents: gw-marist + parents: gw-marist0 hostgroups: computers, buildd, hassrvfs, squeeze, incomingmailrelayed + zani: + address: 148.100.88.22 + parents: gw-marist + hostgroups: computers, buildd, hassrvfs, wheezy # }}} # {{{ gw-osuosl busoni: @@ -602,7 +620,7 @@ servers: caballero: address: 193.201.200.200 parents: gw-rapidswitch - hostgroups: computers, buildd, sw-raid, squeeze + hostgroups: computers, buildd, sw-raid, wheezy, hassrvfs, acpid-hosts # }}} # {{{ gw-sanger sibelius: @@ -640,26 +658,6 @@ servers: parents: gw-sil hostgroups: computers, buildd, wheezy # }}} - # {{{ gw-telegraaf2 - vasks: - address: 217.196.43.140 - parents: gw-telegraaf2 - hostgroups: computers, nfs-server, postgres91-hosts, apache2-hosts, acpid-hosts, apache-https, brokensamhain, no-bacula, sw-raid - contact_groups: alioth-admins - no-servicegroups: true - wagner: - address: 217.196.43.132 - parents: gw-telegraaf2 - hostgroups: computers, bind9-hosts, apache2-hosts, nfs-client, xinetd-hosts, postgres91-hosts, apache-https, dl385, brokensamhain, no-bacula - contact_groups: alioth-admins - no-servicegroups: true - anonscm: - address: 217.196.43.132 - parents: wagner - contact_groups: alioth-admins - hostgroups: secondary-IPs - no-servicegroups: true - # }}} # {{{ gw-ubcece sw-ubcece: hostgroups: layer2-infrastructure @@ -738,7 +736,7 @@ servers: paganini: address: 206.12.19.10 parents: sw-ubcece-kais - hostgroups: computers, hasbootfs, aacraid, hassrvfs, xinetd-hosts, nfs-client, service, apache2-hosts, squeeze, autofs + hostgroups: computers, hasbootfs, aacraid, hassrvfs, nfs-client, service, squeeze, autofs respighi: address: 206.12.19.11 parents: sw-ubcece-kais @@ -1061,6 +1059,9 @@ hostgroups: apache2-hosts: alias: hosts running apache2 private: 1 + jetty-hosts: + alias: hosts running jetty + private: 1 varnish-hosts: alias: hosts running varnish private: 1 @@ -1296,11 +1297,6 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /home" hostgroups: hashomefs - - - name: disk usage on /x - servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /x" - hosts: caballero - name: disk usage on /var/lib/postgresql servicegroups: diskspace @@ -1423,7 +1419,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers excludehostgroups: freebsd - excludehosts: wagner, vasks - name: process - bacula-fd servicegroups: backup @@ -1473,7 +1468,6 @@ services: # name: puppet # nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -i 540 -f /var/lib/puppet/state/state.yaml" # hostgroups: computers - # excludehosts: wagner, vasks #### - @@ -1481,13 +1475,11 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/ferm.conf" hostgroups: computers excludehostgroups: freebsd - excludehosts: vasks, wagner - name: puppetized firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/conf.d/defs.conf" hostgroups: computers excludehostgroups: freebsd - excludehosts: vasks, wagner #### - name: ganeti - job watcher paused nrpe: "/usr/lib/nagios/plugins/negate /usr/lib/nagios/plugins/dsa-check-file -f /var/lib/ganeti/watcher.pause" @@ -1507,7 +1499,11 @@ services: normal_check_interval: 60 retry_check_interval: 5 excludehostgroups: brokensamhain - + #### + - + name: process - acc.umu.se backup + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -a 'dsmc'" + hosts: sibelius #### - name: users @@ -1572,7 +1568,6 @@ services: servicegroups: weaksshkeys nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/weak-ssh-keys" hostgroups: computers - excludehosts: wagner, vasks normal_check_interval: 60 #### - @@ -1593,7 +1588,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a '/usr/sbin/munin-node'" hostgroups: computers excludehostgroups: freebsd, armhf - excludehosts: vasks, wagner - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" @@ -1608,7 +1602,6 @@ services: check: check_tcp!4949 hostgroups: computers depends: process - munin-node - excludehosts: vasks, wagner ### - name: process - ntpd @@ -1648,7 +1641,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers excludehostgroups: freebsd - excludehosts: vasks, wagner - name: process - syslog-ng @@ -1660,13 +1652,11 @@ services: remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" runfrom: lotti hostgroups: computers - excludehosts: vasks, wagner - name: remote logging on lully remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" runfrom: lully hostgroups: computers - excludehosts: vasks, wagner ### MAIL STUFF ### - @@ -1698,40 +1688,36 @@ services: name: process - clamav - clamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u clamav -C clamd -a '/usr/sbin/clamd'" hostgroups: heavy-exim, heavy-postfix - hosts: wagner - name: service - clamav nrpe: "/usr/lib/nagios/plugins/check_clamd -H /var/run/clamav/clamd.ctl" hostgroups: heavy-exim, heavy-postfix - hosts: wagner depends: process - clamav - clamd - name: process - clamav - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --quiet'" - hosts: wagner hostgroups: heavy-exim, heavy-postfix - name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix, deadslow - excludehosts: wagner - name: unwanted process - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix, deadslow - excludehosts: wagner + ### - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hostgroups: spamd - excludehosts: wagner, picconi + excludehosts: picconi excludehostgroups: deadslow - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 20 --min-spare=5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" - hosts: wagner, picconi + hosts: picconi - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 10 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" @@ -1739,7 +1725,7 @@ services: - name: process - spamd - child nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:11 -c 1: -C spamd -a 'spamd child'" - hosts: wagner, bendel + hosts: bendel hostgroups: spamd depends: process - spamd - master # @@ -1757,7 +1743,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers excludehostgroups: spamd, deadslow - excludehosts: bendel, busoni, wagner, buxtehude + excludehosts: bendel, busoni, buxtehude ### #- @@ -1778,7 +1764,7 @@ services: hostgroups: heavy-exim - name: process - postgrey - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -C postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" hostgroups: heavy-postfix # - @@ -1789,11 +1775,11 @@ services: ### - name: process - amavis - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u amavis -C amavisd-new -a 'amavisd-new (master)'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u amavis -a 'amavisd-new (master)'" hostgroups: amavis-hosts - name: process - amavis - all - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1:10 -u amavis -C amavisd-new -a 'amavisd-new '" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1:10 -u amavis -a 'amavisd-new '" hostgroups: amavis-hosts depends: process - amavis - master # @@ -1818,27 +1804,11 @@ services: hostgroups: heavy-postfix depends: process - weightd - master ### - - - name: process - weightd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u Debian-exim -a 'policyd-weight (master)'" - hosts: wagner - - - name: process - weightd - cache - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u Debian-exim -a 'policyd-weight (cache)'" - hosts: wagner - depends: process - weightd - master - - - name: process - weightd - child - nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:50 -c 1: -u Debian-exim -a 'policyd-weight (child)'" - hosts: wagner - depends: process - weightd - master - # - name: unwanted process - policyd-weight nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C policyd-weight" hostgroups: computers excludehostgroups: heavy-postfix, deadslow - excludehosts: wagner ### @@ -1928,51 +1898,43 @@ services: name: setup - dsa config nrpe: "/usr/lib/nagios/plugins/dsa-check-config" hostgroups: computers - excludehosts: wagner, vasks normal_check_interval: 60 - name: setup - local hostname etc-hosts nrpe: 'if getent ahosts `hostname` | grep -q 127.0; then echo "Warning: local hostname resolves to 127/8 address"; exit 1; else echo "OK: Hostname resolves to non-127/8 address."; exit 0; fi' hostgroups: computers - excludehosts: wagner, vasks normal_check_interval: 60 - name: setup - ud-ldap freshness nrpe: "/usr/lib/nagios/plugins/dsa-check-udldap-freshness" - excludehosts: wagner, vasks hostgroups: computers - name: system - available entropy nrpe: "/usr/lib/nagios/plugins/dsa-check-entropy" event_handler: dsa_event_handler_restart_ekey hostgroups: computers - excludehosts: vasks, wagner excludehostgroups: freebsd - name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" normal_check_interval: 60 retry_check_interval: 15 - excludehosts: wagner, vasks hostgroups: computers ### - name: local resolver nrpe: "/usr/lib/nagios/plugins/dsa-check-resolver www.debian.org www.google.com" hostgroups: computers - excludehosts: vasks, wagner normal_check_interval: 60 - name: process - unbound nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u unbound -C unbound -a '/usr/sbin/unbound'" - excludehosts: vasks, wagner hostgroups: unbound-hosts, squeeze, wheezy ### - name: process - uptimed nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C uptimed -a '/usr/sbin/uptimed'" hostgroups: computers - excludehosts: vasks, wagner ### - name: unwanted process - irqbalance @@ -2004,7 +1966,7 @@ services: name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers - excludehosts: abel, alwyn, vasks + excludehosts: abel, alwyn excludehostgroups: deadslow - name: unwanted process - snmpd @@ -2053,13 +2015,12 @@ services: - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/sbin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: computers - excludehosts: vasks, wagner, quantz - excludehostgroups: armhf + hostgroups: squeeze - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" - hostgroups: wheezy + hostgroups: computers + excludehostgroups: squeeze - name: HW - hpacucli status servicegroups: raid @@ -2168,7 +2129,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers excludehostgroups: freebsd, sparc - excludehosts: vasks, wagner - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" @@ -2200,11 +2160,6 @@ services: # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C bosserver -a '/usr/sbin/bosserver'" # hostgroups: bosserver # - ### - - - name: process - inetd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C inetd -a '/usr/sbin/inetd'" - hosts: vasks ### - name: process - xinetd @@ -2245,6 +2200,16 @@ services: # there is always one extra process per check currently running.. nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:30 -c 1: -u nagios -C icinga -a '/usr/sbin/icinga -d /etc/icinga/icinga.cfg'" hosts: tchaikovsky + ### + - + name: process - jetty - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -a 'jsvc.exec'" + hostgroups: jetty-hosts + - + name: process - jetty - worker + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1:100 -u jetty -a 'jsvc.exec -user jetty'" + hostgroups: jetty-hosts + depends: process - jetty - master ### - @@ -2328,15 +2293,6 @@ services: ### -# Alioth web URLs - - - - name: network service - loggerhead - remotecheck: "/usr/lib/nagios/plugins/check_http -H anonscm.debian.org -u /loggerhead/" - hosts: anonscm - runfrom: tchaikovsky - depends: wagner:process - apache2 - master - #### - name: process - named @@ -2444,10 +2400,6 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-ups" hosts: franck depends: process - UPS - nut upsd - - - name: process - pglistener - nrpe: "/usr/lib/nagios/plugins/check_procs -u pglisten -C python -a '/usr/bin/python /usr/share/pglistener/starter.py /etc/pglistener/pglistener.cfg /etc/pglistener/conf.d' -w 1: -c 1:" - hosts: wagner, vasks ### - name: process - buildd @@ -2483,15 +2435,6 @@ services: hosts: gombert contact_groups: gobby #### - - - name: network service - git - check: check_tcp!9418 - hosts: wagner - - - name: network service - svn - check: check_tcp!3690 - hosts: wagner - ### #- # name: process - tftpd # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C in.tftpd -a '/usr/sbin/in.tftpd -l -B 1450 -s /var/lib/tftpboot'"