X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=dc5f804b1c47937032b6e304f176729a84050f55;hb=038e3a09fababe90fbfcc4dee268516ca312373f;hp=457189dd12167468823799e555558a2437f93b48;hpb=cd7c11183cf61427bcffd2200598446ef689cec0;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 457189d..dc5f804 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -39,6 +39,10 @@ servers: address: 130.239.18.97 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-bytemark: + address: 89.16.160.116 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-c3sl: address: 200.17.202.254 parents: gw-ubcece @@ -105,7 +109,6 @@ servers: address: 82.195.75.126 parents: gw-ubcece hostgroups: layer3-infrastructure - contacts: joerg, bzed gw-marist: address: 148.100.96.1 parents: gw-ubcece @@ -172,8 +175,7 @@ servers: powell: address: 87.106.64.223 parents: gw-1und1 - hostgroups: computers, service, spamd, heavy-exim, rsyncd-hosts, acpid-hosts, hassrvfs, hasvarfs, hasusrfs, xinetd-hosts, apache2-hosts, squeeze - contacts: joerg + hostgroups: computers, service, acpid-hosts, wheezy # }}} # {{{ gw-1und1-sec schumann: @@ -255,7 +257,7 @@ servers: old-master: address: 97.107.116.29 parents: gw-brainfood - hostgroups: computers, general, apache2-hosts, spamd, heavy-exim, highload, xinetd-hosts, mptraid, squeeze, bacula-client + hostgroups: computers, general, spamd, heavy-exim, highload, xinetd-hosts, mptraid, squeeze, bacula-client murphy: address: 97.107.116.31 parents: gw-brainfood @@ -271,6 +273,37 @@ servers: parents: gw-brown hostgroups: computers, service, dl385, acpid-hosts, xinetd-hosts, hassrvfs, squeeze, postgres91-hosts # }}} + # {{{ gw-bytemark + bm-bl1: + address: 5.153.231.241 + parents: gw-bytemark + hostgroups: computers, bl460, acpid-hosts, service, wheezy + bm-bl2: + address: 5.153.231.242 + parents: gw-bytemark + hostgroups: computers, bl460, acpid-hosts, service, wheezy + bm-bl3: + address: 5.153.231.243 + parents: gw-bytemark + hostgroups: computers, bl460, acpid-hosts, service, wheezy + bm-bl4: + address: 5.153.231.244 + parents: gw-bytemark + hostgroups: computers, bl460, acpid-hosts, service, wheezy + bm-bl5: + address: 5.153.231.245 + parents: gw-bytemark + hostgroups: computers, bl460, acpid-hosts, service, wheezy + + milanollo: + address: 5.153.231.2 + parents: gw-bytemark + hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-server + picconi: + address: 5.153.231.3 + parents: gw-bytemark + hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-client, autofs + # }}} # {{{ gw-c3sl santoro: address: 200.17.202.197 @@ -319,7 +352,6 @@ servers: address: 93.94.130.160 parents: gw-dgi hostgroups: computers, sw-raid, hassrvfs, wheezy - contacts: bzed # }}} # {{{ gw-ftcollins alkman: @@ -362,7 +394,7 @@ servers: address: 194.177.211.201 parents: rautavaara hostgroups: computers, freebsd, squeeze, buildd, hassrvfs - #, mptraid + contacts: christoph grieg: address: 194.177.211.200 parents: gw-grnet @@ -433,23 +465,24 @@ servers: hostgroups: computers, service, dl380, acpid-hosts, squeeze, drbd-hosts bendel: address: 82.195.75.100 - parents: czerny + parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, squeeze, postfix-hosts, heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs master: address: 82.195.75.110 - parents: czerny + parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, bacula-client, spamd, heavy-exim, highload fils: address: 82.195.75.89 - parents: czerny + parents: ganeti3 hostgroups: computers, freebsd, squeeze, buildd, hassrvfs + contacts: christoph vento: address: 82.195.75.98 - parents: czerny + parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, heavy-exim lully: address: 82.195.75.99 - parents: czerny + parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvarlogfs, bacula-client rem: address: 82.195.75.68 @@ -461,23 +494,23 @@ servers: hostgroups: computers, service, dl360, acpid-hosts, squeeze diamond: address: 82.195.75.108 - parents: unger + parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, bind9-hosts draghi: address: 82.195.75.106 - parents: unger + parents: ganeti3 hostgroups: computers, service, hasbootfs, hassrvfs, apache2-hosts, bind9-hosts, spamd, heavy-exim, kvmdomains, xinetd-hosts, apache-https, squeeze, bacula-client geo1: address: 82.195.75.105 - parents: unger + parents: ganeti3 hostgroups: computers, service, hasbootfs, bind9-hosts, kvmdomains, squeeze handel: address: 82.195.75.104 - parents: unger + parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, apache2-hosts, squeeze, apache-https, hasvarfs kaufmann: address: 82.195.75.107 - parents: unger + parents: ganeti3 hostgroups: computers, service, hasbootfs, apache2-hosts, rsyncd-hosts, kvmdomains, xinetd-hosts, squeeze ganeti3: address: 82.195.75.111 @@ -487,11 +520,14 @@ servers: address: 82.195.75.112 parents: ganeti3 hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, wheezy, acpid-hosts, apache2-hosts, apache-https, bacula-client - -# lamb: -# address: 82.195.75.101 -# parents: unger -# hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa, bosserver + vieuxtemps: + address: 82.195.75.113 + parents: ganeti3 + hostgroups: computers, service, kvmdomains, wheezy, varnish-hosts + mailly: + address: 82.195.75.114 + parents: ganeti3 + hostgroups: computers, service, kvmdomains, wheezy, spamd, heavy-exim, mail-relay # }}} # {{{ gw-marist zappa: @@ -507,11 +543,11 @@ servers: byrd: address: 140.211.166.20 parents: gw-osuosl - hostgroups: computers, service, dl380, acpid-hosts, squeeze + hostgroups: computers, service, dl380, acpid-hosts, wheezy buxtehude: address: 140.211.166.26 parents: byrd - hostgroups: computers, service, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres91-hosts, squeeze, hasvarlogfs + hostgroups: computers, service, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres91-hosts, wheezy, hasvarlogfs # malo TODO mayer: address: 140.211.166.78 @@ -554,7 +590,7 @@ servers: sibelius: address: 193.62.202.28 parents: gw-sanger - hostgroups: computers, acpid-hosts, postgres90-hosts, service, apache2-hosts, sw-raid, squeeze, rsyncd-hosts, xinetd-hosts, hasvarlogfs + hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, squeeze, rsyncd-hosts, xinetd-hosts, hasvarlogfs contacts: tjrc1, dave smetana: address: 193.62.202.29 @@ -617,6 +653,12 @@ servers: hostgroups: computers, bind9-hosts, apache2-hosts, nfs-client, xinetd-hosts, postgres91-hosts, apache-https, dl385, brokensamhain contact_groups: alioth-admins no-servicegroups: true + anonscm: + address: 217.196.43.132 + parents: wagner + contact_groups: alioth-admins + hostgroups: secondary-IPs + no-servicegroups: true # }}} # {{{ gw-ubcece sw-ubcece: @@ -696,7 +738,7 @@ servers: morricone: address: 206.12.19.9 parents: sw-ubcece-kais - hostgroups: computers, hasbootfs, hasvarfs, hassrvfs, aacraid, postgres90-hosts, rsyncd-hosts, heavy-exim, xinetd-hosts, apache2-hosts, service, squeeze, uploadqueue + hostgroups: computers, hasbootfs, hasvarfs, hassrvfs, aacraid, rsyncd-hosts, heavy-exim, xinetd-hosts, apache2-hosts, service, squeeze, uploadqueue stabile: address: 206.12.19.13 parents: sw-ubcece-kais @@ -725,10 +767,12 @@ servers: address: 206.12.19.110 parents: luchesi hostgroups: computers, freebsd, squeeze, buildd, hassrvfs + contacts: christoph finzi: address: 206.12.19.111 parents: luchesi hostgroups: computers, freebsd, squeeze, buildd, hassrvfs + contacts: christoph fischer: address: 206.12.19.112 parents: luchesi @@ -736,7 +780,7 @@ servers: gabrielli: address: 206.12.19.17 parents: sw-ubcece-kais - hostgroups: computers, porterbox, squeeze + hostgroups: computers, porterbox, wheezy corelli: address: 206.12.19.16 parents: sw-ubcece-kais @@ -748,7 +792,7 @@ servers: rossini: address: 206.12.19.19 parents: sw-ubcece-kais - hostgroups: computers, dl585, acpid-hosts, service, squeeze + hostgroups: computers, dl585, acpid-hosts, service, wheezy salieri: address: 206.12.19.20 parents: sw-ubcece-kais @@ -784,7 +828,7 @@ servers: glinka: address: 206.12.19.126 parents: traetta - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, apache2-hosts, nfs-client, autofs + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, apache2-hosts, nfs-client, autofs, xinetd-hosts dukas: address: 206.12.19.128 parents: traetta @@ -836,11 +880,11 @@ servers: beach: address: 206.12.19.140 parents: ganeti2 - hostgroups: computers, service, kvmdomains, squeeze, apache2-hosts, xinetd-hosts, hassrvfs, nfs-server, rsyncd-hosts + hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, xinetd-hosts, hassrvfs, nfs-server, rsyncd-hosts ullmann: address: 206.12.19.141 parents: ganeti2 - hostgroups: computers, service, kvmdomains, squeeze, postgres91-hosts, nfs-client, apache2-hosts, autofs + hostgroups: computers, service, kvmdomains, wheezy, postgres91-hosts, nfs-client, apache2-hosts, autofs sonntag: address: 206.12.19.142 parents: ganeti2 @@ -858,6 +902,10 @@ servers: address: 206.12.19.145 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts + muffat: + address: 206.12.19.146 + parents: ganeti2 + hostgroups: computers, service, kvmdomains, wheezy, spamd, heavy-exim, mail-relay # }}} # {{{ gw-ugent ancina: @@ -876,7 +924,7 @@ servers: klecker: address: 130.89.148.10 parents: gw-utwente - hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, acpid-hosts, xinetd-hosts, squeeze, incomingmailrelayed, hassrvfs + hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, acpid-hosts, xinetd-hosts, squeeze, incomingmailrelayed2025, hassrvfs klecker-ftp: address: 130.89.148.12 parents: klecker @@ -1031,6 +1079,9 @@ hostgroups: apache2-hosts: alias: hosts running apache2 private: 1 + varnish-hosts: + alias: hosts running varnish + private: 1 bind9-hosts: alias: hosts running bind9 private: 1 @@ -1056,9 +1107,6 @@ hostgroups: postgres84-hosts: alias: hosts running postgres84 private: 1 - postgres90-hosts: - alias: hosts running postgres90 - private: 1 postgres91-hosts: alias: hosts running postgres91 private: 1 @@ -1158,6 +1206,8 @@ servicegroups: alias: buildd checks raid: alias: raid checks + backup: + alias: backup checks kernel: alias: kernel checks weaksshkeys: @@ -1213,7 +1263,7 @@ services: - name: disk usage - all servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk -w 10% -c 5% -A -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs --ignore-eregi-path=/srv/snapshot.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk -w 5% -c 3% -A -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs --ignore-eregi-path=/srv/snapshot.debian.org" hosts: stabile - name: disk usage - all @@ -1262,7 +1312,7 @@ services: name: disk usage on /tmp servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp" - hosts: saens, powell, piatti + hosts: saens, piatti - name: disk usage on /usr servicegroups: diskspace @@ -1307,7 +1357,7 @@ services: - name: disk usage on /srv/snapshot.debian.org servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 94 98 /srv/snapshot.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk 98 99 /srv/snapshot.debian.org" hosts: stabile - name: disk usage on /srv/snapshot.debian.org @@ -1368,6 +1418,7 @@ services: #### - name: backup + servicegroups: backup nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-dabackup" hostgroups: computers normal_check_interval: 60 @@ -1375,24 +1426,38 @@ services: retry_check_interval: 5 - name: backup server config + servicegroups: backup nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" hosts: beethoven normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 - - name: backup - bacula - remotecheck: "sudo /usr/lib/nagios/plugins/dsa-check-bacula -H $HOSTNAME$" + name: backup - bacula - last backup + servicegroups: backup + remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula $HOSTNAME$.debian.org" + runfrom: dinis + hostgroups: bacula-client + normal_check_interval: 60 + retry_check_interval: 15 + - + name: backup - bacula - last full backup + servicegroups: backup + remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula -w 840 -c 1560 $HOSTNAME$.debian.org F" runfrom: dinis hostgroups: bacula-client + normal_check_interval: 60 + retry_check_interval: 15 - name: process - bacula-fd + servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers excludehostgroups: freebsd excludehosts: wagner, vasks - name: process - bacula-fd + servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: freebsd @@ -1435,11 +1500,11 @@ services: # retry_check_interval: 5 #### - - - name: puppet - nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -i 540 -f /var/lib/puppet/state/state.yaml" - hostgroups: computers - excludehosts: wagner, vasks + #- + # name: puppet + # nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -i 540 -f /var/lib/puppet/state/state.yaml" + # hostgroups: computers + # excludehosts: wagner, vasks #### - @@ -1688,12 +1753,12 @@ services: name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hostgroups: spamd - excludehosts: powell, wagner + excludehosts: wagner excludehostgroups: deadslow - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 20 --min-spare=5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" - hosts: powell, wagner + hosts: wagner - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 10 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" @@ -1981,6 +2046,13 @@ services: servicegroups: raid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /var/run/mdadm/monitor.pid --daemonise --scan'" hostgroups: sw-raid + excludehosts: argento + - + # wheezy: + name: process - mdadm monitor + servicegroups: raid + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" + hosts: argento - name: RAID - sw raid servicegroups: raid @@ -2004,6 +2076,7 @@ services: nrpe: "sudo /usr/bin/arrayprobe" hostgroups: dl385, dl380, dl360, bl460, dl585 excludehosts: franck + excludehostgroups: wheezy - name: RAID - arrayprobe servicegroups: raid @@ -2253,6 +2326,33 @@ services: excludehosts: ravel normal_check_interval: 60 +### + - + name: process - varnish - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C varnishd -a '/usr/sbin/varnishd -P /var/run/varnishd.pid -a :80 -T localhost:6082 -f /etc/varnish/default.vcl'" + hostgroups: varnish-hosts + - + name: process - varnish - worker + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u nobody -C varnishd -a '/usr/sbin/varnishd -P /var/run/varnishd.pid -a :80 -T localhost:6082 -f /etc/varnish/default.vcl'" + hostgroups: varnish-hosts + depends: process - varnish - master + - + name: network service - http + check: check_http + hostgroups: varnish-hosts + depends: process - varnish - master + +### + +# Alioth web URLs + + - + name: network service - loggerhead + remotecheck: "/usr/lib/nagios/plugins/check_http -H anonscm.debian.org -u /loggerhead/" + hosts: anonscm + runfrom: tchaikovsky + depends: wagner:process - apache2 - master + #### - name: process - named @@ -2293,40 +2393,40 @@ services: ### #- - # name: process - postresql81 - master + # name: process - postgresql81 - master # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a '/usr/lib/postgresql/8.1/bin/postmaster -D /var/lib/postgresql/8.1/main -c config_file=/etc/postgresql/8.1/main/postgresql.conf'" # hostgroups: postgres81-hosts #- - # name: process - postresql81 - writer + # name: process - postgresql81 - writer # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: writer process'" # hostgroups: postgres81-hosts - # depends: process - postresql81 - master + # depends: process - postgresql81 - master #- - # name: process - postresql81 - buffer + # name: process - postgresql81 - buffer # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats buffer process'" # hostgroups: postgres81-hosts - # depends: process - postresql81 - master + # depends: process - postgresql81 - master #- - # name: process - postresql81 - collector + # name: process - postgresql81 - collector # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats collector process'" # hostgroups: postgres81-hosts - # depends: process - postresql81 - master + # depends: process - postgresql81 - master #### - - name: unwanted process - postresql + name: unwanted process - postgresql nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres" hostgroups: computers - excludehostgroups: postgres90-hosts, postgres84-hosts, postgres91-hosts, deadslow + excludehostgroups: postgres84-hosts, postgres91-hosts, deadslow + - + name: unwanted process - postgresql 9.0 + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres -a '9.0/bin/postgres'" + hostgroups: computers - - name: process - postresql91 - master + name: process - postgresql91 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:4 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.1/bin/postgres'" hostgroups: postgres91-hosts - - name: process - postresql90 - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:4 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.0/bin/postgres'" - hostgroups: postgres90-hosts - - - name: process - postresql84 - master + name: process - postgresql84 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:4 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/8.4/bin/postgres'" hostgroups: postgres84-hosts - @@ -2422,6 +2522,7 @@ services: name: process - portmap nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C portmap -a '/sbin/portmap'" hostgroups: nfs-client, nfs-server + excludehostgroups: wheezy - name: process - statd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u statd -C rpc.statd -a '/sbin/rpc.statd'" @@ -2501,10 +2602,6 @@ services: name: DNS SOA sync - alioth.debian.org check: "dsa_check_soas_add!alioth.debian.org!alioth.debian.org" hosts: global - - - name: DNS SOA sync - 2.5.1.1.8.0.0.8.d.8.0.1.0.0.2.ip6.arpa - check: "dsa_check_soas!2.5.1.1.8.0.0.8.d.8.0.1.0.0.2.ip6.arpa" - hosts: global - name: DNS SOA sync - 2.6.a.0.4.6.5.6.1.0.0.0.2.0.0.0.8.d.8.0.1.0.0.2.ip6.arpa check: "dsa_check_soas!2.6.a.0.4.6.5.6.1.0.0.0.2.0.0.0.8.d.8.0.1.0.0.2.ip6.arpa" @@ -2536,7 +2633,7 @@ services: hosts: giustini - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=7634 $HOSTADDRESS$ public" + remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=7778 $HOSTADDRESS$ public" runfrom: dijkstra hosts: giustini