X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=63ad100591227faef4d79dc2e17c9063851a1aa5;hb=0929c982ab97bdb6f32327f5007aa6d67995d520;hp=b841c86209cc014e8dad3bab810a741fa6d80919;hpb=6e3ff0bce4c72c214a94adf02c3d8b313823a8b2;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index b841c86..63ad100 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -33,6 +33,10 @@ servers: address: 130.239.18.97 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-aql: + address: 141.170.2.17 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-bytemark: address: 89.16.160.116 parents: gw-ubcece @@ -114,6 +118,10 @@ servers: address: 193.201.200.129 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-sakura: + address: 133.242.99.65 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-sanger: address: 193.62.202.20 parents: gw-ubcece @@ -214,15 +222,29 @@ servers: parents: gw-accumu hostgroups: computers, buildd, hassrvfs, wheezy # }}} + # {{{ gw-aql + mips-aql-01: + address: 141.170.6.149 + parents: gw-aql + hostgroups: computers, buildd, wheezy + mips-aql-02: + address: 141.170.6.150 + parents: gw-aql + hostgroups: computers, buildd, wheezy + mipsel-aql-01: + address: 141.170.6.152 + parents: gw-aql + hostgroups: computers, buildd, jessie, hassrvfs, hasbootfs, sw-raid + mipsel-aql-02: + address: 141.170.6.153 + parents: gw-aql + hostgroups: computers, buildd, jessie, hassrvfs, hasbootfs, sw-raid + # }}} # {{{ gw-arm abel: address: 217.140.96.56 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, porterbox, wheezy, broken_mq - antheil: - address: 217.140.96.60 - parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq arnold: address: 217.140.96.57 parents: gw-arm @@ -243,18 +265,14 @@ servers: address: 217.140.96.67 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, broken_mq - hasse: - address: 217.140.96.68 - parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, broken_mq - henze: - address: 217.140.96.70 - parents: gw-arm - hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, broken_mq hoiby: address: 217.140.96.71 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd, broken_mq + ia64-arm-01: + address: 217.140.96.61 + parents: gw-arm + hostgroups: computers, hasbootfs, hassrvfs, wheezy, buildd, broken_mq, sw-raid, acpid-hosts # }}} # {{{ gw-brown franck: @@ -357,11 +375,7 @@ servers: coccia: address: 5.153.231.11 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, wheezy, autofs, nfs-client, uploadqueue, xinetd-hosts - backuphost: - address: 5.153.231.12 - parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, wheezy + hostgroups: computers, hassrvfs, kvmdomains, wheezy, autofs, nfs-client, uploadqueue, xinetd-hosts, apache-https, apache2-hosts philp: address: 5.153.231.13 parents: ganeti-bytemark @@ -444,6 +458,14 @@ servers: address: 5.153.231.35 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts + lindsay: + address: 5.153.231.36 + parents: ganeti-bytemark + hostgroups: computers, service, kvmdomains, jessie + sor: + address: 5.153.231.38 + parents: ganeti-bytemark + hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts # }}} # {{{ gw-c3sl santoro: @@ -546,7 +568,7 @@ servers: rautavaara: address: 194.177.211.199 parents: gw-grnet - hostgroups: computers, acpid-hosts, megaraid, service, squeeze, nfs-server + hostgroups: computers, acpid-hosts, megaraid, service, wheezy loghost-grnet-01: address: 194.177.211.200 parents: gw-grnet @@ -597,7 +619,7 @@ servers: asachi: address: 64.28.108.84 parents: gw-linaro - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq + hostgroups: computers, hasbootfs, hassrvfs, porterbox, wheezy, broken_mq # }}} # {{{ gw-karlsruhe zemlinsky: @@ -630,11 +652,11 @@ servers: hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, spamd, heavy-exim, highload mipsel-manda-01: address: 82.195.75.72 - parents: gw-arm + parents: gw-man-da hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy mipsel-manda-02: address: 82.195.75.74 - parents: gw-arm + parents: gw-man-da hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy fils: address: 82.195.75.89 @@ -654,10 +676,6 @@ servers: address: 82.195.75.99 parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hasvarlogfs - rem: - address: 82.195.75.68 - parents: gw-man-da - hostgroups: computers, hasbootfs, hassrvfs, wheezy, no-bacula draghi: address: 82.195.75.106 parents: ganeti3 @@ -698,6 +716,10 @@ servers: address: 82.195.75.92 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy + wolkenstein: + address: 82.195.75.65 + parents: ganeti3 + hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, rsyncd-hosts, apache2-hosts, wheezy mipsel-manda-01: address: 82.195.75.72 parents: gw-man-da @@ -768,7 +790,7 @@ servers: sibelius: address: 193.62.202.28 parents: gw-sanger - hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, squeeze, rsyncd-hosts, xinetd-hosts, hasvarlogfs + hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, wheezy, rsyncd-hosts, xinetd-hosts, hasvarlogfs contacts: tjrc1, dave smetana: address: 193.62.202.29 @@ -859,10 +881,6 @@ servers: address: 206.12.19.118 parents: ganeti2 hostgroups: computers, general, apache2-hosts, hasbootfs, kvmdomains, apache-https, wheezy - wolkenstein: - address: 206.12.19.116 - parents: ganeti2 - hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, rsyncd-hosts, apache2-hosts, wheezy brahms: address: 206.12.19.115 parents: ganeti2 @@ -1007,10 +1025,18 @@ servers: address: 143.106.167.145 parents: gw-unicamp hostgroups: layer3-infrastructure + prokofiev: + address: 143.106.167.147 + parents: gw-unicamp + hostgroups: computers, jessie, service powerpc-unicamp-01: address: 143.106.167.149 - parents: asgard + parents: prokofiev hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy + ppc64el-unicamp-01: + address: 143.106.167.135 + parents: prokofiev + hostgroups: computers, hasbootfs, hassrvfs, buildd, jessie # }}} # {{{ gw-utwente klecker: @@ -1031,11 +1057,15 @@ servers: hostgroups: secondary-IPs # }}} # {{{ gw-ynic - howells: + henze: + address: 144.32.168.74 + parents: gw-ynic + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd + hasse: address: 144.32.168.75 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd - hummel: + antheil: address: 144.32.168.76 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd @@ -1047,6 +1077,18 @@ servers: address: 144.32.168.77 parents: gw-ynic hostgroups: computers, buildd, sw-raid, hassrvfs, wheezy + #antheil: + # address: 217.140.96.60 + # parents: gw-arm + # hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, broken_mq + #hasse: + # address: 217.140.96.68 + # parents: gw-arm + # hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, broken_mq + #henze: + # address: 217.140.96.70 + # parents: gw-arm + # hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, broken_mq # }}} # {{{ gw-zivit zandonai: @@ -1058,6 +1100,11 @@ servers: parents: gw-zivit hostgroups: computers, porterbox, hassrvfs, wheezy # }}} + # {{{ gw-sakura + setoguchi: + address: 133.242.99.74 + parents: gw-sakura + hostgroups: computers, service, wheezy, no-bacula, hassrvfs, apache2-hosts, rsyncd-hosts, xinetd-hosts, security_mirror, acpid-hosts # }}} # {{{ ############################# host groups ############################# @@ -1145,6 +1192,8 @@ hostgroups: alias: Hosts running squeeze wheezy: alias: Hosts running wheezy + jessie: + alias: Hosts running jessie kvmdomains: alias: Hosts that are KVM domains @@ -1352,7 +1401,7 @@ services: - name: disk usage - all servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs 95 98" + nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs -x /srv/farm-snapshot/farm-misc 95 98" hosts: sibelius - @@ -1416,9 +1465,24 @@ services: nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-misc + name: disk usage on /srv/farm-snapshot/farm-1 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-1" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-3 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-misc" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-3" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-4 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-4" hosts: sibelius - name: disk usage on /var/lib/postgresql/9.1 @@ -1506,6 +1570,12 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C getty -a /sbin/getty" hostgroups: computers excludehosts: zelenka, zandonai + excludehostgroups: jessie + - + name: process - getty + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/agetty" + hostgroups: computers + hostgroups: jessie - name: processes - zombies nrpe: "/usr/lib/nagios/plugins/check_procs 5 10 -s Z" @@ -1529,7 +1599,7 @@ services: servicegroups: backup nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-dabackup" hostgroups: computers - excludehosts: backuphost + excludehosts: storace normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1537,7 +1607,7 @@ services: name: backup server config servicegroups: backup nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" - hosts: backuphost + hosts: storace normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1606,7 +1676,12 @@ services: name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers - excludehostgroups: freebsd, sparc + excludehostgroups: freebsd, sparc, jessie + - + name: process - ulogd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u ulog -C ulogd -a '/usr/sbin/ulogd --daemon --uid ulog'" + hostgroups: jessie + excludehostgroups: freebsd - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" @@ -1638,12 +1713,16 @@ services: name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers - excludehostgroups: freebsd + excludehostgroups: freebsd, jessie - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: freebsd + - + name: process - syslog-ng + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -F'" + hostgroups: jessie - name: remote logging on lotti @@ -1702,7 +1781,7 @@ services: - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" - hostgroups: wheezy + hostgroups: wheezy, jessie excludehostgroups: freebsd - name: network service - munin-node @@ -1750,7 +1829,7 @@ services: name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" hostgroups: computers - excludehostgroups: squeeze, alioth + excludehostgroups: squeeze, alioth, jessie ### - name: MQ connection on rainier @@ -1791,7 +1870,11 @@ services: name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers - excludehostgroups: freebsd + excludehostgroups: freebsd, jessie + - + name: process - udevd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C systemd-udevd -a '/lib/systemd/systemd-udevd'" + hostgroups: jessie - name: unexpected process - udev nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" @@ -1820,7 +1903,7 @@ services: - name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" - hostgroups: squeeze, wheezy + hostgroups: squeeze, wheezy, jessie excludehostgroups: freebsd, alioth # }}} # {{{ anti-services @@ -1866,16 +1949,15 @@ services: - name: process - mdadm monitor servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /var/run/mdadm/monitor.pid --daemonise --scan'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" hostgroups: sw-raid - excludehostgroups: wheezy + excludehostgroups: jessie - - # wheezy: name: process - mdadm monitor servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --scan'" hostgroups: sw-raid - excludehostgroups: squeeze + excludehostgroups: wheezy - name: RAID - sw raid servicegroups: raid @@ -2295,7 +2377,7 @@ services: - name: postgresql backups nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg" - hosts: backuphost + hosts: storace # }}} # {{{ power # - @@ -2594,6 +2676,17 @@ services: hosts: gombert contact_groups: gobby #### + - + name: network service - sip-tls cert - 443 + check: dsa_check_cert!443 + normal_check_interval: 60 + hosts: vogler + - + name: network service - sip-tls cert - 5061 + check: dsa_check_cert!5061 + normal_check_interval: 60 + hosts: vogler + #### - name: puppetmaster cert nrpe: "/usr/lib/nagios/plugins/dsa-check-cert-expire /var/lib/puppet/ssl/certs/ca.pem"