X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=b400f2e3a7a583f433a21daece2777924d6250a5;hb=9076f9562a9cd7aeb7a20fbf66681b38585cdda9;hp=0f690e3ea4bc4448c9ef94acc3e7dc5c7c8bd56f;hpb=b645ba0e657ad48c28995da6166dae8980d1a5c7;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 0f690e3..b400f2e 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -33,6 +33,10 @@ servers: address: 130.239.18.97 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-aql: + address: 141.170.2.17 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-bytemark: address: 89.16.160.116 parents: gw-ubcece @@ -114,6 +118,10 @@ servers: address: 193.201.200.129 parents: gw-ubcece hostgroups: layer3-infrastructure + gw-sakura: + address: 133.242.99.65 + parents: gw-ubcece + hostgroups: layer3-infrastructure gw-sanger: address: 193.62.202.20 parents: gw-ubcece @@ -214,6 +222,24 @@ servers: parents: gw-accumu hostgroups: computers, buildd, hassrvfs, wheezy # }}} + # {{{ gw-aql + mips-aql-01: + address: 141.170.6.149 + parents: gw-aql + hostgroups: computers, buildd, wheezy + mips-aql-02: + address: 141.170.6.150 + parents: gw-aql + hostgroups: computers, buildd, wheezy + mipsel-aql-01: + address: 141.170.6.152 + parents: gw-aql + hostgroups: computers, buildd, jessie, hassrvfs, hasbootfs, sw-raid + mipsel-aql-02: + address: 141.170.6.153 + parents: gw-aql + hostgroups: computers, buildd, jessie, hassrvfs, hasbootfs, sw-raid + # }}} # {{{ gw-arm abel: address: 217.140.96.56 @@ -243,6 +269,10 @@ servers: address: 217.140.96.71 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd, broken_mq + ia64-arm-01: + address: 217.140.96.61 + parents: gw-arm + hostgroups: computers, hasbootfs, hassrvfs, wheezy, buildd, broken_mq, sw-raid, acpid-hosts # }}} # {{{ gw-brown franck: @@ -345,11 +375,7 @@ servers: coccia: address: 5.153.231.11 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, wheezy, autofs, nfs-client, uploadqueue, xinetd-hosts - backuphost: - address: 5.153.231.12 - parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, wheezy + hostgroups: computers, hassrvfs, kvmdomains, wheezy, autofs, nfs-client, uploadqueue, xinetd-hosts, apache-https, apache2-hosts philp: address: 5.153.231.13 parents: ganeti-bytemark @@ -432,6 +458,10 @@ servers: address: 5.153.231.35 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts + lindsay: + address: 5.153.231.36 + parents: ganeti-bytemark + hostgroups: computers, service, kvmdomains, jessie # }}} # {{{ gw-c3sl santoro: @@ -534,7 +564,7 @@ servers: rautavaara: address: 194.177.211.199 parents: gw-grnet - hostgroups: computers, acpid-hosts, megaraid, service, squeeze, nfs-server + hostgroups: computers, acpid-hosts, megaraid, service, wheezy loghost-grnet-01: address: 194.177.211.200 parents: gw-grnet @@ -642,10 +672,6 @@ servers: address: 82.195.75.99 parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hasvarlogfs - rem: - address: 82.195.75.68 - parents: gw-man-da - hostgroups: computers, hasbootfs, hassrvfs, wheezy, no-bacula draghi: address: 82.195.75.106 parents: ganeti3 @@ -686,6 +712,10 @@ servers: address: 82.195.75.92 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy + wolkenstein: + address: 82.195.75.65 + parents: ganeti3 + hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, rsyncd-hosts, apache2-hosts, wheezy mipsel-manda-01: address: 82.195.75.72 parents: gw-man-da @@ -756,7 +786,7 @@ servers: sibelius: address: 193.62.202.28 parents: gw-sanger - hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, squeeze, rsyncd-hosts, xinetd-hosts, hasvarlogfs + hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, wheezy, rsyncd-hosts, xinetd-hosts, hasvarlogfs contacts: tjrc1, dave smetana: address: 193.62.202.29 @@ -847,10 +877,6 @@ servers: address: 206.12.19.118 parents: ganeti2 hostgroups: computers, general, apache2-hosts, hasbootfs, kvmdomains, apache-https, wheezy - wolkenstein: - address: 206.12.19.116 - parents: ganeti2 - hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, rsyncd-hosts, apache2-hosts, wheezy brahms: address: 206.12.19.115 parents: ganeti2 @@ -995,9 +1021,13 @@ servers: address: 143.106.167.145 parents: gw-unicamp hostgroups: layer3-infrastructure + prokofiev: + address: 143.106.167.147 + parents: gw-unicamp + hostgroups: computers, jessie, acpid-hosts, service powerpc-unicamp-01: address: 143.106.167.149 - parents: asgard + parents: prokofiev hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy # }}} # {{{ gw-utwente @@ -1019,11 +1049,15 @@ servers: hostgroups: secondary-IPs # }}} # {{{ gw-ynic - howells: + henze: + address: 144.32.168.74 + parents: gw-ynic + hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd + hasse: address: 144.32.168.75 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd - hummel: + antheil: address: 144.32.168.76 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd @@ -1058,6 +1092,11 @@ servers: parents: gw-zivit hostgroups: computers, porterbox, hassrvfs, wheezy # }}} + # {{{ gw-sakura + setoguchi: + address: 133.242.99.74 + parents: gw-sakura + hostgroups: computers, service, wheezy # }}} # {{{ ############################# host groups ############################# @@ -1145,6 +1184,8 @@ hostgroups: alias: Hosts running squeeze wheezy: alias: Hosts running wheezy + jessie: + alias: Hosts running jessie kvmdomains: alias: Hosts that are KVM domains @@ -1352,7 +1393,7 @@ services: - name: disk usage - all servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs 95 98" + nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs -x /srv/farm-snapshot/farm-misc 95 98" hosts: sibelius - @@ -1416,9 +1457,24 @@ services: nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org" hosts: sibelius - - name: disk usage on /srv/farm-snapshot/farm-misc + name: disk usage on /srv/farm-snapshot/farm-1 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-1" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-2 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-3 + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-3" + hosts: sibelius + - + name: disk usage on /srv/farm-snapshot/farm-4 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-misc" + nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-4" hosts: sibelius - name: disk usage on /var/lib/postgresql/9.1 @@ -1506,6 +1562,12 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C getty -a /sbin/getty" hostgroups: computers excludehosts: zelenka, zandonai + excludehostgroups: jessie + - + name: process - getty + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C agetty -a /sbin/agetty" + hostgroups: computers + hostgroups: jessie - name: processes - zombies nrpe: "/usr/lib/nagios/plugins/check_procs 5 10 -s Z" @@ -1529,7 +1591,7 @@ services: servicegroups: backup nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-dabackup" hostgroups: computers - excludehosts: backuphost + excludehosts: storace normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1537,7 +1599,7 @@ services: name: backup server config servicegroups: backup nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" - hosts: backuphost + hosts: storace normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1606,7 +1668,12 @@ services: name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers - excludehostgroups: freebsd, sparc + excludehostgroups: freebsd, sparc, jessie + - + name: process - ulogd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u ulog -C ulogd -a '/usr/sbin/ulogd --daemon --uid ulog'" + hostgroups: jessie + excludehostgroups: freebsd - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" @@ -1702,7 +1769,7 @@ services: - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" - hostgroups: wheezy + hostgroups: wheezy, jessie excludehostgroups: freebsd - name: network service - munin-node @@ -1750,7 +1817,7 @@ services: name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" hostgroups: computers - excludehostgroups: squeeze, alioth + excludehostgroups: squeeze, alioth, jessie ### - name: MQ connection on rainier @@ -1791,7 +1858,11 @@ services: name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers - excludehostgroups: freebsd + excludehostgroups: freebsd, jessie + - + name: process - udevd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C systemd-udevd -a '/lib/systemd/systemd-udevd'" + hostgroups: jessie - name: unexpected process - udev nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" @@ -1820,7 +1891,7 @@ services: - name: process - stunnel4 - puppet-ekeyd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'" - hostgroups: squeeze, wheezy + hostgroups: squeeze, wheezy, jessie excludehostgroups: freebsd, alioth # }}} # {{{ anti-services @@ -1866,16 +1937,15 @@ services: - name: process - mdadm monitor servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /var/run/mdadm/monitor.pid --daemonise --scan'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" hostgroups: sw-raid - excludehostgroups: wheezy + excludehostgroups: jessie - - # wheezy: name: process - mdadm monitor servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --scan'" hostgroups: sw-raid - excludehostgroups: squeeze + hostgroups: jessie - name: RAID - sw raid servicegroups: raid @@ -2295,7 +2365,7 @@ services: - name: postgresql backups nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg" - hosts: backuphost + hosts: storace # }}} # {{{ power # - @@ -2594,6 +2664,17 @@ services: hosts: gombert contact_groups: gobby #### + - + name: network service - sip-tls cert - 443 + check: dsa_check_cert!443 + normal_check_interval: 60 + hosts: vogler + - + name: network service - sip-tls cert - 5061 + check: dsa_check_cert!5061 + normal_check_interval: 60 + hosts: vogler + #### - name: puppetmaster cert nrpe: "/usr/lib/nagios/plugins/dsa-check-cert-expire /var/lib/puppet/ssl/certs/ca.pem"