X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=46ec094607e4d7ebf7c1fce0a4bdf844525762b7;hb=501b27ce52e5c8c03d2459e34e06bd044d70376f;hp=e8414eeca61f9e24b4d90e80cfa1875396757c14;hpb=4a1d13bd462c41306f3c499ac22549e4cb354bdf;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index e8414ee..46ec094 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -152,10 +152,10 @@ servers: address: 130.239.18.97 parents: gw-ubc hostgroups: routing-infrastructure - gw-esiee: - address: 195.220.83.13 - parents: gw-ubc - hostgroups: routing-infrastructure +# gw-esiee: +# address: 195.220.83.13 +# parents: gw-ubc +# hostgroups: routing-infrastructure gw-ghent: address: 193.191.17.50 parents: gw-ubc @@ -282,11 +282,19 @@ servers: ball: address: 82.195.75.70 parents: gw-man-da - hostgroups: computers, buildd, no-udev, hasbootfs, ntpsuckers + hostgroups: computers, buildd, hasbootfs kokkonen: address: 82.195.75.97 parents: gw-man-da - hostgroups: computers, service, acpid-hosts, postgres84-hosts + hostgroups: computers, service, acpid-hosts, heavy-exim + byrd: + address: 82.195.75.92 + parents: unger + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze + lamb: + address: 82.195.75.101 + parents: unger + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa, bosserver master: address: 70.103.162.29 @@ -301,7 +309,7 @@ servers: ries: address: 128.148.34.103 parents: gw-brown.edu - hostgroups: computers, service, apache2-hosts, bind9-hosts, dl385, rsyncd-hosts, postgres83-hosts, spamd, heavy-exim, acpid-hosts, xinetd-hosts + hostgroups: computers, service, dl385, rsyncd-hosts, acpid-hosts, xinetd-hosts, hassrvfs franck: address: 128.148.34.3 @@ -319,7 +327,8 @@ servers: rietz: address: 140.211.166.43 parents: gw-osuosl - hostgroups: computers, service, rsyncd-hosts, dl385, hassrvfs, acpid-hosts, xinetd-hosts + hostgroups: computers, service, rsyncd-hosts, dl385, hassrvfs, acpid-hosts, xinetd-hosts, hasvicepa + #, bosserver rietz2: address: 140.211.166.44 parents: rietz @@ -539,7 +548,7 @@ servers: stabile: address: 206.12.19.13 parents: gw-ubc - hostgroups: computers, hashomefs, sw-raid, rsyncd-hosts, postgres84-hosts, apache2-hosts, xinetd-hosts, service + hostgroups: computers, hashomefs, sw-raid, rsyncd-hosts, postgres84-hosts, apache2-hosts, xinetd-hosts, service, nfs-server cimarosa: address: 206.12.19.8 parents: gw-ubc @@ -591,11 +600,27 @@ servers: salieri: address: 206.12.19.20 parents: tchaikovsky - hostgroups: computers, dl585, acpid-hosts, service + hostgroups: computers, dl585, acpid-hosts, service, squeeze traetta: address: 206.12.19.21 parents: tchaikovsky hostgroups: computers, dl585, acpid-hosts, service + schuetz: + address: 206.12.19.119 + parents: tchaikovsky + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze + locke: + address: 206.12.19.120 + parents: tchaikovsky + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa + lotti: + address: 206.12.19.121 + parents: tchaikovsky + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze + quantz: + address: 206.12.19.122 + parents: tchaikovsky + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs, nfs-client, xinetd-hosts, heavy-exim lebrun: address: 193.198.184.10 @@ -650,10 +675,10 @@ servers: parents: gw-aca hostgroups: computers, hasbootfs, aacraid, nfs-client, acpid-hosts, service - lafayette: - address: 147.215.7.160 - parents: gw-esiee - hostgroups: computers, buildd, sw-raid, hassrvfs, hasbootfs +# lafayette: +# address: 147.215.7.160 +# parents: gw-esiee +# hostgroups: computers, buildd, sw-raid, hassrvfs, hasbootfs grieg: address: 194.177.211.200 @@ -662,7 +687,7 @@ servers: rautavaara: address: 194.177.211.199 parents: gw-grnet - hostgroups: computers, acpid-hosts, megaraid, service + hostgroups: computers, acpid-hosts, megaraid, service, squeeze fasch: address: 194.177.211.201 parents: rautavaara @@ -699,7 +724,7 @@ servers: orff: address: 194.177.211.209 parents: gw-grnet - hostgroups: computers, acpid-hosts, bind9-hosts, mptraid, service + hostgroups: computers, acpid-hosts, bind9-hosts, mptraid, service, hassrvfs field: address: 194.177.211.210 parents: rautavaara @@ -903,6 +928,9 @@ hostgroups: uploadqueue: alias: hosts that are an anonymous ftp uploadqueue private: 1 + bosserver: + alias: hosts running bosserver + private: 1 nfs-client: alias: hosts mounting filesystems using NFS @@ -940,6 +968,9 @@ hostgroups: hasusrfs: alias: hosts with a /usr filesystem private: 1 + hasvicepa: + alias: hosts with a /vicepa + private: 1 incomingmailrelayed: alias: incoming mail needs to go through a mail relay @@ -1011,12 +1042,12 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /" hostgroups: computers - excludehosts: ries, klecker, kassia, spohr + excludehosts: klecker, kassia, spohr - name: disk usage on / servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 90 93 /" - hosts: ries, klecker, kassia, spohr + hosts: klecker, kassia, spohr - name: disk usage on /boot servicegroups: diskspace @@ -1082,7 +1113,7 @@ services: name: disk usage on /var/log servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/log" - hosts: busoni + hosts: busoni, wieck - name: disk usage on /srv/morgue.debian.org @@ -1102,7 +1133,7 @@ services: - name: disk usage on /srv/snapshot.debian.org servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv/snapshot.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org" hosts: stabile,sibelius - name: disk usage on /srv/farm-snapshot/farm-01 @@ -1144,6 +1175,11 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv/fossology.debian.net" hosts: vivaldi + - + name: disk usage on /vicepa + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /vicepa" + hostgroups: hasvicepa ############ All Computers ############ #### @@ -1166,7 +1202,7 @@ services: - name: backup server config nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" - hosts: bartok, beethoven + hosts: beethoven normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1180,6 +1216,35 @@ services: normal_check_interval: 60 retry_check_interval: 5 + #### + - name: afs - space + hostgroups: bosserver + nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-space -H localhost" + normal_check_interval: 60 + max_check_attempts: 2 + retry_check_interval: 5 + + - name: afs - bos + hostgroups: bosserver + nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-bos -H localhost" + normal_check_interval: 60 + max_check_attempts: 2 + retry_check_interval: 5 + + - name: afs - waiting connections + hostgroups: bosserver + nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-rxdebug -H localhost" + normal_check_interval: 60 + max_check_attempts: 2 + retry_check_interval: 5 + + #- name: afs - udebug + # hostgroups: bosserver + # nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-udebug -H localhost" + # normal_check_interval: 60 + # max_check_attempts: 2 + # retry_check_interval: 5 + #### - name: puppet @@ -1306,11 +1371,11 @@ services: name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C munin-node -a '/usr/sbin/munin-node'" hostgroups: computers - excludehostgroups: squeeze + excludehostgroups: freebsd - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" - hostgroups: squeeze + hostgroups: freebsd - name: network service - munin-node check: check_tcp!4949 @@ -1352,12 +1417,12 @@ services: name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers - excludehostgroups: squeeze + excludehostgroups: freebsd - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" - hostgroups: squeeze + hostgroups: freebsd - name: remote logging @@ -1371,17 +1436,17 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, busoni, merkel + excludehosts: master, busoni, merkel, quantz - name: process - exim - total nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1: -C exim4" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, busoni, merkel + excludehosts: master, busoni, merkel, quantz - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:300 -c 1:500 -C exim4 -a '/usr/sbin/exim4'" - hosts: master, busoni, merkel + hosts: master, busoni, merkel, quantz ### - name: process - clamav - clamd @@ -1645,7 +1710,7 @@ services: name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers - excludehosts: grieg + excludehosts: grieg, byrd - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" @@ -1703,6 +1768,12 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460 + - + name: HW - hpacucli enclosure status + servicegroups: raid + nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli-enclosure 1 1E:1" + normal_check_interval: 120 + hosts: franck - name: HW - hpacucli status servicegroups: raid @@ -1781,7 +1852,7 @@ services: ### - name: process - udevd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C udevd -a 'udevd'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers excludehostgroups: no-udev, freebsd - @@ -1798,12 +1869,17 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C acpid" hostgroups: computers excludehostgroups: acpid-hosts, kvmdomains + ### + - + name: process - bosserver + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C bosserver -a '/usr/sbin/bosserver'" + hostgroups: bosserver ### - name: process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C inetd -a '/usr/sbin/inetd'" - hosts: grieg + hosts: grieg, byrd ### - name: process - xinetd @@ -1885,7 +1961,7 @@ services: - name: network service - https check: check_https - hosts: ries, franck, chopin, draghi, liszt, spohr, widor, tchaikovsky, grieg, vivaldi + hosts: franck, chopin, draghi, liszt, spohr, widor, tchaikovsky, grieg, vivaldi depends: "process - apache2 - master" normal_check_interval: 120 - @@ -1900,7 +1976,7 @@ services: # liszt lists.debian.org # grieg buildd.debian.org # vivaldi fossology.debian.org - hosts: ries, franck, chopin, spohr, tchaikovsky, draghi, merkel2, liszt, widor, grieg, vivaldi + hosts: franck, chopin, spohr, tchaikovsky, draghi, merkel2, liszt, widor, grieg, vivaldi depends: network service - https normal_check_interval: 60 @@ -2032,6 +2108,46 @@ services: name: udd stunnel - master cert nrpe: "/usr/lib/nagios/plugins/check_http -H localhost -p 8080 -S -C 14 -t 45" hosts: samosa + #### + - + name: process - krb - kdc + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C kdc -a '/usr/lib/heimdal-servers/kdc --config-file=/etc/heimdal-kdc/kdc.conf'" + hosts: schuetz, byrd + - + name: process - krb - iprop - slave + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ipropd-slave -a '/usr/sbin/ipropd-slave byrd.debian.org'" + hosts: schuetz + - + name: process - krb - iprop - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ipropd-master -a '/usr/sbin/ipropd-master'" + hosts: byrd + - + name: process - krb - kpasswdd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C kpasswdd -a '/usr/lib/heimdal-servers/kpasswdd'" + hosts: byrd + ### + - + name: process - UPS - nut usbhid-ups - ups1 + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C usbhid-ups -a '/lib/nut/usbhid-ups -a ups1'" + hosts: franck + - + name: process - UPS - nut upsd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C upsd -a '/sbin/upsd'" + hosts: franck + - + name: process - UPS - nut upsmon master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C upsmon -a '/sbin/upsmon'" + hosts: franck + - + name: process - UPS - nut upsmon worker + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C upsmon -a '/sbin/upsmon'" + hosts: franck + depends: process - UPS - nut upsmon master + - + name: UPS - on line power + nrpe: "/usr/lib/nagios/plugins/dsa-check-ups" + hosts: franck + depends: process - UPS - nut upsd #### #- @@ -2054,11 +2170,19 @@ services: hosts: unger ### + - + name: process - buildd + servicegroups: buildd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'" + hosts: fano, fasch, field, finzi + contacts: luk, pkern, HE + - name: process - buildd servicegroups: buildd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'" hostgroups: buildd + excludehosts: fano, fasch, field, finzi contacts: luk, pkern, HE ### @@ -2133,7 +2257,7 @@ services: retry_check_interval: 5 - name: mirror sync - snapshot - check: "dsa_check_mirrorsync_skew!snapshot.debian.org!project/trace/snapshot-master.debian.org!1800:28800" + check: "dsa_check_mirrorsync_skew!snapshot.debian.org!project/trace/snapshot-master.debian.org!3600:28800" hosts: global normal_check_interval: 15 max_check_attempts: 5 @@ -2182,12 +2306,12 @@ services: name: DNS SEC - signature expiry hosts: global remotecheck: "/usr/lib/nagios/plugins/dsa-check-zone-rrsig-expiration-many --warn 20d --critical 7d --geozonedir /srv/dns.debian.org/geo/zones /srv/dns.debian.org/var/gitdns/domains" - runfrom: draghi + runfrom: orff - name: DNS SEC - delegations hosts: global remotecheck: "/usr/lib/nagios/plugins/dsa-check-dnssec-delegation --dir /srv/dns.debian.org/var/gitdns/domains --dir /srv/dns.debian.org/geo/zones check-header" - runfrom: draghi + runfrom: orff ############ - @@ -2205,6 +2329,6 @@ services: hosts: giustini - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=789 $HOSTADDRESS$ public" + remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=952 $HOSTADDRESS$ public" runfrom: dijkstra hosts: giustini