X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=nagios-master.cfg;h=6e6c708c66905c27c6061ff1e71688cebb3b0c1a;hb=ecb76b28a06c9a1e6b324bb026ffb8032c54f9e4;hp=ee15b1ccb4681734579b68a5eb6f86d7547aa23f;hpb=80b8e8429a1c31da2d488cab19520ca22d18970a;p=mirror%2Fdsa-nagios.git diff --git a/nagios-master.cfg b/nagios-master.cfg index ee15b1c..6e6c708 100644 --- a/nagios-master.cfg +++ b/nagios-master.cfg @@ -14,7 +14,6 @@ # - goetz: gmond/gmetad # - verdi: pg upgrade, openvpn # - mundy: salinfo_decode -# - puccini: mailgraph # down: # - sarti @@ -140,26 +139,30 @@ servers: parents: gw-HP-ftc hostgroups: routing-infrastructure contacts: holger + gw-telefonica: + address: 195.71.99.193 + parents: gw-HP-ftc + hostgroups: routing-infrastructure samosa: address: 192.25.206.57 - hostgroups: computers, service, dl380, apache2-hosts, bind9-hosts, heavy-exim + hostgroups: computers, no-udev, service, dl380, apache2-hosts, bind9-hosts, heavy-exim raff: address: 192.25.206.59 parents: samosa - hostgroups: computers, service, dl380, apache1-hosts, bind9-hosts, rsyncd-hosts, heavy-exim + hostgroups: computers, no-udev, service, dl380, apache1-hosts, bind9-hosts, rsyncd-hosts, heavy-exim, ulogd-hosts, nfs-client gluck: address: 192.25.206.10 parents: samosa - hostgroups: computers, general, dl380, apache1-hosts, bind9-hosts, rsyncd-hosts, heavy-exim, highload + hostgroups: computers, no-udev, general, dl380, apache1-hosts, bind9-hosts, heavy-exim, highload, nfs-client, ulogd-hosts merkel: address: 192.25.206.16 parents: samosa - hostgroups: computers, general, apache1-hosts, bind9-hosts, rsyncd-hosts, sw-raid, postgres81-hosts, heavy-exim + hostgroups: computers, general, apache1-hosts, bind9-hosts, rsyncd-hosts, sw-raid, postgres81-hosts, heavy-exim, nfs-client, ulogd-hosts spohr: address: 192.25.206.33 parents: samosa - hostgroups: computers, service, dl380, apache2-hosts, postgres81-hosts + hostgroups: computers, service, dl380, apache2-hosts, postgres81-hosts, ulogd-hosts, nfs-server peri: address: 192.25.206.15 parents: samosa @@ -173,15 +176,15 @@ servers: mundy: address: 192.25.206.62 parents: samosa - hostgroups: computers, buildd + hostgroups: computers, no-udev, buildd paer: address: 192.25.206.11 parents: samosa - hostgroups: computers, porterbox, bind9-hosts + hostgroups: computers, porterbox, bind9-hosts, single-cpu merulo: address: 192.25.206.58 parents: samosa - hostgroups: computers, porterbox + hostgroups: computers, no-udev, porterbox bartok: address: 82.195.75.91 @@ -201,46 +204,46 @@ servers: agricola: address: 82.195.75.86 parents: gw-man-da - hostgroups: computers, porterbox, sw-raid, single-cpu, lenny + hostgroups: computers, porterbox, sw-raid, single-cpu, lenny, no-samhain contacts: bzed arcadelt: address: 82.195.75.87 parents: gw-man-da - hostgroups: computers, buildd, sw-raid, single-cpu, lenny + hostgroups: computers, buildd, sw-raid, single-cpu, lenny, no-samhain contacts: bzed liszt: address: 82.195.75.100 parents: gw-man-da - hostgroups: computers, service, apache2-hosts, bind9-hosts, postfix-hosts, heavy-postfix, amavis-hosts, dl385 - contacts: bzed - auber: - address: 82.195.75.101 - parents: gw-man-da - hostgroups: computers, buildd, sw-raid + hostgroups: computers, service, apache2-hosts, bind9-hosts, postfix-hosts, heavy-postfix, amavis-hosts, dl385, acpid-hosts contacts: bzed +# auber: +# address: 82.195.75.101 +# parents: gw-man-da +# hostgroups: computers, no-udev, buildd, sw-raid +# contacts: bzed master: address: 70.103.162.29 parents: gw-brainfood - hostgroups: computers, general, apache2-hosts, bind9-hosts, heavy-exim, highload + hostgroups: computers, no-udev, general, apache2-hosts, bind9-hosts, heavy-exim, highload murphy: address: 70.103.162.31 parents: gw-brainfood - hostgroups: computers, general, apache2-hosts, bind9-hosts, postfix-hosts, dl380 + hostgroups: computers, general, postfix-hosts, dl380, acpid-hosts ries: address: 128.148.34.103 parents: gw-brown.edu - hostgroups: computers, service, apache2-hosts, bind9-hosts, ftpd-hosts, dl385, rsyncd-hosts, postgres81-hosts, heavy-exim + hostgroups: computers, service, apache2-hosts, bind9-hosts, ftpd-hosts, dl385, rsyncd-hosts, postgres81-hosts, heavy-exim, acpid-hosts mayer: address: 140.211.166.78 parents: gw-osuosl - hostgroups: computers, buildd + hostgroups: computers, no-udev, buildd mayr: address: 140.211.166.58 parents: gw-osuosl - hostgroups: computers, buildd + hostgroups: computers, no-udev, buildd malo: address: 140.211.166.27 parents: gw-osuosl @@ -248,7 +251,7 @@ servers: rietz: address: 140.211.166.43 parents: gw-osuosl - hostgroups: computers, service, apache2-hosts, bind9-hosts, rsyncd-hosts, dl385, heavy-exim, highload + hostgroups: computers, no-udev, service, apache2-hosts, bind9-hosts, rsyncd-hosts, dl385, heavy-exim, highload rietz2: address: 140.211.166.44 parents: rietz @@ -266,7 +269,7 @@ servers: steffani: address: 128.31.0.36 parents: gw-mit-csail - hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, sw-raid, bind9-hosts + hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, sw-raid, bind9-hosts, acpid-hosts mahler: address: 128.31.0.46 parents: gw-mit-csail @@ -280,22 +283,22 @@ servers: saens: address: 128.101.240.212 parents: gw-umn.edu - hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl380, heavy-exim + hostgroups: computers, no-udev, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl380, heavy-exim argento: address: 195.49.152.174 parents: gw-dg-i.net - hostgroups: computers, buildd, sw-raid, single-cpu, lenny + hostgroups: computers, buildd, sw-raid, single-cpu, lenny, no-samhain contacts: bzed pergolesi: address: 62.104.23.252 parents: gw-freenet - hostgroups: computers, porterbox, sw-raid + hostgroups: computers, no-udev, porterbox, sw-raid bruckner: address: 62.104.23.253 parents: gw-freenet - hostgroups: computers, porterbox, single-cpu + hostgroups: computers, no-udev, porterbox, single-cpu, deadslow raptor: address: 195.243.109.162 @@ -314,6 +317,11 @@ servers: # SMP kernel doesn't run stable hostgroups: computers, buildd, sw-raid, single-cpu contacts: tjrc1 + smetana: + address: 193.62.202.29 + parents: gw-sanger + hostgroups: computers, porterbox, sw-raid + contacts: tjrc1 verdi: address: 192.54.42.193 @@ -329,18 +337,18 @@ servers: puccini: address: 87.106.4.56 parents: gw-1und1 - hostgroups: computers, service, apache2-hosts, bind9-hosts, postfix-hosts, heavy-postfix, amavis-hosts + hostgroups: computers, buildd contacts: joerg powell: address: 87.106.64.223 parents: gw-1und1 - hostgroups: computers, service, heavy-exim + hostgroups: computers, service, heavy-exim, rsyncd-hosts, ulogd-hosts, acpid-hosts contacts: joerg caballero: address: 193.201.200.200 parents: gw-blackcat - hostgroups: computers, buildd, sw-raid, bind9-hosts + hostgroups: computers, no-udev, buildd, sw-raid, bind9-hosts elara: address: 67.210.160.90 @@ -365,12 +373,12 @@ servers: kassia: address: 130.89.175.54 parents: gw-utwente - hostgroups: computers, service, postfix-hosts, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl360 + hostgroups: computers, service, postfix-hosts, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl360, acpid-hosts allegri: address: 157.193.39.233 parents: gw-HP-ftc - hostgroups: computers, buildd, postfix-hosts, sw-raid, single-cpu, lenny + hostgroups: computers, buildd, postfix-hosts, sw-raid, single-cpu, lenny, no-samhain contacts: luk agnesi: @@ -386,7 +394,7 @@ servers: ravel: address: 137.82.84.43 parents: gw-ubc - hostgroups: computers, general, dl385, apache2-hosts + hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts lebrun: address: 193.198.184.10 @@ -405,9 +413,14 @@ servers: piatti: address: 193.167.161.225 parents: gw-helsinki - hostgroups: computers, postfix-hosts, dl385 + hostgroups: computers, postfix-hosts, dl385, ulogd-hosts, acpid-hosts contacts: holger + rem: + address: 195.71.99.217 + parents: gw-helsinki + hostgroups: computers, buildd + ############################# # host groups # @@ -466,6 +479,10 @@ hostgroups: alias: Hosts running lenny, not etch private: 1 + no-samhain: + alias: hosts not running samhain properly + private: 1 + syslog-ng-hosts: alias: hosts running syslog-ng instead of sysklogd private: 1 @@ -476,7 +493,7 @@ hostgroups: alias: hosts running postfix instead of exim private: 1 heavy-exim: - alias: "hosts running the full mail stuff, including clamav, SA, and greylistd" + alias: "hosts running the full mail stuff, including clamav, SA, and postgrey" private: 1 heavy-postfix: alias: "postfix hosts running the full mail stuff, including clamav, SA, postgrey, policyd-weight" @@ -508,6 +525,22 @@ hostgroups: mysql-hosts: alias: hosts running mysql private: 1 + no-udev: + alias: hosts not using udev + private: 1 + ulogd-hosts: + alias: hosts running ulogd + private: 1 + acpid-hosts: + alias: hosts running acpid + private: 1 + + nfs-client: + alias: hosts mounting filesystems using NFS + private: 1 + nfs-server: + alias: hosts serving filesystems using NFS + private: 1 highload: alias: "hosts on which high load is normal" @@ -585,7 +618,7 @@ services: name: disk usage on /boot servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 85 /boot" - hosts: sperger, rietz, steffani, penalosa, peri, albeniz, goetz, mayer, mayr, paer, spontini, tartini, morales, ravel, auber, schroeder, piatti + hosts: sperger, rietz, steffani, penalosa, peri, albeniz, goetz, mayer, mayr, paer, spontini, tartini, morales, ravel, schroeder, piatti, rem - name: disk usage on /var servicegroups: diskspace @@ -605,7 +638,7 @@ services: name: disk usage on /srv servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv" - hosts: agricola, arcadelt, argento, allegri, tartini, morales, auber, powell + hosts: agricola, arcadelt, argento, allegri, tartini, morales, powell - name: disk usage on /org/scratch servicegroups: diskspace @@ -615,7 +648,7 @@ services: name: disk usage on /tmp servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp" - hosts: samosa, raff, gluck, saens, puccini, merkel, tartini, powell + hosts: samosa, raff, gluck, saens, puccini, merkel, tartini, powell, piatti - name: disk usage on /usr servicegroups: diskspace @@ -625,7 +658,7 @@ services: name: disk usage on /home servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /home" - hosts: raptor, voltaire, lebrun + hosts: raptor, voltaire, lebrun, rem - name: disk usage on /home servicegroups: diskspace @@ -691,11 +724,13 @@ services: name: process - samhain nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C samhain -a '/usr/sbin/samhain'" hostgroups: computers + excludehostgroups: no-samhain - name: samhain servicegroups: samhain - nrpe: "/usr/lib/nagios/plugins/dsa-check-samhain" + nrpe: "/usr/lib/nagios/plugins/dsa-check-samhain -t 45" hostgroups: computers + excludehostgroups: no-samhain depends: process - samhain normal_check_interval: 240 retry_check_interval: 5 @@ -791,7 +826,7 @@ services: normal_check_interval: 360 - name: "network service - sshd - version" - check: "dsa_check_ssh_port_version!22!OpenSSH_5.1p1 Debian-2" + check: "dsa_check_ssh_port_version!22!OpenSSH_5.1p1 Debian-3" depends: network service - sshd hostgroups: lenny normal_check_interval: 360 @@ -976,18 +1011,21 @@ services: hosts: merkel, raff ### - - - name: process - greylistd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u greylist -C greylistd -a '/usr/bin/python /usr/sbin/greylistd'" - hostgroups: heavy-exim + #- + # name: process - greylistd + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u greylist -C greylistd -a '/usr/bin/python /usr/sbin/greylistd'" + # hostgroups: heavy-exim # - name: unwanted process - greylistd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C greylistd" hostgroups: computers - excludehostgroups: heavy-exim ### + - + name: process - postgrey + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -C postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --unix=/var/run/postgrey/socket --retry-window=4 --auto-whitelist-clients=10 --exim'" + hostgroups: heavy-exim - name: process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -C postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" @@ -997,7 +1035,7 @@ services: name: unwanted process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C postgrey" hostgroups: computers - excludehostgroups: heavy-postfix + excludehostgroups: heavy-postfix, heavy-exim ### - name: process - amavis - master @@ -1191,10 +1229,12 @@ services: name: unwanted process - portmap nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C portmap" hostgroups: computers + excludehostgroups: nfs-client, nfs-server - name: unwanted process - rpc.statd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C rpc.statd" hostgroups: computers + excludehostgroups: nfs-client, nfs-server - name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" @@ -1278,28 +1318,48 @@ services: name: process - slapd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:20 -c 1:50 -u openldap -C slapd -a '/usr/sbin/slapd -h ldap:/// ldaps:/// -g openldap -u openldap'" hosts: samosa + ### + - + name: process - ulogd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" + hostgroups: ulogd-hosts + - + name: unexpected process - ulogd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" + hostgroups: computers + excludehostgroups: ulogd-hosts ### - name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C udevd -a 'udevd'" - hosts: sperger, ries, steffani, merkel, spohr, peri, penalosa, albeniz, verdi, liszt, kassia, agricola, arcadelt, argento, allegri, morales, bartok, schroeder + hostgroups: computers + excludehostgroups: no-udev + - + name: unexpected process - udev + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" + hostgroups: no-udev ### - name: process - acpid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C acpid -a '/usr/sbin/acpid -c /etc/acpi/events -s /var/run/acpid.socket'" - hosts: ries, steffani, liszt, kassia + hostgroups: acpid-hosts + - + name: unexpected process - acpid + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C acpid" + hostgroups: computers + excludehostgroups: acpid-hosts ### - name: process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xinetd -a '/usr/sbin/xinetd -pidfile /var/run/xinetd.pid -stayalive'" - hosts: samosa, raptor, allegri + hosts: samosa, raptor, allegri, gluck hostgroups: rsyncd-hosts - name: unwanted process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C xinetd" hostgroups: computers - excludehosts: samosa, raptor, allegri + excludehosts: samosa, raptor, allegri, gluck excludehostgroups: rsyncd-hosts ### - @@ -1495,3 +1555,36 @@ services: name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C monit -a '/usr/sbin/monit -d 30 -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" hosts: villa, lobos, steffani, kassia, master + + ############ NFS Stuff ############ + #### + - + name: process - portmap + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C portmap -a '/sbin/portmap'" + hostgroups: nfs-client, nfs-server + - + name: process - statd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u statd -C rpc.statd -a '/sbin/rpc.statd'" + hostgroups: nfs-client, nfs-server + - + name: process - nfsd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u root -C nfsd -a '[nfsd]'" + hostgroups: nfs-server + - + name: process - lockd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C lockd -a '[lockd]'" + hostgroups: nfs-server + - + name: process - mountd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rpc.mountd -a '/sbin/rpc.mountd'" + hostgroups: nfs-server + # see if the nfs stuff works and doesn't hang. + # the df check all script will also hang, but we don't appear to pay attention to that + - + name: nfs mount ftp archive + nrpe: "/usr/lib/nagios/plugins/check_disk 100 100 /home/org/ftp.root/debian" + hosts: gluck + - + name: nfs mount ftp archive + nrpe: "/usr/lib/nagios/plugins/check_disk 100 100 /org/mirrors/ftp.debian.org/ftp" + hosts: merkel, raff