X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=a503959b5a1d33d6f246c497ce5c3ef405d9b23e;hb=1e8ddf89706b8afa4fd60eed434c4e3f36043ccf;hp=15ff20a2d2d9650abac4b171e18e1514aa34a7c0;hpb=5a95548e0faa2563c882adae3b10494707485018;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 15ff20a..a503959 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -10,7 +10,6 @@ # - *: check munin stats collection works # - *: check backups are successful # - *: unwanted: network: auth, discard, daytime, time (on some), cvs-pserver, rsync (on some), ftp (on some), http (on some) -# - verdi: pg upgrade, openvpn # - mundy: salinfo_decode # down: @@ -27,6 +26,11 @@ servers: parents: gw-HP-ftc hostgroups: routing-infrastructure contacts: joerg, bzed + gw-man-da2: + address: 82.195.75.46 + parents: gw-man-da + hostgroups: routing-infrastructure + contacts: joerg, bzed gw-HP-ftc: address: 192.25.206.1 parents: spohr @@ -160,6 +164,10 @@ servers: address: 193.191.17.50 parents: gw-HP-ftc hostgroups: routing-infrastructure + gw-anu: + address: 150.203.164.38 + parents: gw-HP-ftc + hostgroups: routing-infrastructure global: hostgroups: notacomputer @@ -169,15 +177,11 @@ servers: samosa: address: 192.25.206.57 parents: spohr - hostgroups: computers, service, dl380, lenny, hassrvfs, hasbootfs, acpid-hosts, ulogd-hosts + hostgroups: computers, service, dl380, lenny, hassrvfs, hasbootfs, acpid-hosts, ulogd-hosts, nfs-client raff: address: 192.25.206.59 parents: spohr hostgroups: computers, no-udev, service, dl380, apache2-hosts, bind9-hosts, rsyncd-hosts, heavy-exim, ulogd-hosts, nfs-client, lenny, hasvarfs, hasusrfs - gluck: - address: 192.25.206.10 - parents: spohr - hostgroups: computers, no-udev, general, dl380, apache2-hosts, bind9-hosts, heavy-exim, highload, nfs-client, ulogd-hosts, lenny, hasvarfs, hasusrfs merkel: address: 192.25.206.16 parents: spohr @@ -188,7 +192,7 @@ servers: hostgroups: secondary-IPs spohr: address: 192.25.206.33 - hostgroups: computers, service, dl380, apache2-hosts, postgres83-hosts, ulogd-hosts, nfs-server, lenny, heavy-exim + hostgroups: computers, service, dl380, apache2-hosts, postgres83-hosts, ulogd-hosts, nfs-server, lenny, heavy-exim, bind9-hosts spohr2: address: 192.25.206.38 parents: spohr @@ -227,8 +231,8 @@ servers: # hostgroups: computers, porterbox, single-cpu, no-samhain, hasbootfs, hassrvfs, lenny, hasvarfs, hasusrfs # contacts: bzed sperger: - address: 82.195.75.98 - parents: gw-man-da + address: 82.195.75.34 + parents: gw-man-da2 hostgroups: computers, porterbox, sw-raid, hasbootfs, lenny contacts: bzed agricola: @@ -270,7 +274,11 @@ servers: kaufmann: address: 82.195.75.107 parents: unger - hostgroups: computers, service, lenny, hasbootfs, apache2-hosts, single-cpu + hostgroups: computers, service, lenny, hasbootfs, apache2-hosts, single-cpu, rsyncd-hosts + byrd: + address: 82.195.75.101 + parents: unger + hostgroups: computers, service, lenny, hasbootfs, hassrvfs master: address: 70.103.162.29 @@ -315,6 +323,10 @@ servers: address: 212.211.132.250 parents: gw-scanplus-lobos hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl380, lenny, hasvarfs, hasusrfs + gluck: + address: 150.203.164.38 + parents: gw-anu + hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, dl380, lenny, no-udev, hassrvfs, acpid-hosts steffani: address: 128.31.0.36 @@ -331,7 +343,7 @@ servers: senfl: address: 128.31.0.51 parents: gw-mit-csail - hostgroups: computers, service, lenny, dl360, acpid-hosts, hassrvfs, ulogd-hosts, apache2-hosts + hostgroups: computers, service, lenny, dl360, acpid-hosts, hassrvfs, ulogd-hosts, apache2-hosts, rsyncd-hosts carver: address: 128.31.0.50 parents: gw-mit-csail @@ -356,7 +368,7 @@ servers: widor: address: 93.94.130.161 parents: gw-dg-i.net - hostgroups: computers, apache2-hosts, sw-raid, single-cpu, lenny, acpid-hosts + hostgroups: computers, apache2-hosts, sw-raid, lenny, acpid-hosts contacts: bzed pergolesi: @@ -382,11 +394,6 @@ servers: hostgroups: computers, porterbox, sw-raid, lenny contacts: tjrc1 - verdi: - address: 192.54.42.193 - parents: gw-lrz - hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, postgres81-hosts, postfix-hosts - voltaire: address: 72.66.115.54 parents: gw-frost @@ -467,11 +474,15 @@ servers: ravel: address: 137.82.84.66 parents: gw-ubc - hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts, ftpd-hosts, hasbootfs, lenny, nfs-server + hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts, ftpd-hosts, hasbootfs, lenny, nfs-server, rsyncd-hosts dijkstra: address: 137.82.84.70 parents: gw-ubc hostgroups: computers, bl460, acpid-hosts, lenny + wolkenstein: + address: 137.82.84.89 + parents: dijkstra + hostgroups: computers, lenny, hasbootfs, hassrvfs brahms: address: 137.82.84.74 parents: dijkstra @@ -487,19 +498,23 @@ servers: valente: address: 137.82.84.76 parents: dijkstra - hostgroups: computers, lenny, hasbootfs, single-cpu + hostgroups: computers, lenny, hasbootfs, single-cpu, hassrvfs, postgres83-hosts, ftpd-hosts, rsyncd-hosts bellini: address: 137.82.84.79 parents: gw-ubc - hostgroups: computers, lenny, hasbootfs, nfs-client, hashomefs, hassrvfs, aacraid + hostgroups: computers, lenny, hasbootfs, nfs-client, hassrvfs, aacraid + morricone: + address: 137.82.84.81 + parents: gw-ubc + hostgroups: computers, lenny, hasbootfs, hassrvfs, aacraid, postgres83-hosts, ftpd-hosts, rsyncd-hosts stabile: address: 137.82.84.72 parents: gw-ubc - hostgroups: computers, lenny, hashomefs, sw-raid + hostgroups: computers, lenny, hashomefs, sw-raid, rsyncd-hosts cimarosa: address: 137.82.84.80 parents: gw-ubc - hostgroups: computers, lenny, hasbootfs, aacraid + hostgroups: computers, lenny, hasbootfs, aacraid, hassrvfs # MSA 2000 (2012i) giustini: address: 192.168.2.6 @@ -674,9 +689,9 @@ hostgroups: rsyncd-hosts: alias: hosts providing rsync services via xinetd private: 1 - postgres81-hosts: - alias: hosts running postgres81 - private: 1 + #postgres81-hosts: + # alias: hosts running postgres81 + # private: 1 postgres83-hosts: alias: hosts running postgres83 private: 1 @@ -813,7 +828,7 @@ services: name: disk usage on /org servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /org" - hosts: sperger, raff, lobos, villa, steffani, saens, pergolesi, verdi, spontini, ravel, mahler, schroeder, piatti, pescetti, widor, schein, lebrun + hosts: sperger, raff, lobos, villa, steffani, saens, pergolesi, spontini, ravel, mahler, schroeder, piatti, pescetti, widor, schein, lebrun - name: disk usage on /org servicegroups: diskspace @@ -833,7 +848,7 @@ services: name: disk usage on /tmp servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp" - hosts: raff, gluck, saens, puccini, merkel, tartini, powell, piatti, escher + hosts: raff, saens, puccini, merkel, tartini, powell, piatti, escher - name: disk usage on /usr servicegroups: diskspace @@ -844,11 +859,6 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /home" hostgroups: hashomefs - - - name: disk usage on /home - servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /home" - hosts: gluck - name: disk usage on /mnt/hdc servicegroups: diskspace @@ -920,15 +930,9 @@ services: retry_check_interval: 5 #### - - - name: process - puppet - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C ruby -a 'ruby /usr/sbin/puppetd -w 5 --factsync'" - hostgroups: lenny - excludehosts: agnesi - - name: puppet - nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -f /var/lib/puppet/state/state.yaml" + nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -i 540 -f /var/lib/puppet/state/state.yaml" hostgroups: lenny excludehosts: agnesi @@ -1017,11 +1021,6 @@ services: check: dsa_check_ssh_port!2260 hosts: agnesi normal_check_interval: 180 - - - name: "network service - sshd - 443" - check: dsa_check_ssh_port!443 - hosts: gluck - normal_check_interval: 180 - name: "network service - sshd - version" @@ -1120,11 +1119,11 @@ services: - name: process - syslogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslogd -a '/sbin/syslogd'" - hosts: rietz, verdi + hosts: rietz - name: process - klogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C klogd -a '/sbin/klogd -x'" - hosts: rietz, verdi + hosts: rietz ### MAIL STUFF ### @@ -1133,17 +1132,17 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, rietz, merkel, gluck + excludehosts: master, rietz, merkel - name: process - exim - total nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1: -C exim4" hostgroups: computers excludehostgroups: postfix-hosts - excludehosts: master, rietz, merkel, gluck + excludehosts: master, rietz, merkel - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:300 -c 1:500 -C exim4 -a '/usr/sbin/exim4'" - hosts: master, rietz, merkel, gluck + hosts: master, rietz, merkel ### - name: process - clamav - clamd @@ -1158,12 +1157,6 @@ services: name: process - clamav - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --quiet'" hostgroups: heavy-exim, heavy-postfix - - - name: process - clamav - getsigs - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C getclamsigs -a 'getclamsigs'" - hostgroups: heavy-exim, heavy-postfix - excludehosts: master, powell - # - name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" @@ -1174,13 +1167,6 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix - - - name: unwanted process - clamav - getsigs - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C getclamsigs" - hostgroups: computers - excludehostgroups: heavy-exim, heavy-postfix - hosts: master, powell - ### - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" @@ -1335,19 +1321,6 @@ services: hostgroups: postfix-hosts depends: process - postfix - master - - - name: process - postfix - smtpd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:40 -c 0:90 -u postfix -C smtpd -a 'smtpd -n smtp -t inet -u -c'" - hostgroups: postfix-hosts - excludehosts: liszt - depends: process - postfix - master - - - name: process - postfix - smtp - nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:10 -c 0:15 -u postfix -C smtp -a 'smtp -t unix -u -c'" - hostgroups: postfix-hosts - excludehosts: liszt - depends: process - postfix - master - - name: process - postfix - smtpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:150 -c 0:200 -u postfix -C smtpd -a 'smtpd -n smtp -t inet -u -c'" @@ -1371,7 +1344,6 @@ services: name: network service - smtp check: dsa_check_smtp hostgroups: postfix-hosts - excludehosts: verdi depends: process - postfix - master - name: network service - submission @@ -1383,11 +1355,6 @@ services: check: dsa_check_smtp_port!2025 hostgroups: incomingmailrelayed2025 depends: process - exim - - - name: network service - smtp - port 2025 - check: dsa_check_smtp_port!2025 - hosts: verdi - depends: process - postfix - master - name: network service local - smtps cert nrpe: "/usr/lib/nagios/plugins/check_http -H localhost -p 465 -S -C 14 -t 45" @@ -1449,6 +1416,7 @@ services: name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers + excludehosts: rietz - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" @@ -1503,12 +1471,6 @@ services: servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-areca" hosts: powell - ### - - - name: RAID - DAC960 - servicegroups: raid - nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-dac960" - hosts: verdi ### - name: RAID - aacraid @@ -1568,13 +1530,13 @@ services: - name: process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xinetd -a '/usr/sbin/xinetd -pidfile /var/run/xinetd.pid -stayalive'" - hosts: gluck, zelenka, ancina, draghi + hosts: zelenka, ancina, draghi hostgroups: rsyncd-hosts - name: unwanted process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C xinetd" hostgroups: computers - excludehosts: gluck, zelenka, ancina, draghi + excludehosts: zelenka, ancina, draghi excludehostgroups: rsyncd-hosts ### - @@ -1741,25 +1703,25 @@ services: hosts: ries, ravel, klecker ### - - - name: process - postresql81 - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a '/usr/lib/postgresql/8.1/bin/postmaster -D /var/lib/postgresql/8.1/main -c config_file=/etc/postgresql/8.1/main/postgresql.conf'" - hostgroups: postgres81-hosts - - - name: process - postresql81 - writer - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: writer process'" - hostgroups: postgres81-hosts - depends: process - postresql81 - master - - - name: process - postresql81 - buffer - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats buffer process'" - hostgroups: postgres81-hosts - depends: process - postresql81 - master - - - name: process - postresql81 - collector - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats collector process'" - hostgroups: postgres81-hosts - depends: process - postresql81 - master + #- + # name: process - postresql81 - master + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a '/usr/lib/postgresql/8.1/bin/postmaster -D /var/lib/postgresql/8.1/main -c config_file=/etc/postgresql/8.1/main/postgresql.conf'" + # hostgroups: postgres81-hosts + #- + # name: process - postresql81 - writer + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: writer process'" + # hostgroups: postgres81-hosts + # depends: process - postresql81 - master + #- + # name: process - postresql81 - buffer + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats buffer process'" + # hostgroups: postgres81-hosts + # depends: process - postresql81 - master + #- + # name: process - postresql81 - collector + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats collector process'" + # hostgroups: postgres81-hosts + # depends: process - postresql81 - master #### - name: process - postresql83 - master @@ -1867,10 +1829,6 @@ services: hostgroups: nfs-server # see if the nfs stuff works and doesn't hang. # the df check all script will also hang, but we don't appear to pay attention to that - - - name: nfs mount ftp archive - nrpe: "/usr/lib/nagios/plugins/check_disk 100 100 /home/org/ftp.root/debian" - hosts: gluck - name: nfs mount ftp archive nrpe: "/usr/lib/nagios/plugins/check_disk 100 100 /org/mirrors/ftp.debian.org/ftp" @@ -1888,16 +1846,15 @@ services: hosts: global - name: mirror sync - security - check: "dsa_check_mirrorsync!security.debian.org!project/trace/security-master.debian.org" - hosts: global - - - name: mirror sync - security.eu - check: "dsa_check_mirrorsync!security.eu.debian.org!project/trace/security-master.debian.org" + check: "dsa_check_mirrorsync!security-nagios.debian.org!project/trace/security-master.debian.org" hosts: global - - name: mirror sync - security.us - check: "dsa_check_mirrorsync!security.us.debian.org!project/trace/security-master.debian.org" + name: mirror sync - packages + check: "dsa_check_mirrorsync!packages.debian.org!Pics/.trace" hosts: global + normal_check_interval: 15 + max_check_attempts: 5 + retry_check_interval: 5 - name: DNS SOA sync - security.geo.debian.org check: "dsa_check_soas!security.geo.debian.org"