X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=nagios-master.cfg;h=967b4d884459dc04b88e6884ca318bd3baf34194;hb=a0364d5c6999b2c7b87de612b8e6293faacb42f2;hp=b7f31d19e02caf986922a3fafae89c28de8c1669;hpb=0a96a722f6153c179f5fdbbcc21e59bad396371d;p=mirror%2Fdsa-nagios.git diff --git a/nagios-master.cfg b/nagios-master.cfg index b7f31d1..967b4d8 100644 --- a/nagios-master.cfg +++ b/nagios-master.cfg @@ -15,14 +15,11 @@ # - verdi: pg upgrade, openvpn # - mundy: salinfo_decode # - puccini: mailgraph -# - lebrun: ippl # down: -# - ravel # - sarti # - goedel # - leisner -# - schulz --- ############################# @@ -88,10 +85,6 @@ servers: parents: gw-HP-ftc hostgroups: routing-infrastructure contacts: tjrc1 - gw-cst: - address: 213.188.99.215 - parents: gw-HP-ftc - hostgroups: routing-infrastructure gw-lrz: address: 129.187.0.150 parents: gw-HP-ftc @@ -193,7 +186,7 @@ servers: bartok: address: 82.195.75.91 parents: gw-man-da - hostgroups: computers, service, syslog-ng-hosts, postfix-hosts, dl385 + hostgroups: computers, service, syslog-ng-hosts, postfix-hosts, dl385, bind9-hosts contacts: joerg, bzed morales: address: 82.195.75.97 @@ -220,6 +213,11 @@ servers: parents: gw-man-da hostgroups: computers, service, apache2-hosts, bind9-hosts, postfix-hosts, heavy-postfix, amavis-hosts, dl385 contacts: bzed + auber: + address: 82.195.75.101 + parents: gw-man-da + hostgroups: computers, buildd, sw-raid + contacts: bzed master: address: 70.103.162.29 @@ -268,11 +266,11 @@ servers: steffani: address: 128.31.0.36 parents: gw-mit-csail - hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, sw-raid - casals: - address: 128.31.0.16 + hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, sw-raid, bind9-hosts + mahler: + address: 128.31.0.46 parents: gw-mit-csail - hostgroups: deadslow + hostgroups: computers, single-cpu, lenny, porterbox, rsyslog-hosts klecker: address: 194.109.137.218 @@ -307,19 +305,16 @@ servers: albeniz: address: 193.62.202.27 parents: gw-sanger - hostgroups: computers, porterbox, sw-raid + # SMP kernel doesn't run stable + hostgroups: computers, porterbox, sw-raid, single-cpu contacts: tjrc1 goetz: address: 193.62.202.26 parents: gw-sanger - hostgroups: computers, buildd, sw-raid + # SMP kernel doesn't run stable + hostgroups: computers, buildd, sw-raid, single-cpu contacts: tjrc1 - escher: - address: 213.188.99.215 - parents: gw-cst - hostgroups: computers, porterbox, single-cpu - verdi: address: 192.54.42.193 parents: gw-lrz @@ -383,16 +378,24 @@ servers: parents: gw-ubc hostgroups: computers, buildd contacts: lfilipoz + ravel: + address: 137.82.84.43 + parents: gw-ubc + hostgroups: computers, general, dl385, apache2-hosts lebrun: address: 161.53.160.165 parents: gw-carnet hostgroups: computers, buildd + schroeder: + address: 161.53.160.164 + parents: gw-carnet + hostgroups: computers, buildd, sw-raid tartini: address: 82.94.249.158 parents: gw-telegraaf - hostgroups: computers, sw-raid + hostgroups: computers, sw-raid, apache2-hosts, mysql-hosts piatti: address: 193.167.161.225 @@ -461,6 +464,9 @@ hostgroups: syslog-ng-hosts: alias: hosts running syslog-ng instead of sysklogd private: 1 + rsyslog-hosts: + alias: hosts running rsyslogd instead of sysklogd + private: 1 postfix-hosts: alias: hosts running postfix instead of exim private: 1 @@ -494,6 +500,9 @@ hostgroups: postgres81-hosts: alias: hosts running postgres81 private: 1 + mysql-hosts: + alias: hosts running mysql + private: 1 highload: alias: "hosts on which high load is normal" @@ -520,9 +529,11 @@ servicegroups: alias: weak ssh keys apt: alias: apt upgrade status + samhain: + alias: samhain integrity status security: alias: security - servicegroup_members: apt, weaksshkeys, kernel + servicegroup_members: apt, weaksshkeys, kernel, samhain ############################# # services @@ -569,17 +580,17 @@ services: name: disk usage on /boot servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 85 /boot" - hosts: sperger, rietz, steffani, penalosa, peri, albeniz, escher, goetz, mayer, mayr, paer, spontini, tartini, morales + hosts: sperger, rietz, steffani, penalosa, peri, albeniz, goetz, mayer, mayr, paer, spontini, tartini, morales, ravel, auber, schroeder - name: disk usage on /var servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var" - hosts: bartok, samosa, raff, lobos, villa, gluck, saens, escher, voltaire, puccini, lebrun, tartini, morales + hosts: bartok, samosa, raff, lobos, villa, gluck, saens, voltaire, puccini, lebrun, tartini, morales - name: disk usage on /org servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /org" - hosts: sperger, samosa, raff, lobos, villa, steffani, saens, pergolesi, verdi, puccini, spontini + hosts: sperger, samosa, raff, lobos, villa, steffani, saens, pergolesi, verdi, puccini, spontini, ravel, mahler, schroeder - name: disk usage on /org servicegroups: diskspace @@ -589,7 +600,7 @@ services: name: disk usage on /srv servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv" - hosts: agricola, arcadelt, argento, allegri, tartini, morales + hosts: agricola, arcadelt, argento, allegri, tartini, morales, auber - name: disk usage on /org/scratch servicegroups: diskspace @@ -599,7 +610,7 @@ services: name: disk usage on /tmp servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp" - hosts: samosa, raff, gluck, saens, escher, puccini, merkel, tartini + hosts: samosa, raff, gluck, saens, puccini, merkel, tartini - name: disk usage on /usr servicegroups: diskspace @@ -609,7 +620,7 @@ services: name: disk usage on /home servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /home" - hosts: raptor, escher, voltaire, lebrun + hosts: raptor, voltaire, lebrun - name: disk usage on /home servicegroups: diskspace @@ -643,7 +654,8 @@ services: servicegroups: apt nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/apt" hostgroups: computers - normal_check_interval: 360 + normal_check_interval: 60 + retry_check_interval: 15 #### - name: backup @@ -662,6 +674,20 @@ services: normal_check_interval: 180 retry_check_interval: 5 + #### + - + name: process - samhain + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C samhain -a '/usr/sbin/samhain'" + hostgroups: computers + - + name: samhain + servicegroups: samhain + nrpe: "/usr/lib/nagios/plugins/dsa-check-samhain" + hostgroups: computers + depends: process - samhain + normal_check_interval: 240 + retry_check_interval: 5 + #### - name: users @@ -739,7 +765,7 @@ services: - name: "network service - sshd - version" - check: "dsa_check_ssh_port_version!22!OpenSSH_4.3p2 Debian-9etch2" + check: "dsa_check_ssh_port_version!22!OpenSSH_4.3p2 Debian-9etch3" depends: network service - sshd hostgroups: computers, deadslow excludehosts: agnesi, crest, kullervo @@ -753,13 +779,13 @@ services: normal_check_interval: 360 - name: "network service - sshd - version" - check: "dsa_check_ssh_port_version!22!OpenSSH_4.7p1 Debian-9" + check: "dsa_check_ssh_port_version!22!OpenSSH_5.1p1 Debian-2" depends: network service - sshd hostgroups: lenny normal_check_interval: 360 - name: "network service - sshd - version - 2260" - check: "dsa_check_ssh_port_version!2260!OpenSSH_4.3p2 Debian-9etch2" + check: "dsa_check_ssh_port_version!2260!OpenSSH_4.3p2 Debian-9etch3" depends: network service - sshd - 2260 hosts: agnesi normal_check_interval: 360 @@ -830,17 +856,22 @@ services: name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: syslog-ng-hosts + ### + - + name: process - rsyslogd + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rsyslogd -a '/usr/sbin/rsyslogd -c3'" + hostgroups: rsyslog-hosts ### - name: process - syslogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslogd -a '/sbin/syslogd'" hostgroups: computers - excludehostgroups: syslog-ng-hosts + excludehostgroups: syslog-ng-hosts, rsyslog-hosts - name: process - klogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C klogd -a '/sbin/klogd -x'" hostgroups: computers - excludehostgroups: syslog-ng-hosts + excludehostgroups: syslog-ng-hosts, rsyslog-hosts ### MAIL STUFF ### @@ -874,6 +905,10 @@ services: name: process - clamav - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --quiet'" hostgroups: heavy-exim, heavy-postfix + - + name: process - clamav - getsigs + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C getclamsigs -a 'getclamsigs'" + hostgroups: heavy-exim, heavy-postfix # - name: unwanted process - clamav @@ -885,6 +920,11 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix + - + name: unwanted process - clamav - getsigs + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C getclamsigs" + hostgroups: computers + excludehostgroups: heavy-exim, heavy-postfix ### - name: process - spamd - master @@ -1160,7 +1200,7 @@ services: - name: process - rngd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rngd -a '/usr/sbin/rngd -r /dev/hwrng'" - hosts: bartok + hostgroups: dl385 ### - name: process - sensord @@ -1194,6 +1234,7 @@ services: name: HW - hpacucli status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli" + normal_check_interval: 120 hostgroups: dl385, dl380, dl360 ### - @@ -1223,7 +1264,7 @@ services: - name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C udevd -a 'udevd'" - hosts: sperger, ries, steffani, merkel, spohr, peri, penalosa, albeniz, escher, verdi, liszt, kassia, agricola, arcadelt, argento, allegri, morales + hosts: sperger, ries, steffani, merkel, spohr, peri, penalosa, albeniz, verdi, liszt, kassia, agricola, arcadelt, argento, allegri, morales, bartok, schroeder ### - name: process - acpid @@ -1354,7 +1395,7 @@ services: - name: process - debianqueued nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u dak -C debianqueued" - hosts: ries + hosts: ries, ravel ### - @@ -1376,21 +1417,31 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats collector process'" hostgroups: postgres81-hosts depends: process - postresql81 - master - #### - - name: process - xenconsoled - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xenconsoled -a 'xenconsoled'" - hosts: piatti - - - name: process - xenstored - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xenstored -a '/usr/lib/xen-3.0.3-1/bin/xenstored --pid-file /var/run/xenstore.pid'" - hosts: piatti + name: process - mysql - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C mysqld_safe -a '/bin/sh /usr/bin/mysqld_safe'" + hostgroups: mysql-hosts - - name: process - xend - nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C python -a 'python /usr/lib/xen-3.0.3-1/bin/xend start'" - hosts: piatti + name: process - mysql - workers + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u mysql -C mysqld -a /usr/sbin/mysqld" + hostgroups: mysql-hosts + depends: process - mysql - master + #### + #- + # name: process - xenconsoled + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xenconsoled -a 'xenconsoled'" + # hosts: piatti + #- + # name: process - xenstored + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xenstored -a '/usr/lib/xen-3.0.3-1/bin/xenstored --pid-file /var/run/xenstore.pid'" + # hosts: piatti + #- + # name: process - xend + # nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C python -a 'python /usr/lib/xen-3.0.3-1/bin/xend start'" + # hosts: piatti +# #### # XXX is this needed? -