X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=3c472051476c7fec4c31c9eb7c1c3a6bb5f27659;hb=5410d83bb5d20703ee786d2737a02542f7e64aa1;hp=a034d8afb81d8033ad86ef493c50e940a3d808b7;hpb=1fc3592ef98ff67ebe85a855437383918a661fff;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index a034d8a..3c47205 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -102,10 +102,6 @@ servers: # address: 157.193.39.254 # parents: gw-ubc # hostgroups: routing-infrastructure - gw-agnesi: - address: 65.173.90.22 - parents: gw-ubc - hostgroups: routing-infrastructure gw-ubc: address: 206.12.19.254 parents: tchaikovsky @@ -115,10 +111,6 @@ servers: address: 161.53.160.1 parents: gw-ubc hostgroups: routing-infrastructure - gw-telegraaf: - address: 82.94.249.153 - parents: gw-ubc - hostgroups: routing-infrastructure gw-telegraaf2: address: 217.196.40.15 parents: gw-ubc @@ -129,10 +121,6 @@ servers: parents: gw-ubc hostgroups: routing-infrastructure contacts: holger - gw-cst: - address: 213.157.2.23 - parents: gw-ubc - hostgroups: routing-infrastructure gw-isc: address: 149.20.20.1 parents: gw-ubc @@ -183,7 +171,7 @@ servers: parents: gw-ubc hostgroups: routing-infrastructure gw-conova: - address: 217.196.146.254 + address: 217.196.149.238 parents: gw-ubc hostgroups: routing-infrastructure @@ -208,14 +196,10 @@ servers: address: 192.25.206.57 parents: gw-HP-ftc hostgroups: computers, service, dl380, hassrvfs, hasbootfs, acpid-hosts, nfs-client, postgres90-hosts, xinetd-hosts, apache2-hosts, squeeze - raff: - address: 192.25.206.59 - parents: gw-HP-ftc - hostgroups: computers, service, dl380, hassrvfs, acpid-hosts, squeeze spohr: address: 192.25.206.33 parents: gw-HP-ftc - hostgroups: computers, service, dl380, apache2-hosts, nfs-server, spamd, heavy-exim, squeeze + hostgroups: computers, service, dl380, apache2-hosts, nfs-server, spamd, heavy-exim, squeeze, apache-https peri: address: 192.25.206.15 parents: gw-HP-ftc @@ -263,14 +247,14 @@ servers: parents: gw-man-da hostgroups: computers, service, apache2-hosts, bind9-hosts, postfix-hosts, heavy-postfix, amavis-hosts, dl385, acpid-hosts, apache-https, lenny contacts: bzed + bendel: + address: 82.195.75.101 + parents: gw-man-da + hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, squeeze, postfix-hosts, heavy-postfix, acpid-hosts, apache-https heininen: address: 82.195.75.98 parents: gw-man-da hostgroups: computers, acpid-hosts, service, squeeze, megactl - nielsen: - address: 82.195.75.99 - parents: gw-man-da - hostgroups: computers, acpid-hosts, service, squeeze, megactl unger: address: 82.195.75.102 parents: gw-man-da @@ -303,10 +287,6 @@ servers: address: 82.195.75.97 parents: gw-man-da hostgroups: computers, service, acpid-hosts, heavy-exim, mail-relay, apache2-hosts, squeeze - byrd: - address: 82.195.75.92 - parents: unger - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze # lamb: # address: 82.195.75.101 # parents: unger @@ -318,7 +298,7 @@ servers: new-master: address: 82.195.75.110 parents: czerny - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs master: address: 70.103.162.29 @@ -343,7 +323,7 @@ servers: mayer: address: 140.211.166.78 parents: gw-osuosl - hostgroups: computers, buildd, hasbootfs, lenny + hostgroups: computers, buildd, hasbootfs, squeeze # mayr: # address: 140.211.166.58 # parents: gw-osuosl @@ -361,10 +341,18 @@ servers: address: 140.211.15.34 parents: gw-osuosl hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres84-hosts, squeeze - zee: - address: 140.211.166.16 + parry: + address: 140.211.15.153 + parents: gw-osuosl + hostgroups: computers, hassrvfs, squeeze, buildd, hassrvfs + partch: + address: 140.211.15.152 parents: gw-osuosl - hostgroups: computers, porterbox, hassrvfs, hasbootfs, sparc, lenny + hostgroups: computers, hassrvfs, squeeze, hassrvfs + piston: + address: 140.211.15.154 + parents: gw-osuosl + hostgroups: computers, hassrvfs, squeeze villa: address: 212.211.132.32 @@ -422,18 +410,6 @@ servers: parents: gw-freenet hostgroups: computers, porterbox, sw-raid, hasusrfs, hasorgfs, squeeze - albeniz: - address: 193.62.202.27 - parents: gw-sanger - # SMP kernel doesn't run stable - hostgroups: computers, porterbox, sw-raid, hasbootfs, ntpsuckers, lenny - contacts: tjrc1, dave - goetz: - address: 193.62.202.26 - parents: gw-sanger - # SMP kernel doesn't run stable - hostgroups: computers, buildd, sw-raid, hasbootfs, ntpsuckers, hassrvfs, lenny - contacts: tjrc1, dave sibelius: address: 193.62.202.28 parents: gw-sanger @@ -448,7 +424,7 @@ servers: powell: address: 87.106.64.223 parents: gw-1und1 - hostgroups: computers, service, spamd, heavy-exim, rsyncd-hosts, acpid-hosts, hassrvfs, hasvarfs, hasusrfs, xinetd-hosts, apache2-hosts, lenny + hostgroups: computers, service, spamd, heavy-exim, rsyncd-hosts, acpid-hosts, hassrvfs, hasvarfs, hasusrfs, xinetd-hosts, apache2-hosts, squeeze contacts: joerg schumann: @@ -506,14 +482,9 @@ servers: ancina: address: 157.193.39.13 parents: gw-ghent - hostgroups: computers, buildd, hassrvfs, hasbootfs, incomingmailrelayed2025, xinetd-hosts, lenny + hostgroups: computers, buildd, hassrvfs, hasbootfs, incomingmailrelayed2025, xinetd-hosts, squeeze contacts: luk - agnesi: - address: 67.233.102.241 - parents: gw-agnesi - hostgroups: deadslow, porterbox, lenny - spontini: address: 206.12.19.14 parents: gw-ubc @@ -522,7 +493,7 @@ servers: ravel: address: 206.12.19.5 parents: tchaikovsky - hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts, hasbootfs, nfs-server, rsyncd-hosts, bind9-hosts, uploadqueue, hasorgfs, heavy-exim, xinetd-hosts, squeeze + hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts, hasbootfs, nfs-client, rsyncd-hosts, bind9-hosts, uploadqueue, hasorgfs, heavy-exim, xinetd-hosts, squeeze, autofs dijkstra: address: 206.12.19.218 parents: tchaikovsky @@ -597,15 +568,15 @@ servers: gabrielli: address: 206.12.19.17 parents: tchaikovsky - hostgroups: computers, porterbox, lenny + hostgroups: computers, porterbox, squeeze corelli: address: 206.12.19.16 parents: tchaikovsky - hostgroups: computers, buildd, lenny + hostgroups: computers, buildd, squeeze lucatelli: address: 206.12.19.15 parents: tchaikovsky - hostgroups: computers, buildd, lenny + hostgroups: computers, buildd, squeeze rossini: address: 206.12.19.19 parents: tchaikovsky @@ -618,10 +589,6 @@ servers: address: 206.12.19.21 parents: tchaikovsky hostgroups: computers, dl585, acpid-hosts, service, squeeze - schuetz: - address: 206.12.19.119 - parents: tchaikovsky - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze # locke: # address: 206.12.19.120 # parents: tchaikovsky @@ -669,7 +636,7 @@ servers: gombert: address: 206.12.19.132 parents: traetta - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs, heavy-exim jenkins: address: 206.12.19.133 parents: salieri @@ -677,7 +644,19 @@ servers: blavet: address: 206.12.19.134 parents: traetta - hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, xinetd-hosts + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, xinetd-hosts, nfs-client, autofs + barriere: + address: 206.12.19.135 + parents: traetta + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs + diabelli: + address: 206.12.19.136 + parents: traetta + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, apache2-hosts, apache-https + bizet: + address: 206.12.19.137 + parents: traetta + hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hassrvfs, ftpd-hosts, rsyncd-hosts, heavy-exim, xinetd-hosts, apache2-hosts lebrun: address: 193.198.184.10 @@ -688,11 +667,6 @@ servers: parents: gw-carnet hostgroups: computers, buildd, sw-raid, hassrvfs, sparc, squeeze - tartini: - address: 82.94.249.158 - parents: gw-telegraaf - hostgroups: computers, sw-raid, apache2-hosts, mysql-hosts, hasbootfs, hassrvfs, hasvarfs, hasusrfs, service, lenny - piatti: address: 193.167.161.225 parents: gw-helsinki @@ -713,11 +687,6 @@ servers: parents: gw-zivit hostgroups: computers, buildd, hassrvfs, squeeze - goedel: - address: 213.188.99.214 - parents: gw-cst - hostgroups: computers, hasbootfs, ntpsuckers, buildd, lenny - schein: address: 149.20.20.6 parents: gw-isc @@ -892,7 +861,7 @@ servers: santoro: address: 200.17.202.197 parents: gw-c3sl - hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, xinetd-hosts, hassrvfs, squeeze + hostgroups: computers, service, apache2-hosts, ftpd-hosts, rsyncd-hosts, xinetd-hosts, hassrvfs, squeeze, high-RTT contacts: faw zemlinsky: @@ -906,9 +875,13 @@ servers: hostgroups: computers, buildd, hassrvfs, squeeze, incomingmailrelayed sompek: - address: 217.196.146.208 + address: 217.196.149.225 parents: gw-conova - hostgroups: computers, buildd, hasbootfs, sw-raid, squeeze + hostgroups: computers, buildd, hassrvfs, sw-raid, squeeze, sparc + stadler: + address: 217.196.149.226 + parents: gw-conova + hostgroups: computers, buildd, hassrvfs, sw-raid, squeeze, sparc ############################# # host groups @@ -927,8 +900,6 @@ hostgroups: notacomputer: alias: Systems that are not really systems. Yeah :) private: 1 - deadslow: - alias: Systems too slow to run any real checks freebsd: alias: freebsd private: 1 @@ -1055,9 +1026,6 @@ hostgroups: postgres90-hosts: alias: hosts running postgres90 private: 1 - mysql-hosts: - alias: hosts running mysql - private: 1 no-ulogd: alias: hosts not running ulogd private: 1 @@ -1130,6 +1098,9 @@ hostgroups: brokensamhain: alias: machines that can not run samhain private: 1 + high-RTT: + alias: machines with hight round trip times + private: 1 ############################# # servicegroups @@ -1149,6 +1120,8 @@ servicegroups: alias: apt upgrade status samhain: alias: samhain integrity status + time: + alias: time stuff security: alias: security servicegroup_members: apt, weaksshkeys, kernel, samhain @@ -1161,7 +1134,14 @@ services: name: PING check: "check_ping!300.0,20%!600.0,40%" hostgroups: pingable - excludehostgroups: routing-infrastructure + excludehostgroups: routing-infrastructure, high-RTT + normal_check_interval: 5 + max_check_attempts: 4 + retry_check_interval: 1 + - + name: PING + check: "check_ping!600.0,20%!900.0,40%" + hostgroups: high-RTT normal_check_interval: 5 max_check_attempts: 4 retry_check_interval: 1 @@ -1183,6 +1163,13 @@ services: servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs 90 95" hostgroups: computers + excludehosts: sibelius + - + name: disk usage - all + servicegroups: diskspace + nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs 95 98" + hosts: sibelius + - name: disk usage on / servicegroups: diskspace @@ -1224,7 +1211,7 @@ services: name: disk usage on /tmp servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp" - hosts: saens, tartini, powell, piatti + hosts: saens, powell, piatti - name: disk usage on /usr servicegroups: diskspace @@ -1270,47 +1257,47 @@ services: - name: disk usage on /srv/farm-snapshot/farm-01 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-01" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-01" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-23 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-23" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-23" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-45 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-45" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-45" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-67 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-67" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-67" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-89 servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-89" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-89" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-ab servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-ab" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-ab" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-cd servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/farm-snapshot/farm-cd" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/farm-snapshot/farm-cd" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-f servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/farm-snapshot/farm-f" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 85 /srv/farm-snapshot/farm-f" hosts: sibelius - name: disk usage on /srv/farm-snapshot/farm-e servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/farm-snapshot/farm-e" + nrpe: "/usr/lib/nagios/plugins/check_disk 95 85 /srv/farm-snapshot/farm-e" hosts: sibelius - name: disk usage on /srv/fossology.debian.net @@ -1503,12 +1490,6 @@ services: normal_check_interval: 60 notification_interval: 1440 - - - name: "network service - sshd - 2260" - check: dsa_check_ssh_port!2260 - hosts: agnesi - normal_check_interval: 180 - - name: ssh - weak keys servicegroups: weaksshkeys @@ -1532,17 +1513,17 @@ services: ### - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C munin-node -a '/usr/sbin/munin-node'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a '/usr/sbin/munin-node'" hostgroups: computers excludehostgroups: freebsd, armhf excludehosts: vasks, wagner - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" hostgroups: freebsd - name: process - munin-node - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C munin -a '/usr/sbin/munin-node'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin -a '/usr/sbin/munin-node'" hostgroups: armhf - name: network service - munin-node @@ -1555,6 +1536,7 @@ services: name: process - ntpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -p 1 -C ntpd -a '/usr/sbin/ntpd -p /var/run/ntpd.pid'" hostgroups: computers + servicegroups: time - name: network service - ntp check: dsa_check_ntp @@ -1562,12 +1544,14 @@ services: depends: process - ntpd excludehosts: ancina excludehostgroups: ntpsuckers + servicegroups: time # - name: network service - time check: dsa_check_time hosts: ancina depends: process - xinetd + servicegroups: time ### - @@ -1914,7 +1898,7 @@ services: name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers - excludehosts: grieg, byrd, abel, alwyn, vasks + excludehosts: grieg, abel, alwyn, vasks - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" @@ -1925,6 +1909,10 @@ services: name: "host SSL cert" nrpe: "if [ -e /etc/ssl/certs/thishost.pem ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/certs/thishost.pem; else echo 'No thishost.pem on this host.'; fi" hostgroups: computers + - + name: "pg SSL cert" + nrpe: "/usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/certs/pg-ubcece.debian.org-chained.pem" + hosts: danzi ############ Processes/Services that only run on some computers ############ #### @@ -2104,7 +2092,7 @@ services: - name: process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C inetd -a '/usr/sbin/inetd'" - hosts: grieg, byrd, vasks + hosts: grieg, vasks ### - name: process - xinetd @@ -2317,17 +2305,6 @@ services: name: postgresql backups nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg" hosts: beethoven - #### - - - name: process - mysql - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u root -C mysqld_safe -a '/bin/sh /usr/bin/mysqld_safe'" - hostgroups: mysql-hosts - - - name: process - mysql - workers - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u mysql -C mysqld -a /usr/sbin/mysqld" - hostgroups: mysql-hosts - depends: process - mysql - master - #### - name: process - stunnel4 - postgres-udd @@ -2345,23 +2322,6 @@ services: hostgroups: squeeze, wheezy excludehosts: fano, fasch, field, finzi #### - - - name: process - krb - kdc - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C kdc -a '/usr/lib/heimdal-servers/kdc --config-file=/etc/heimdal-kdc/kdc.conf'" - hosts: schuetz, byrd - - - name: process - krb - iprop - slave - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ipropd-slave -a '/usr/sbin/ipropd-slave byrd.debian.org'" - hosts: schuetz - - - name: process - krb - iprop - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ipropd-master -a '/usr/sbin/ipropd-master'" - hosts: byrd - - - name: process - krb - kpasswdd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C kpasswdd -a '/usr/lib/heimdal-servers/kpasswdd'" - hosts: byrd - ### - name: process - UPS - nut usbhid-ups - ups1 nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C usbhid-ups -a '/lib/nut/usbhid-ups -a ups1'" @@ -2577,6 +2537,6 @@ services: hosts: giustini - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=952 $HOSTADDRESS$ public" + remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=2041 $HOSTADDRESS$ public" runfrom: dijkstra hosts: giustini