X-Git-Url: https://git.adam-barratt.org.uk/?p=mirror%2Fdsa-nagios.git;a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=f2ef5d8e1c2b6e60062d1220245f24289748bbe1;hp=bd5cc292f14f03232a09edbf197ad942a41ecac3;hb=53474a40dd94c064058aae4f9936b9e52577162d;hpb=cb998decd5ffe2992ed3a5fd181c896fdd5c3e2b diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index bd5cc29..f2ef5d8 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -106,7 +106,7 @@ servers: parents: ubc-gateway hostgroups: layer3-infrastructure gw-sanger: - address: 193.62.202.20 + address: 193.62.202.25 parents: ubc-gateway hostgroups: layer3-infrastructure contacts: tjrc1, dave @@ -335,19 +335,15 @@ servers: address: 5.153.231.4 parents: gw-bytemark hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, no-bacula, apache-https, nfs-server, systemd-timesyncd - adayevskaya: - address: 5.153.231.5 - parents: gw-bytemark - hostgroups: computers, service, kvmdomains, buster, systemd-timesyncd pejacevic: address: 5.153.231.6 parents: gw-bytemark - hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, nfs-client, autofs, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, apache2-hosts, nfs-client, autofs, apache-https, systemd-timesyncd contacts: holger piu-slave-bm-a: address: 5.153.231.7 parents: gw-bytemark - hostgroups: computers, service, kvmdomains, stretch, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, nfs-client, autofs, systemd-timesyncd contacts: holger bmdb1: address: 5.153.231.10 @@ -364,7 +360,7 @@ servers: backuphost: address: 5.153.231.12 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, stretch, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, buster, systemd-timesyncd philp: address: 5.153.231.13 parents: ganeti-bytemark @@ -380,7 +376,7 @@ servers: delfin: address: 5.153.231.17 parents: ganeti-bytemark - hostgroups: computers, hassrvfs, kvmdomains, stretch, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, hassrvfs, kvmdomains, buster, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd wuiet: address: 5.153.231.18 parents: ganeti-bytemark @@ -400,19 +396,11 @@ servers: ticharich: address: 5.153.231.23 parents: ganeti-bytemark - hostgroups: computers, general, kvmdomains, stretch, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd + hostgroups: computers, general, kvmdomains, buster, nfs-client, autofs, apache2-hosts, apache-https, service, broken_https_default_vhost, systemd-timesyncd petrova: address: 5.153.231.25 parents: ganeti-bytemark hostgroups: computers, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd - olin: - address: 5.153.231.26 - parents: ganeti-bytemark - hostgroups: computers, kvmdomains, stretch, systemd-timesyncd - barriere: - address: 5.153.231.27 - parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, buster, hassrvfs, porterbox, systemd-timesyncd quantz: address: 5.153.231.28 parents: ganeti-bytemark @@ -444,7 +432,7 @@ servers: jerea: address: 5.153.231.39 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd mekeel: address: 5.153.231.40 parents: ganeti-bytemark @@ -460,7 +448,7 @@ servers: manziarly: address: 5.153.231.44 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, stretch, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, autofs, nfs-client, apache2-hosts, apache-https, systemd-timesyncd casulana: address: 5.153.231.41 @@ -580,12 +568,20 @@ servers: address: 128.31.0.69 parents: ganeti-csail hostgroups: computers, service, kvmdomains, stretch, hassrvfs, uploadqueue, queued, systemd-timesyncd + barriere: + address: 128.31.0.66 + parents: ganeti-csail + hostgroups: computers, service, kvmdomains, buster, hassrvfs, porterbox, systemd-timesyncd + olin: + address: 128.31.0.65 + parents: ganeti-csail + hostgroups: computers, kvmdomains, stretch, systemd-timesyncd # }}} # {{{ gw-dgi storace: address: 93.94.130.161 parents: gw-dgi - hostgroups: computers, stretch, dl380, nfs-client, hassrvfs, physical_x86_intel + hostgroups: computers, buster, dl380, nfs-client, hassrvfs, physical_x86_intel # }}} # {{{ gw-gatech sechter: @@ -609,7 +605,7 @@ servers: loghost-grnet-01: address: 194.177.211.200 parents: gw-grnet - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, systemd-timesyncd geo3: address: 194.177.211.201 parents: gw-grnet @@ -669,19 +665,19 @@ servers: lw01: address: 185.17.185.177 parents: gw-leaseweb - hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts, physical_x86_intel + hostgroups: computers, service, stretch, dl180, nfs-server, physical_x86_intel lw02: address: 185.17.185.178 parents: gw-leaseweb - hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts, physical_x86_intel + hostgroups: computers, service, stretch, dl180, nfs-server, physical_x86_intel lw03: address: 185.17.185.179 parents: gw-leaseweb - hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts, physical_x86_intel + hostgroups: computers, service, stretch, dl180, nfs-server, physical_x86_intel lw04: address: 185.17.185.180 parents: gw-leaseweb - hostgroups: computers, service, stretch, dl180, nfs-server, rsyncd-hosts, physical_x86_intel + hostgroups: computers, service, stretch, dl180, nfs-server, physical_x86_intel lw07: address: 185.17.185.187 parents: gw-leaseweb @@ -708,7 +704,7 @@ servers: czerny: address: 82.195.75.109 parents: gw-manda - hostgroups: computers, service, dl380, acpid-hosts, stretch, manyprocesses, physical_x86_intel + hostgroups: computers, service, dl380, acpid-hosts, buster, manyprocesses, physical_x86_intel clementi: address: 82.195.75.103 parents: gw-manda @@ -801,6 +797,10 @@ servers: address: 82.195.75.68 parents: ganeti-manda hostgroups: computers, service, kvmdomains, stretch, uploadqueue, queued, systemd-timesyncd + adayevskaya: + address: 82.195.75.75 + parents: ganeti-manda + hostgroups: computers, service, kvmdomains, buster, systemd-timesyncd # }}} # {{{ gw-marist zani: @@ -816,7 +816,7 @@ servers: beach: address: 140.211.166.201 parents: byrd - hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, hassrvfs, rsyncd-hosts, apache-https + hostgroups: computers, service, kvmdomains, buster, apache2-hosts, hassrvfs, rsyncd-hosts, apache-https mipsel-osuosl-01: address: 140.211.166.210 @@ -835,12 +835,12 @@ servers: loghost-osuosl-01: address: 140.211.166.202 parents: pijper - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, systemd-timesyncd pieta: address: 140.211.166.195 parents: gw-osuosl - hostgroups: computers, stretch, service, manyprocesses + hostgroups: computers, buster, service, manyprocesses ppc64el-osuosl-01: address: 140.211.166.196 parents: pijper @@ -858,7 +858,7 @@ servers: sibelius: address: 193.62.202.28 parents: gw-sanger - hostgroups: computers, service, apache2-hosts, sw-raid, jessie, rsyncd-hosts, hasvarlogfs, multipath-hosts, nfs-server, varnish-hosts + hostgroups: computers, service, apache2-hosts, sw-raid, buster, rsyncd-hosts, hasvarlogfs, multipath-hosts, nfs-server contacts: tjrc1, dave # }}} # {{{ gw-scanplus @@ -916,7 +916,7 @@ servers: rachmaninoff: address: 209.87.16.20 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, systemd-timesyncd x86-ubc-01: address: 209.87.16.21 parents: ganeti2-ubc @@ -932,7 +932,7 @@ servers: gombert: address: 209.87.16.25 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, apache2-hosts, apache-https, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, apache2-hosts, apache-https, systemd-timesyncd nono: address: 209.87.16.26 parents: ganeti2-ubc @@ -960,7 +960,7 @@ servers: lotti: address: 209.87.16.32 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, systemd-timesyncd muffat: address: 209.87.16.33 parents: ganeti2-ubc @@ -976,7 +976,7 @@ servers: gretchaninov: address: 209.87.16.36 parents: ganeti2-ubc - hostgroups: computers, general, kvmdomains, stretch, hassrvfs, nfs-server, apache2-hosts, xinetd-hosts, apache-https, systemd-timesyncd + hostgroups: computers, general, kvmdomains, buster, hassrvfs, nfs-server, apache2-hosts, xinetd-hosts, apache-https, systemd-timesyncd tye: address: 209.87.16.37 parents: ganeti2-ubc @@ -988,16 +988,16 @@ servers: buxtehude: address: 209.87.16.39 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, heavy-exim, postgres96-hosts, hasvarlogfs, apache-https, spamd, nfs-server, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, apache2-hosts, heavy-exim, postgres11-hosts, hasvarlogfs, apache-https, spamd, nfs-server, systemd-timesyncd piu-slave-ubc-01: address: 209.87.16.42 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, nfs-client, autofs, systemd-timesyncd contacts: holger hier: address: 209.87.16.43 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd + hostgroups: computers, service, kvmdomains, buster, hassrvfs, apache2-hosts, apache-https, nfs-client, autofs, systemd-timesyncd godard: address: 209.87.16.44 parents: ganeti2-ubc @@ -1013,7 +1013,7 @@ servers: grabbe: address: 209.87.16.48 parents: ganeti2-ubc - hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https + hostgroups: computers, service, kvmdomains, buster, systemd-timesyncd, apache2-hosts, apache-https trabaci: address: 209.87.16.49 parents: ganeti2-ubc @@ -1115,24 +1115,32 @@ servers: address: 130.89.148.14 parents: klecker hostgroups: secondary-IPs + new-klecker: + address: 130.89.148.77 + parents: gw-utwente + hostgroups: computers, service, buster, r540, manyprocesses, incomingmailrelayed2025, physical_x86_intel, hassrvfs smit: address: 130.89.148.78 parents: gw-utwente - hostgroups: computers, service, buster, r540, manyprocesses, incomingmailrelayed2025, physical_x86_intel + hostgroups: computers, service, buster, r540, manyprocesses, incomingmailrelayed2025, physical_x86_intel, apache2-hosts, apache-https, hassrvfs + mikrotik-utwente: + address: 130.89.148.79 + parents: gw-utwente + hostgroups: notacomputer # }}} # {{{ gw-ynic henze: address: 144.32.168.74 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, stretch, buildd + hostgroups: computers, hasbootfs, hassrvfs, armhf, buster, buildd hasse: address: 144.32.168.75 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, stretch, buildd + hostgroups: computers, hasbootfs, hassrvfs, armhf, buster, buildd antheil: address: 144.32.168.76 parents: gw-ynic - hostgroups: computers, hasbootfs, hassrvfs, armhf, stretch, buildd + hostgroups: computers, hasbootfs, hassrvfs, armhf, buster, buildd # }}} # {{{ gw-zivit zandonai: @@ -1214,8 +1222,6 @@ hostgroups: alias: Physical machines with Intel CPUs private: 1 - jessie: - alias: Hosts running jessie stretch: alias: Hosts running stretch buster: @@ -1259,6 +1265,9 @@ hostgroups: xinetd-hosts: alias: hosts providing services via xinetd private: 1 + postgres11-hosts: + alias: hosts running postgres11 + private: 1 postgres96-hosts: alias: hosts running postgres96 private: 1 @@ -1541,7 +1550,7 @@ services: nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-4" hosts: lw04 - - name: disk usage on /storage/snapshot-farm-90 + name: disk usage on /storage/snapshot-farm-09 servicegroups: diskspace nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-09" hosts: lw09 @@ -1718,6 +1727,7 @@ services: servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers + excludehostgroups: buildd, pybuildd, porterbox, no-bacula - name: network backup status - draghi @@ -1834,13 +1844,6 @@ services: hostgroups: computers max_check_attempts: -2 notification_interval: 1440 - - - name: process - nrpe - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u nagios -C nrpe -a '/usr/sbin/nrpe -c /etc/nagios/nrpe.cfg -d'" - hostgroups: computers - excludehostgroups: stretch, buster - max_check_attempts: -1 - depends: network service - nrpe - name: process - nrpe nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u nagios -C nrpe -a '/usr/sbin/nrpe -c /etc/nagios/nrpe.cfg -f'" @@ -1891,8 +1894,12 @@ services: - name: process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C irqbalance -a '/usr/sbin/irqbalance'" + hostgroups: stretch + - + name: unexpected process - irqbalance + nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C irqbalance" hostgroups: computers - excludehosts: harris + excludehostgroups: stretch ### - name: process - cron @@ -2467,7 +2474,6 @@ services: name: process - varnish nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1:15 -u vcache -a '/usr/sbin/varnishd -j unix,user=vcache -F -a '" hostgroups: varnish-hosts - excludehostgroups: jessie - name: unwanted process - varnish nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C varnishd" @@ -2487,11 +2493,15 @@ services: name: unwanted process - postgresql nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres" hostgroups: computers - excludehostgroups: postgres96-hosts + excludehostgroups: postgres96-hosts, postgres11-hosts - name: unwanted process - postgresql 9.0 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres -a '9.0/bin/postgres'" hostgroups: computers + - + name: process - postgresql11 - master + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/11/bin/postgres'" + hostgroups: postgres11-hosts - name: process - postgresql96 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.6/bin/postgres'" @@ -2524,11 +2534,6 @@ services: retry_interval: 5 # }}} # {{{ NFS Stuff - - - name: process - statd - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u statd -C rpc.statd -a '/sbin/rpc.statd'" - hostgroups: nfs-client, nfs-server - excludehostgroups: stretch, buster - name: process - nfsd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u root -C nfsd -a '[nfsd]'" @@ -2993,6 +2998,18 @@ services: hostgroups: computers check_interval: 60 retry_interval: 15 + + - + name: puppet - catalog run + remotecheck: "/usr/lib/nagios/plugins/check_puppetdb_nodes -a 4 --node $HOSTNAME$.debian.org -w 720 -c 1440" + hostgroups: computers + runfrom: handel + + - + name: puppet - all catalog runs + nrpe: "/usr/lib/nagios/plugins/check_puppetdb_nodes -a 4 -w 720 -c 1440" + hosts: handel + #### - name: ping peer on mgmt network