X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=8b9e088293d898353dfb9adf82c968f93c899573;hb=b6caa23495e36aa81975967ef36764d20e955853;hp=538833c038208226188894569acb0965a086835e;hpb=3483edb7c09c4b7eb1a95e0f77c6ad938d293af1;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index 538833c..8b9e088 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -197,10 +197,6 @@ servers: address: 195.20.242.124 parents: schumann hostgroups: computers, service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-hosts, uploadqueue, kvmdomains, xinetd-hosts, apache-https, postgres94-hosts, jessie - soler: - address: 195.20.242.126 - parents: schumann - hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, jessie, apache-https wieck: address: 195.20.242.89 parents: gw-1und1-sec @@ -386,6 +382,10 @@ servers: address: 5.153.231.11 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, jessie, autofs, nfs-client, uploadqueue, xinetd-hosts, apache-https, apache2-hosts + backuphost: + address: 5.153.231.12 + parents: ganeti-bytemark + hostgroups: computers, hassrvfs, kvmdomains, jessie philp: address: 5.153.231.13 parents: ganeti-bytemark @@ -435,7 +435,7 @@ servers: oyens: address: 5.153.231.26 parents: ganeti-bytemark - hostgroups: computers, kvmdomains, jessie, openstack-controller, broken_mq #, apache2-hosts, apache-https + hostgroups: computers, kvmdomains, jessie, openstack-controller, broken_mq, apache2-hosts # apache-https barriere: address: 5.153.231.27 parents: ganeti-bytemark @@ -459,7 +459,7 @@ servers: gideon: address: 5.153.231.34 parents: ganeti-bytemark - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https + hostgroups: computers, service, kvmdomains, jessie, hassrvfs httpredir-bm-01: address: 5.153.231.35 parents: ganeti-bytemark @@ -551,7 +551,7 @@ servers: fischer: address: 128.31.0.35 parents: ganeti-csail - hostgroups: computers, freebsd, hassrvfs, porterbox, wheezy + hostgroups: computers, freebsd, hassrvfs, porterbox, jessie mirror-csail: address: 128.31.0.62 parents: ganeti-csail @@ -560,10 +560,18 @@ servers: address: 128.31.0.50 parents: ganeti-csail hostgroups: computers, buildd, hassrvfs, kvmdomains, jessie + x86-csail-02: + address: 128.31.0.68 + parents: ganeti-csail + hostgroups: computers, buildd, hassrvfs, kvmdomains, jessie httpredir-csail-01: address: 128.31.0.66 parents: ganeti-csail hostgroups: computers, service, kvmdomains, jessie, apache2-hosts + soriano: + address: 128.31.0.67 + parents: ganeti-csail + hostgroups: computers, service, kvmdomains, hassrvfs, jessie, apache2-hosts, apache-https # }}} # {{{ gw-dgi storace: @@ -605,11 +613,19 @@ servers: cgi-grnet-01: address: 194.177.211.202 parents: gw-grnet - hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https + hostgroups: computers, service, kvmdomains, jessie, hassrvfs, apache2-hosts, apache-https, xinetd-hosts x86-grnet-01: address: 194.177.211.203 parents: ganeti-grnet hostgroups: computers, buildd, hassrvfs, kvmdomains, jessie + gigault: + address: 194.177.211.204 + parents: ganeti-grnet + hostgroups: computers, service, hassrvfs, kvmdomains, jessie + vittoria: + address: 194.177.211.205 + parents: ganeti-grnet + hostgroups: computers, service, hassrvfs, kvmdomains, jessie # }}} # {{{ gw-isc schein: @@ -621,19 +637,19 @@ servers: lw01: address: 185.17.185.177 parents: gw-leaseweb - hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server + hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server, rsyncd-hosts, xinetd-hosts lw02: address: 185.17.185.178 parents: gw-leaseweb - hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server + hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server, rsyncd-hosts, xinetd-hosts lw03: address: 185.17.185.179 parents: gw-leaseweb - hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server + hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server, rsyncd-hosts, xinetd-hosts lw04: address: 185.17.185.180 parents: gw-leaseweb - hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server + hostgroups: computers, service, acpid-hosts, jessie, dl180, nfs-server, rsyncd-hosts, xinetd-hosts lw07: address: 185.17.185.187 parents: gw-leaseweb @@ -661,7 +677,7 @@ servers: zemlinsky: address: 129.143.160.6 parents: gw-karlsruhe - hostgroups: computers, buildd, wheezy + hostgroups: computers, buildd, jessie contacts: pkern # }}} # {{{ gw-man-da @@ -677,28 +693,20 @@ servers: bendel: address: 82.195.75.100 parents: ganeti3 - hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, wheezy, postfix-hosts, heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs + hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, jessie, postfix-hosts, heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs master: address: 82.195.75.110 parents: ganeti3 hostgroups: computers, service, kvmdomains, jessie, hassrvfs, spamd, heavy-exim, highload - mipsel-manda-01: - address: 82.195.75.72 - parents: gw-man-da - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy - mipsel-manda-02: - address: 82.195.75.74 - parents: gw-man-da - hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy fils: address: 82.195.75.89 parents: ganeti3 - hostgroups: computers, freebsd, wheezy, buildd, hassrvfs + hostgroups: computers, freebsd, jessie, buildd, hassrvfs contacts: christoph fayrfax: address: 82.195.75.82 parents: ganeti3 - hostgroups: computers, freebsd, wheezy, buildd, hassrvfs + hostgroups: computers, freebsd, jessie, buildd, hassrvfs contacts: christoph vento: address: 82.195.75.98 @@ -755,11 +763,15 @@ servers: mipsel-manda-01: address: 82.195.75.72 parents: gw-man-da - hostgroups: computers, buildd, wheezy, hassrvfs, sw-raid + hostgroups: computers, buildd, jessie, hassrvfs, sw-raid, hasbootfs mipsel-manda-02: address: 82.195.75.74 parents: gw-man-da - hostgroups: computers, buildd, wheezy, hassrvfs, sw-raid + hostgroups: computers, buildd, jessie, hassrvfs, sw-raid, hasbootfs + seger: + address: 82.195.75.93 + parents: ganeti3 + hostgroups: computers, service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-hosts, uploadqueue, kvmdomains, xinetd-hosts, apache-https, postgres94-hosts, jessie # }}} # {{{ gw-marist zani: @@ -784,11 +796,19 @@ servers: address: 140.211.166.195 parents: gw-osuosl hostgroups: computers, jessie, service + ppc64el-osuosl-01: + address: 140.211.166.196 + parents: pieta + hostgroups: computers, hassrvfs, buildd, jessie + powerpc-osuosl-01: + address: 140.211.166.197 + parents: pieta + hostgroups: computers, hassrvfs, buildd, jessie + pizzetti: + address: 140.211.166.198 + parents: pieta + hostgroups: computers, jessie, hassrvfs, porterbox # malo TODO - mayer: - address: 140.211.166.78 - parents: gw-osuosl - hostgroups: computers, buildd, hasbootfs, wheezy # mayr: # address: 140.211.166.58 # parents: gw-osuosl @@ -797,10 +817,6 @@ servers: address: 140.211.166.46 parents: gw-osuosl hostgroups: computers, porterbox, hasusrfs, wheezy - parry: - address: 140.211.15.153 - parents: gw-osuosl - hostgroups: computers, jessie, buildd, hassrvfs, sw-raid partch: address: 140.211.15.152 parents: gw-osuosl @@ -849,14 +865,10 @@ servers: address: 86.59.118.151 parents: gw-sil hostgroups: computers, porterbox, jessie, hassrvfs - eysler: - address: 86.59.118.152 - parents: gw-sil - hostgroups: computers, buildd, wheezy eberlin: address: 86.59.118.155 parents: gw-sil - hostgroups: computers, buildd, wheezy, sw-raid + hostgroups: computers, buildd, jessie, sw-raid # }}} # {{{ gw-ubcece sw-ubcece: @@ -913,10 +925,6 @@ servers: address: 206.12.19.118 parents: ganeti2 hostgroups: computers, general, apache2-hosts, kvmdomains, apache-https, jessie - brahms: - address: 206.12.19.115 - parents: ganeti2 - hostgroups: computers, buildd, hassrvfs, kvmdomains, jessie geo2: address: 206.12.19.113 parents: ganeti2 @@ -932,21 +940,13 @@ servers: fano: address: 206.12.19.110 parents: ganeti2 - hostgroups: computers, freebsd, wheezy, buildd, hassrvfs + hostgroups: computers, freebsd, jessie, buildd, hassrvfs contacts: christoph finzi: address: 206.12.19.111 parents: ganeti2 - hostgroups: computers, freebsd, wheezy, buildd, hassrvfs + hostgroups: computers, freebsd, jessie, buildd, hassrvfs contacts: christoph - gabrielli: - address: 206.12.19.17 - parents: sw-ubcece-kais - hostgroups: computers, porterbox, jessie - corelli: - address: 206.12.19.16 - parents: sw-ubcece-kais - hostgroups: computers, buildd, jessie lucatelli: address: 206.12.19.15 parents: sw-ubcece-kais @@ -991,7 +991,7 @@ servers: address: 206.12.19.132 parents: ganeti2 hostgroups: computers, service, kvmdomains, jessie, apache2-hosts, apache-https - jenkins: + jenko: address: 206.12.19.133 parents: ganeti2 hostgroups: computers, service, kvmdomains, jessie @@ -1486,7 +1486,7 @@ services: - name: disk usage on /srv/ftp-master.debian.org servicegroups: diskspace - nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/ftp-master.debian.org" + nrpe: "/usr/lib/nagios/plugins/check_disk 93 96 /srv/ftp-master.debian.org" hosts: franck - name: disk usage on /storage/snapshot-farm-1 @@ -1551,11 +1551,11 @@ services: name: processes - total nrpe: "/usr/lib/nagios/plugins/check_procs 620 700" hostgroups: computers - excludehosts: prokofiev + excludehosts: prokofiev, pieta - name: processes - total nrpe: "/usr/lib/nagios/plugins/check_procs 1500 1700" - hosts: prokofiev + hosts: prokofiev, pieta - name: swap usage - percent nrpe: "/usr/lib/nagios/plugins/check_swap -w 20% -c 10%" @@ -1603,7 +1603,7 @@ services: servicegroups: backup nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-dabackup" hostgroups: computers - excludehosts: storace + excludehosts: backuphost, storace, backuphost normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1611,7 +1611,7 @@ services: name: backup server config servicegroups: backup nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" - hosts: storace + hosts: backuphost, storace, backuphost normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 @@ -1969,6 +1969,10 @@ services: name: "host SSL cert - debian client" nrpe: "if [ -e /etc/ssl/debian/certs/thishost.crt ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/debian/certs/thishost.crt; else echo 'No thishost.crt on this host.'; fi" hostgroups: computers + - + name: "sso CRL" + nrpe: "if [ -e /var/lib/dsa/sso/ca.crl ]; then /usr/lib/nagios/plugins/dsa-check-crl-expire -w 129600 -c 86400 /var/lib/dsa/sso/ca.crl; else echo 'No sso/ca.crl on this host.'; fi" + hostgroups: computers # }}} # {{{ HW health/raid - @@ -2162,7 +2166,7 @@ services: hosts: picconi - name: process - spamd - master - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 10 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd -d --pidfile=/var/run/spamassassin.pid --create-prefs --max-children 10 --helper-home-dir'" hosts: bendel - name: process - spamd - child @@ -2196,7 +2200,7 @@ services: excludehostgroups: wheezy - name: process - postgrey - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a 'postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" hostgroups: heavy-postfix # - @@ -2328,6 +2332,12 @@ services: nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1:100 -u www-data -a /usr/sbin/apache2" hostgroups: apache2-hosts depends: process - apache2 - master + excludehosts: klecker + - + name: process - apache2 - worker + nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:80 -c 1:150 -u www-data -a /usr/sbin/apache2" + hosts: klecker + depends: process - apache2 - master - name: unwanted process - apache2 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C apache2" @@ -2338,7 +2348,7 @@ services: name: network service - http check: check_http hostgroups: apache2-hosts - excludehosts: klecker + excludehosts: klecker, oyens depends: process - apache2 - master - name: network service - http @@ -2358,14 +2368,14 @@ services: name: network service - https check: check_https hostgroups: apache-https - excludehosts: handel,menotti + excludehosts: menotti excludehostgroups: broken_https_default_vhost depends: "process - apache2 - master" normal_check_interval: 120 - name: network service - https check: dsa_check_https_want_auth - hosts: handel,menotti + hosts: menotti depends: "process - apache2 - master" normal_check_interval: 120 - @@ -2420,7 +2430,7 @@ services: - name: postgresql backups nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg" - hosts: storace + hosts: storace, backuphost # }}} # {{{ power # - @@ -2562,6 +2572,22 @@ services: name: DNS SOA sync - alioth.debian.org check: "dsa_check_soas_add!denis.debian.org!alioth.debian.org" hosts: global + - + name: DNS SOA sync - debconf.net + check: "dsa_check_soas_add!denis.debian.org!debconf.net" + hosts: global + - + name: DNS SOA sync - debconf.org + check: "dsa_check_soas_add!denis.debian.org!debconf.org" + hosts: global + - + name: DNS SOA sync - debianday.org + check: "dsa_check_soas_add!denis.debian.org!debianday.org" + hosts: global + - + name: DNS SOA sync - dpkg.org + check: "dsa_check_soas_add!denis.debian.org!dpkg.org" + hosts: global - name: DNS - delegation and signature expiry hosts: global @@ -2599,7 +2625,7 @@ services: hosts: giustini - name: event log - remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=10791 $HOSTADDRESS$ public" + remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=10867 $HOSTADDRESS$ public" runfrom: ubc-bl8 hosts: giustini # }}} @@ -2612,46 +2638,46 @@ services: retry_check_interval: 15 # }}} # {{{ openstack - - - name: process - openstack - memcached - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nobody -C memcached -a '/usr/bin/memcached -m 128 -p 11211 -u nobody -l 0.0.0.0'" - hostgroups: openstack-controller - - - name: process - openstack - glance-registry - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u glance -C glance-registry -a '/usr/bin/python /usr/bin/glance-registry'" - hostgroups: openstack-controller - - - name: process - openstack - nova-api - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-api -a '/usr/bin/python /usr/bin/nova-api --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-api.log'" - hostgroups: openstack-controller +# - +# name: process - openstack - memcached +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nobody -C memcached -a '/usr/bin/memcached -m 128 -p 11211 -u nobody -l 0.0.0.0'" +# hostgroups: openstack-controller +# - +# name: process - openstack - glance-registry +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u glance -C glance-registry -a '/usr/bin/python /usr/bin/glance-registry'" +# hostgroups: openstack-controller +# - +# name: process - openstack - nova-api +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-api -a '/usr/bin/python /usr/bin/nova-api --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-api.log'" +# hostgroups: openstack-controller - name: process - openstack - nova-compute nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-compute -a '/usr/bin/python /usr/bin/nova-compute --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-compute.log --config-file=/etc/nova/nova-compute.conf'" hostgroups: openstack-compute - - - name: process - openstack - nova-cert - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-cert -a '/usr/bin/python /usr/bin/nova-cert --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-cert.log'" - hostgroups: openstack-controller - - - name: process - openstack - nova-conductor - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-conductor -a '/usr/bin/python /usr/bin/nova-conductor --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-conductor.log'" - hostgroups: openstack-controller - - - name: process - openstack - nova-consoleauth - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-consoleauth --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-consoleauth.log'" - hostgroups: openstack-controller - - - name: process - openstack - nova-scheduler - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-scheduler --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-scheduler.log'" - hostgroups: openstack-controller - - - name: process - openstack - nova-spicehtml5proxy - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-spicehtml5proxy --log-file /var/log/nova/nova-consoleproxy.log'" - hostgroups: openstack-controller - - - name: process - openstack - neutron-server - nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u neutron -C neutron-server -a '/usr/bin/python2.7 /usr/bin/neutron-server --config-file=/etc/neutron/neutron.conf --config-file /etc/neutron/plugins/openvswitch/ovs_neutron_plugin.ini --log-file=/var/log/neutron/neutron-server.log'" - hostgroups: openstack-controller +# - +# name: process - openstack - nova-cert +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-cert -a '/usr/bin/python /usr/bin/nova-cert --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-cert.log'" +# hostgroups: openstack-controller +# - +# name: process - openstack - nova-conductor +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -C nova-conductor -a '/usr/bin/python /usr/bin/nova-conductor --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-conductor.log'" +# hostgroups: openstack-controller +# - +# name: process - openstack - nova-consoleauth +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-consoleauth --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-consoleauth.log'" +# hostgroups: openstack-controller +# - +# name: process - openstack - nova-scheduler +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-scheduler --config-file=/etc/nova/nova.conf --log-file /var/log/nova/nova-scheduler.log'" +# hostgroups: openstack-controller +# - +# name: process - openstack - nova-spicehtml5proxy +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u nova -a '/usr/bin/python /usr/bin/nova-spicehtml5proxy --log-file /var/log/nova/nova-consoleproxy.log'" +# hostgroups: openstack-controller +# - +# name: process - openstack - neutron-server +# nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u neutron -C neutron-server -a '/usr/bin/python2.7 /usr/bin/neutron-server --config-file=/etc/neutron/neutron.conf --config-file /etc/neutron/plugins/openvswitch/ovs_neutron_plugin.ini --log-file=/var/log/neutron/neutron-server.log'" +# hostgroups: openstack-controller # }}} # {{{ misc - @@ -2728,7 +2754,7 @@ services: #### - name: puppetmaster cert - nrpe: "/usr/lib/nagios/plugins/dsa-check-cert-expire /var/lib/puppet/ssl/certs/ca.pem" + nrpe: "sudo -u puppet /usr/lib/nagios/plugins/dsa-check-cert-expire /var/lib/puppet/ssl/certs/ca.pem" hosts: handel normal_check_interval: 60 max_check_attempts: 2