X-Git-Url: https://git.adam-barratt.org.uk/?a=blobdiff_plain;f=config%2Fnagios-master.cfg;h=aedf36d919c5f7c5149c0a495beb72e26f724dc2;hb=f7167e7c56afd55cef645076864e0f77cc618e6f;hp=e67d0b523014920697525b78ab460ca38045f550;hpb=5be1906ab0042172eed788189789b020361bf7b5;p=mirror%2Fdsa-nagios.git diff --git a/config/nagios-master.cfg b/config/nagios-master.cfg index e67d0b5..aedf36d 100644 --- a/config/nagios-master.cfg +++ b/config/nagios-master.cfg @@ -642,7 +642,7 @@ servers: porta: address: 194.177.211.207 parents: ganeti-grnet - hostgroups: computers, service, hassrvfs, kvmdomains, jessie, rsyncd-hosts, xinetd-hosts, systemd-timesyncd + hostgroups: computers, service, hassrvfs, kvmdomains, jessie, rsyncd-systemd-hosts, xinetd-hosts, systemd-timesyncd melartin: address: 194.177.211.208 parents: ganeti-grnet @@ -763,7 +763,7 @@ servers: kaufmann: address: 82.195.75.107 parents: ganeti3 - hostgroups: computers, service, apache2-hosts, rsyncd-hosts, kvmdomains, xinetd-hosts, jessie, apache-https + hostgroups: computers, service, apache2-hosts, rsyncd-systemd-hosts, kvmdomains, jessie, apache-https stockhausen: address: 82.195.75.108 parents: ganeti3 @@ -856,6 +856,10 @@ servers: hostgroups: computers, jessie, hassrvfs, porterbox, sw-raid # }}} # {{{ gw-sanger + sallinen: + address: 193.62.202.26 + parents: gw-sanger + hostgroups: computers, service, jessie, dl380, hpnewraid sibelius: address: 193.62.202.28 parents: gw-sanger @@ -1282,6 +1286,9 @@ hostgroups: rsyncd-hosts: alias: hosts providing rsync services via xinetd private: 1 + rsyncd-systemd-hosts: + alias: hosts providing rsync services via systemd + private: 1 xinetd-hosts: alias: hosts providing services via xinetd private: 1 @@ -1417,21 +1424,21 @@ services: excludehostgroups: layer3-infrastructure, high-RTT check_interval: 5 max_check_attempts: 4 - retry_check_interval: 1 + retry_interval: 1 - name: PING check: "check_ping!600.0,20%!900.0,40%" hostgroups: high-RTT check_interval: 5 max_check_attempts: 4 - retry_check_interval: 1 + retry_interval: 1 - name: PING check: "check_ping!2000.0,60%!3000.0,80%" hostgroups: layer3-infrastructure check_interval: 5 max_check_attempts: 4 - retry_check_interval: 1 + retry_interval: 1 # }}} # {{{ ### disk usage - @@ -1632,7 +1639,7 @@ services: name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 hostgroups: computers # }}} # {{{ backup @@ -1644,7 +1651,7 @@ services: excludehosts: backuphost, storace check_interval: 60 max_check_attempts: 2 - retry_check_interval: 5 + retry_interval: 5 - name: backup server config servicegroups: backup @@ -1652,7 +1659,7 @@ services: hosts: storace check_interval: 60 max_check_attempts: 2 - retry_check_interval: 5 + retry_interval: 5 - name: backup - bacula - last backup servicegroups: backup @@ -1661,7 +1668,7 @@ services: hostgroups: computers excludehostgroups: buildd, porterbox, no-bacula check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 - name: backup - bacula - last full backup servicegroups: backup @@ -1670,7 +1677,7 @@ services: hostgroups: computers excludehostgroups: buildd, porterbox, no-bacula check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 - name: process - bacula-dir servicegroups: backup @@ -1701,14 +1708,14 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-running-kernel" hostgroups: computers check_interval: 60 - retry_check_interval: 5 + retry_interval: 5 - name: apt - security updates servicegroups: apt nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/apt" hostgroups: computers check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 - name: unexpected file - apt sources.list servicegroups: apt @@ -1722,7 +1729,7 @@ services: hostgroups: computers excludehostgroups: freebsd check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 notification_interval: 10080 - name: installed firewall @@ -1761,7 +1768,7 @@ services: hostgroups: computers depends: process - samhain check_interval: 60 - retry_check_interval: 5 + retry_interval: 5 excludehostgroups: brokensamhain - name: processes - samhain zombies @@ -1911,7 +1918,7 @@ services: runfrom: rainier hostgroups: computers check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 excludehostgroups: alioth, broken_mq - name: MQ connection on rapoport @@ -1920,7 +1927,7 @@ services: runfrom: rapoport hostgroups: computers check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 excludehostgroups: alioth, broken_mq ### - @@ -2122,7 +2129,7 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm" check_interval: 120 hostgroups: dl380, dl360, bl460, bm-bl - excludehosts: villa, lobos, storace, mirror-anu + excludehosts: villa, lobos, storace, mirror-anu, sallinen - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --ps-no-redundant" @@ -2137,7 +2144,7 @@ services: name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --fan-ignore-not-present" check_interval: 120 - hosts: storace + hosts: storace, sallinen - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --fan-ignore-not-present --ps-no-redundant --ignore-failed='PS1'" @@ -2551,7 +2558,7 @@ services: contact_groups: +buildd check_interval: 5 max_check_attempts: 24 - retry_check_interval: 5 + retry_interval: 5 - name: processes - lvcreate nrpe: "/usr/lib/nagios/plugins/check_procs -m 'ELAPSED' -c 500 -C lvcreate -u root -a 'lvcreate'" @@ -2603,7 +2610,7 @@ services: hosts: global check_interval: 15 max_check_attempts: 5 - retry_check_interval: 5 + retry_interval: 5 servicegroups: mirror - name: mirror sync - snapshot @@ -2611,7 +2618,7 @@ services: hosts: global check_interval: 15 max_check_attempts: 5 - retry_check_interval: 5 + retry_interval: 5 servicegroups: mirror - @@ -2882,7 +2889,7 @@ services: hosts: giustini check_interval: 5 max_check_attempts: 4 - retry_check_interval: 1 + retry_interval: 1 - name: Overall Unit Status remotecheck: "/usr/lib/nagios/plugins/check_snmp -H $HOSTADDRESS$ -C public -P 2c -o connUnitStatus -n -c 3 -w 3" @@ -2910,7 +2917,7 @@ services: nrpe: "/usr/lib/nagios/plugins/dsa-check-dchroots-current" hostgroups: porterbox check_interval: 60 - retry_check_interval: 15 + retry_interval: 15 # }}} # {{{ openstack # - @@ -2978,6 +2985,10 @@ services: hosts: draghi depends: process - xinetd ### + - + name: network service - rsync + check: check_tcp!873 + hostgroups: rsyncd-systemd-hosts - name: network service - rsync check: check_tcp!873 @@ -3037,7 +3048,7 @@ services: hosts: handel check_interval: 60 max_check_attempts: 2 - retry_check_interval: 5 + retry_interval: 5 # }}} # }}}