address: 72.52.94.70
parents: gw-ubcece
hostgroups: layer3-infrastructure
- gw-karlsruhe:
- address: 129.143.59.214
- parents: gw-ubcece
- hostgroups: layer3-infrastructure
gw-leaseweb:
address: 185.17.185.190
parents: gw-ubcece
address: 130.239.18.123
parents: gw-accumu
hostgroups: computers, hasbootfs, aacraid, nfs-client, service, apache2-hosts, stretch, autofs, sw-raid
+ contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa
+ contact_groups: ""
mirror-accumu:
address: 130.242.6.199
parents: gw-accumu2
x86-bm-01:
address: 5.153.231.32
parents: ganeti-bytemark
- hostgroups: computers, kvmdomains, stretch, no-bacula, systemd-timesyncd
+ hostgroups: computers, pybuildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd
tate:
address: 5.153.231.33
parents: ganeti-bytemark
address: 5.153.231.41
parents: gw-bytemark
hostgroups: computers, service, stretch, hassrvfs, dl380, manyprocesses, apache2-hosts
+ contacts: zobel, tfheen, lfilipoz, zumbi, jcristau, pabs, aurel32, dsa-nsa
+ contact_groups: ""
# }}}
# {{{ gw-c3sl
santoro:
x86-grnet-01:
address: 194.177.211.203
parents: ganeti-grnet
- hostgroups: computers, buildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd
+ hostgroups: computers, pybuildd, hassrvfs, kvmdomains, stretch, systemd-timesyncd
vittoria:
address: 194.177.211.205
parents: ganeti-grnet
parents: gw-leaseweb
hostgroups: computers, service, stretch, dl180
# }}}
- # {{{ gw-karlsruhe
- zemlinsky:
- address: 129.143.160.6
- parents: gw-karlsruhe
- hostgroups: computers, buildd, stretch
- contacts: pkern
- # }}}
# {{{ gw-manda
czerny:
address: 82.195.75.109
zani:
address: 148.100.88.22
parents: gw-marist
- hostgroups: computers, buildd, hassrvfs, stretch, incomingmailrelayed
+ hostgroups: computers, pybuildd, hassrvfs, stretch, incomingmailrelayed
# }}}
# {{{ gw-osuosl
byrd:
sallinen:
address: 193.62.202.26
parents: gw-sanger
- hostgroups: computers, service, stretch, dl380, nfs-client, autofs, postgres96-hosts
+ hostgroups: computers, service, stretch, dl380, nfs-client, autofs, postgres96-hosts, apache2-hosts
sibelius:
address: 193.62.202.28
parents: gw-sanger
godard:
address: 209.87.16.44
parents: ubc-gateway
- hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts, manyprocesses
+ hostgroups: computers, service, kvmdomains, stretch, hassrvfs, apache2-hosts, apache-https, systemd-timesyncd, postfix-hosts, postgres96-hosts, crazymanyprocesses
debussy:
address: 209.87.16.46
parents: ubc-gateway
hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https, broken_https_default_vhost
+ kantuser:
+ address: 209.87.16.47
+ parents: ubc-gateway
+ hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd
+ grabbe:
+ address: 209.87.16.48
+ parents: ubc-gateway
+ hostgroups: computers, service, kvmdomains, stretch, systemd-timesyncd, apache2-hosts, apache-https
# }}}
# {{{ gw-umn
#saens:
computers:
alias: computers
private: 1
- extinfo-icon_image: base/debian.png
- extinfo-icon_image_alt: Debian GNU/Linux
- extinfo-notes_url: https://db.debian.org/machines.cgi?host=%s
layer3-infrastructure:
alias: Layer 3 Devices
- extinfo-icon_image: base/switch40.png
- extinfo-icon_image_alt: router
notacomputer:
alias: Systems that are not really systems. Yeah :)
private: 1
alias: machines running services
buildd:
alias: buildd systems
+ pybuildd:
+ alias: buildd systems running pybuildd
general:
alias: general purpose developer accessible machines
private: 1
manyprocesses:
alias: hosts with lots and lots of (kernel) processes
+ crazymanyprocesses:
+ alias: hosts with stupidly lots of processes
no-bacula:
alias: hosts which are not being backed up with bacula
check_interval: 5
max_check_attempts: 4
retry_interval: 1
+ -
+ name: network - v6 gw
+ nrpe: "/usr/lib/nagios/plugins/dsa-check-ipv6-default-gw"
+ hostgroups: computers
+ check_interval: 60
+ excludehostgroups: alioth
# }}}
# {{{ ### disk usage
-
-
name: disk usage on /srv/farm-snapshot/farm-2017-0
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-0"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-0"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-1
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-1"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-1"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-2
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-2"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-2"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-3
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-3"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-3"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-4
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-4"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-4"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-5
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-5"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-5"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-6
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-6"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-6"
hosts: sibelius
-
name: disk usage on /srv/farm-snapshot/farm-2017-7
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 97 95 /srv/farm-snapshot/farm-2017-7"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-2017-7"
hosts: sibelius
-
name: disk usage on /srv/ftp-master.debian.org
-
name: disk usage on /storage/snapshot-farm-1
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-1"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-1"
hosts: lw01
-
name: disk usage on /storage/snapshot-farm-2
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-2"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-2"
hosts: lw02
-
name: disk usage on /storage/snapshot-farm-3
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-3"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-3"
hosts: lw03
-
name: disk usage on /storage/snapshot-farm-4
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 98 92 /storage/snapshot-farm-4"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-4"
hosts: lw04
+ -
+ name: disk usage on /storage/snapshot-farm-09
+ servicegroups: diskspace
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-09"
+ hosts: lw09
+ -
+ name: disk usage on /storage/snapshot-farm-10
+ servicegroups: diskspace
+ nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /storage/snapshot-farm-10"
+ hosts: lw10
-
name: disk usage on /srv/morgue.debian.org/
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 95 90 /srv/morgue.debian.org"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/morgue.debian.org"
hosts: lw03
-
name: disk usage on /srv/QNAP-big/
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-big"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /srv/QNAP-big"
hosts: storace
-
name: disk usage on /srv/QNAP-tiny
servicegroups: diskspace
- nrpe: "/usr/lib/nagios/plugins/check_disk 90 80 /srv/QNAP-tiny"
+ nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /srv/QNAP-tiny"
hosts: storace
# }}}
# {{{ ### system
name: processes - total
nrpe: "/usr/lib/nagios/plugins/check_procs 620 700"
hostgroups: computers
- excludehostgroups: manyprocesses
+ excludehostgroups: manyprocesses, crazymanyprocesses
-
name: processes - total
hostgroups: manyprocesses
nrpe: "/usr/lib/nagios/plugins/check_procs 1500 1700"
+ -
+ name: processes - total
+ hostgroups: crazymanyprocesses
+ nrpe: "/usr/lib/nagios/plugins/check_procs 15000 25000"
-
name: free memory - mb
nrpe: "/usr/lib/nagios/plugins/dsa-check-memory -m mb"
remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula $HOSTNAME$.debian.org"
runfrom: dinis
hostgroups: computers
- excludehostgroups: buildd, porterbox, no-bacula
+ excludehostgroups: buildd, pybuildd, porterbox, no-bacula
check_interval: 60
retry_interval: 15
-
remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula -w 1080 -c 1560 $HOSTNAME$.debian.org F"
runfrom: dinis
hostgroups: computers
- excludehostgroups: buildd, porterbox, no-bacula
+ excludehostgroups: buildd, pybuildd, porterbox, no-bacula
check_interval: 60
retry_interval: 15
-
name: "sso CRL"
nrpe: "if [ -e /var/lib/dsa/sso/ca.crl ]; then /usr/lib/nagios/plugins/dsa-check-crl-expire -w 129600 -c 86400 /var/lib/dsa/sso/ca.crl; else echo 'No sso/ca.crl on this host.'; fi"
hostgroups: computers
- -
- name: SSL certs - puppet
- hosts: global
- remotecheck: "/usr/lib/nagios/plugins/dsa-check-cert-expire-dir /etc/puppet/modules/ssl/files/servicecerts"
- runfrom: handel
-
name: SSL certs - LE
hosts: global
nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'"
hostgroups: buildd
contact_groups: buildd
+ -
+ name: process - buildd
+ servicegroups: buildd
+ nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C python3 -a 'buildd.py'"
+ hostgroups: pybuildd
+ contact_groups: buildd
-
name: processes - zombie schroot
nrpe: "(/usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0 > /dev/null || /usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0) && /usr/lib/nagios/plugins/check_procs -a schroot -s ZNs -c 0"
- hostgroups: buildd
+ hostgroups: buildd, pybuildd
contact_groups: +buildd
check_interval: 5
max_check_attempts: 24
retry_interval: 5
- -
- name: processes - lvcreate
- nrpe: "/usr/lib/nagios/plugins/check_procs -m 'ELAPSED' -c 500 -C lvcreate -u root -a 'lvcreate'"
- hostgroups: buildd
- contact_groups: +buildd
# }}}
# {{{ NFS Stuff
-