# Non comment lines are YAML # # Strings ought to be in double quotes, but it works in most cases if they aren't :) # # vim:set syntax=yaml: # TODO # - *: check munin stats collection works # - *: check backups are successful # - *: unwanted: network: auth, discard, daytime, time (on some), cvs-pserver, rsync (on some), ftp (on some), http (on some) --- ############################# # hosts ############################# servers: # {{{ gateways global: hostgroups: notacomputer pingable: false check_command: dsa_check_always_ok gw-1und1: parents: gw-ubcece hostgroups: notacomputer pingable: false check_command: dsa_check_always_ok gw-1und1-sec: parents: gw-ubcece hostgroups: notacomputer pingable: false check_command: dsa_check_always_ok gw-accumu: address: 130.239.18.97 parents: gw-ubcece hostgroups: layer3-infrastructure gw-bytemark: address: 89.16.160.116 parents: gw-ubcece hostgroups: layer3-infrastructure gw-c3sl: address: 200.17.202.254 parents: gw-ubcece hostgroups: layer3-infrastructure gw-cecsit: address: 150.203.164.38 parents: gw-ubcece hostgroups: layer3-infrastructure gw-arm: address: 213.104.121.213 parents: gw-ubcece hostgroups: layer3-infrastructure gw-brown: address: 138.16.160.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-carnet: address: 161.53.160.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-conova: address: 217.196.149.238 parents: gw-ubcece hostgroups: layer3-infrastructure gw-csail: address: 128.31.0.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-dgi: address: 93.94.132.102 parents: gw-ubcece hostgroups: layer3-infrastructure contacts: bzed gw-freenet: address: 62.104.23.249 parents: gw-ubcece hostgroups: layer3-infrastructure gw-ftcollins: address: 192.25.206.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-grnet: address: 194.177.211.193 parents: gw-ubcece hostgroups: layer3-infrastructure gw-isc: address: 149.20.20.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-karlsruhe: address: 
129.143.57.177 parents: gw-ubcece hostgroups: layer3-infrastructure gw-man-da: address: 82.195.75.126 parents: gw-ubcece hostgroups: layer3-infrastructure gw-marist: address: 148.100.88.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-osuosl: address: 140.211.166.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-rapidswitch: address: 193.201.200.129 parents: gw-ubcece hostgroups: layer3-infrastructure gw-sanger: address: 193.62.202.20 parents: gw-ubcece hostgroups: layer3-infrastructure contacts: tjrc1, dave gw-scanplus-lobos: address: 212.211.132.249 parents: gw-ubcece hostgroups: layer3-infrastructure gw-scanplus-villa: address: 212.211.132.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-sil: address: 86.59.118.145 parents: gw-ubcece hostgroups: layer3-infrastructure gw-ubcece: address: 206.12.19.254 hostgroups: layer3-infrastructure contacts: lfilipoz gw-ugent: address: 193.191.17.50 parents: gw-ubcece hostgroups: layer3-infrastructure gw-umn: address: 128.101.240.222 parents: gw-ubcece hostgroups: layer3-infrastructure gw-utwente: address: 130.89.149.1 parents: gw-ubcece hostgroups: layer3-infrastructure gw-ynic: # really janet, because ynic is stupid about firewalling #address: 146.97.42.26 address: 146.97.41.66 parents: gw-ubcece hostgroups: layer3-infrastructure gw-zivit: address: 80.245.144.3 parents: gw-ubcece hostgroups: layer3-infrastructure # }}} # {{{ servers # {{{ gw-1und1 powell: address: 87.106.64.223 parents: gw-1und1 hostgroups: computers, service, acpid-hosts, wheezy pkgmirror-1and1: address: 213.165.95.4 parents: powell hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, no-bacula, apache-https babin: address: 213.165.95.6 parents: powell hostgroups: computers, buildd, hassrvfs, kvmdomains, wheezy # }}} # {{{ gw-1und1-sec schumann: address: 212.227.126.54 parents: gw-1und1-sec hostgroups: computers, acpid-hosts, service, wheezy chopin: address: 195.20.242.124 parents: schumann hostgroups: computers, 
service, apache2-hosts, hassrvfs, hasbootfs, rsyncd-hosts, uploadqueue, kvmdomains, heavy-exim, xinetd-hosts, apache-https, postgres91-hosts, wheezy geo3: address: 195.20.242.125 parents: schumann hostgroups: computers, service, hasbootfs, bind9-hosts, kvmdomains, wheezy soler: address: 195.20.242.126 parents: schumann hostgroups: computers, service, hasbootfs, hassrvfs, kvmdomains, apache2-hosts, wheezy, apache-https wieck: address: 195.20.242.89 parents: gw-1und1-sec hostgroups: computers, service, apache2-hosts, rsyncd-hosts, acpid-hosts, xinetd-hosts, wheezy, security_mirror, hasvarlogfs, no-bacula # }}} # {{{ gw-accumu pettersson: address: 130.239.18.123 parents: gw-accumu hostgroups: computers, hasbootfs, aacraid, nfs-client, acpid-hosts, service, apache2-hosts, wheezy, autofs praetorius: address: 130.239.18.121 parents: gw-accumu hostgroups: computers, buildd, hassrvfs, wheezy # }}} # {{{ gw-arm abel: address: 217.140.96.56 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, porterbox, wheezy, deadslow alain: address: 217.140.96.58 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, deadslow alwyn: address: 217.140.96.59 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, deadslow antheil: address: 217.140.96.60 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, deadslow arne: address: 217.140.96.61 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, deadslow arnold: address: 217.140.96.57 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, buildd, wheezy, deadslow harris: address: 217.140.96.66 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, porterbox, deadslow hasse: address: 217.140.96.68 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, deadslow henze: address: 217.140.96.70 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, wheezy, armhf, buildd, deadslow hoiby: address: 
217.140.96.71 parents: gw-arm hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, buildd, deadslow # }}} # {{{ gw-brown franck: address: 138.16.160.12 parents: gw-brown hostgroups: computers, service, apache2-hosts, dl380, rsyncd-hosts, postgres91-hosts, spamd, heavy-exim, acpid-hosts, uploadqueue, xinetd-hosts, apache-https, hassrvfs, wheezy # }}} # {{{ gw-bytemark bm-bl1: address: 5.153.231.241 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl2: address: 5.153.231.242 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl3: address: 5.153.231.243 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl4: address: 5.153.231.244 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl5: address: 5.153.231.245 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl6: address: 5.153.231.246 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl7: address: 5.153.231.247 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy bm-bl8: address: 5.153.231.248 parents: gw-bytemark hostgroups: computers, bm-bl, acpid-hosts, service, wheezy milanollo: address: 5.153.231.2 parents: gw-bytemark hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-server, xinetd-hosts milanollo2: address: 5.153.231.9 parents: milanollo hostgroups: secondary-IPs picconi: address: 5.153.231.3 parents: gw-bytemark hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-client, autofs, heavy-exim, spamd, apache-https senfter: address: 5.153.231.4 parents: gw-bytemark hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, no-bacula, apache-https adayevskaya: address: 5.153.231.5 parents: gw-bytemark hostgroups: computers, service, kvmdomains, wheezy pejacevic: address: 5.153.231.6 parents: gw-bytemark hostgroups: computers, service, 
kvmdomains, wheezy, apache2-hosts, nfs-client, autofs, apache-https contacts: holger piu-slave-bm-a: address: 5.153.231.7 parents: gw-bytemark hostgroups: computers, service, kvmdomains, wheezy, nfs-client, autofs contacts: holger binet: address: 5.153.231.8 parents: gw-bytemark hostgroups: computers, buildd, hassrvfs, kvmdomains, wheezy bmdb1: address: 5.153.231.10 parents: gw-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, postgres91-hosts ganeti-bytemark: address: 82.195.75.111 parents: gw-bytemark hostgroups: notacomputer coccia: address: 5.153.231.11 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, autofs, nfs-client backuphost: address: 5.153.231.12 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy philp: address: 5.153.231.13 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, apache2-hosts petrova: address: 5.153.231.25 parents: ganeti-bytemark hostgroups: computers, kvmdomains, wheezy, apache2-hosts couper: address: 5.153.231.14 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, apache2-hosts, nfs-client, autofs rainier: address: 5.153.231.15 parents: ganeti-bytemark hostgroups: computers, kvmdomains, wheezy, no-bacula rapoport: address: 5.153.231.16 parents: ganeti-bytemark hostgroups: computers, kvmdomains, wheezy, no-bacula delfin: address: 5.153.231.17 parents: ganeti-bytemark hostgroups: computers, hassrvfs, kvmdomains, wheezy, apache2-hosts wuiet: address: 5.153.231.18 parents: ganeti-bytemark hostgroups: computers, general, kvmdomains, wheezy, service, apache-https, apache2-hosts, heavy-exim, xinetd-hosts dinis: address: 5.153.231.19 parents: ganeti-bytemark hostgroups: computers, general, kvmdomains, wheezy donizetti: address: 5.153.231.20 parents: ganeti-bytemark hostgroups: computers, general, kvmdomains, wheezy, nfs-client, autofs dillon: address: 5.153.231.22 parents: ganeti-bytemark hostgroups: computers, general, 
kvmdomains, wheezy, nfs-client, autofs, hassrvfs ticharich: address: 5.153.231.23 parents: ganeti-bytemark hostgroups: computers, general, kvmdomains, wheezy, nfs-client, autofs, apache2-hosts, apache-https, service diamond: address: 5.153.231.24 parents: ganeti-bytemark hostgroups: computers, service, kvmdomains, wheezy, bind9-hosts, no-bacula # }}} # {{{ gw-c3sl santoro: address: 200.17.202.197 parents: gw-c3sl hostgroups: computers, service, apache2-hosts, rsyncd-hosts, xinetd-hosts, hassrvfs, wheezy, high-RTT, security_mirror, no-bacula, apache-https contacts: faw # }}} # {{{ gw-carnet lebrun: address: 193.198.184.10 parents: gw-carnet hostgroups: computers, buildd, sw-raid, hasorgfs, sparc, wheezy schroeder: address: 193.198.184.11 parents: gw-carnet hostgroups: computers, buildd, sw-raid, hassrvfs, sparc, wheezy # }}} # {{{ gw-cecsit gluck: address: 150.203.164.38 parents: gw-cecsit hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hassrvfs, acpid-hosts, xinetd-hosts, wheezy, security_mirror, no-bacula, apache-https # }}} # {{{ gw-conova sompek: address: 217.196.149.225 parents: gw-conova hostgroups: computers, buildd, hassrvfs, sw-raid, wheezy, sparc stadler: address: 217.196.149.226 parents: gw-conova hostgroups: computers, buildd, hassrvfs, sw-raid, wheezy, sparc # }}} # {{{ gw-csail senfl: address: 128.31.0.51 parents: gw-csail hostgroups: computers, service, dl360, acpid-hosts, hassrvfs, apache2-hosts, rsyncd-hosts, bind9-hosts, xinetd-hosts, squeeze, apache-https steffani: address: 128.31.0.36 parents: gw-csail hostgroups: computers, service, apache2-hosts, rsyncd-hosts, sw-raid, acpid-hosts, hasbootfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula # }}} # {{{ gw-dgi argento: address: 93.94.130.160 parents: gw-dgi hostgroups: computers, sw-raid, hassrvfs, wheezy # }}} # {{{ gw-ftcollins #alkman: # address: 192.25.206.63 # parents: gw-ftcollins # hostgroups: computers, buildd, acpid-hosts, wheezy #merulo: # address: 
192.25.206.58 # parents: gw-ftcollins # hostgroups: computers, porterbox, hasusrfs, wheezy #mundy: # address: 192.25.206.62 # parents: gw-ftcollins # hostgroups: computers, buildd, hassrvfs, sw-raid, acpid-hosts, wheezy spohr: address: 192.25.206.33 parents: gw-ftcollins hostgroups: computers, service, dl380, apache2-hosts, wheezy, no-bacula # }}} # {{{ gw-grnet barber: address: 194.177.211.203 parents: gw-grnet hostgroups: computers, acpid-hosts, buildd, hassrvfs, mptraid, wheezy biber: address: 194.177.211.204 parents: gw-grnet hostgroups: computers, acpid-hosts, buildd, hassrvfs, mptraid, wheezy cilea: address: 194.177.211.205 parents: gw-grnet hostgroups: computers, acpid-hosts, mptraid, hassrvfs, service, squeeze orff: address: 194.177.211.209 parents: gw-grnet hostgroups: computers, acpid-hosts, bind9-hosts, mptraid, service, hassrvfs, apache2-hosts, squeeze rautavaara: address: 194.177.211.199 parents: gw-grnet hostgroups: computers, acpid-hosts, megaraid, service, squeeze, nfs-server vitry: address: 194.177.211.206 parents: gw-grnet hostgroups: computers, acpid-hosts, mptraid, no-bacula, wheezy # }}} # {{{ gw-isc schein: address: 149.20.20.6 parents: gw-isc hostgroups: computers, service, apache2-hosts, rsyncd-hosts, acpid-hosts, dl360, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula # }}} # {{{ gw-karlsruhe zemlinsky: address: 129.143.160.6 parents: gw-karlsruhe hostgroups: computers, buildd, hassrvfs, wheezy contacts: pkern # }}} # {{{ gw-man-da ball: address: 82.195.75.70 parents: gw-man-da hostgroups: computers, buildd, hasbootfs, wheezy # bartok TODO czerny: address: 82.195.75.109 parents: gw-man-da hostgroups: computers, service, dl380, acpid-hosts, wheezy, drbd-hosts clementi: address: 82.195.75.103 parents: gw-man-da hostgroups: computers, service, dl380, acpid-hosts, wheezy, drbd-hosts bendel: address: 82.195.75.100 parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, hassrvfs, apache2-hosts, wheezy, postfix-hosts, 
heavy-postfix, acpid-hosts, apache-https, amavis-hosts, hasvarlogfs master: address: 82.195.75.110 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, spamd, heavy-exim, highload fils: address: 82.195.75.89 parents: ganeti3 hostgroups: computers, freebsd, wheezy, buildd, hassrvfs contacts: christoph fayrfax: address: 82.195.75.82 parents: ganeti3 hostgroups: computers, freebsd, wheezy, buildd, hassrvfs contacts: christoph vento: address: 82.195.75.98 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, apache-https, heavy-exim lully: address: 82.195.75.99 parents: ganeti3 hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hasvarlogfs rem: address: 82.195.75.68 parents: gw-man-da hostgroups: computers, buildd, hasbootfs, hassrvfs, wheezy unger: address: 82.195.75.102 parents: gw-man-da hostgroups: computers, service, dl360, acpid-hosts, wheezy draghi: address: 82.195.75.106 parents: ganeti3 hostgroups: computers, service, hasbootfs, hassrvfs, apache2-hosts, spamd, heavy-exim, kvmdomains, xinetd-hosts, apache-https, wheezy geo1: address: 82.195.75.105 parents: ganeti3 hostgroups: computers, service, bind9-hosts, kvmdomains, wheezy handel: address: 82.195.75.104 parents: ganeti3 hostgroups: computers, service, kvmdomains, apache2-hosts, wheezy, apache-https kaufmann: address: 82.195.75.107 parents: ganeti3 hostgroups: computers, service, apache2-hosts, rsyncd-hosts, kvmdomains, xinetd-hosts, wheezy stockhausen: address: 82.195.75.108 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, acpid-hosts, jetty-hosts ganeti3: address: 82.195.75.111 parents: gw-man-da hostgroups: notacomputer wilder: address: 82.195.75.112 parents: ganeti3 hostgroups: computers, service, hassrvfs, apache2-hosts, kvmdomains, wheezy, acpid-hosts, apache-https, rsyncd-hosts, xinetd-hosts vieuxtemps: address: 82.195.75.113 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, 
varnish-hosts mailly: address: 82.195.75.114 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, spamd, heavy-exim, mail-relay denis: address: 82.195.75.91 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy, bind9-hosts vogler: address: 82.195.75.92 parents: ganeti3 hostgroups: computers, service, kvmdomains, wheezy # }}} # {{{ gw-marist zani: address: 148.100.88.22 parents: gw-marist hostgroups: computers, buildd, hassrvfs, wheezy, incomingmailrelayed # }}} # {{{ gw-osuosl busoni: address: 140.211.15.34 parents: gw-osuosl hostgroups: computers, service, dl360, hassrvfs, acpid-hosts, wheezy, hasvarlogfs, apache2-hosts, no-bacula, apache-https byrd: address: 140.211.166.20 parents: gw-osuosl hostgroups: computers, service, dl380, acpid-hosts, wheezy buxtehude: address: 140.211.166.26 parents: byrd hostgroups: computers, service, hassrvfs, acpid-hosts, apache2-hosts, heavy-exim, postgres91-hosts, wheezy, hasvarlogfs, apache-https # malo TODO mayer: address: 140.211.166.78 parents: gw-osuosl hostgroups: computers, buildd, hasbootfs, wheezy # mayr: # address: 140.211.166.58 # parents: gw-osuosl # hostgroups: computers, buildd, hasbootfs parry: address: 140.211.15.153 parents: gw-osuosl hostgroups: computers, wheezy, buildd, hassrvfs partch: address: 140.211.15.152 parents: gw-osuosl hostgroups: computers, wheezy, hassrvfs, porterbox rietz: address: 140.211.166.43 parents: gw-osuosl hostgroups: computers, service, rsyncd-hosts, dl385, hassrvfs, acpid-hosts, xinetd-hosts, wheezy #, bosserver rietz2: address: 140.211.166.44 parents: rietz hostgroups: secondary-IPs # zee TODO # }}} # {{{ gs-rapidswitch caballero: address: 193.201.200.200 parents: gw-rapidswitch hostgroups: computers, buildd, sw-raid, wheezy, hassrvfs, acpid-hosts # }}} # {{{ gw-sanger sibelius: address: 193.62.202.28 parents: gw-sanger hostgroups: computers, acpid-hosts, postgres91-hosts, service, apache2-hosts, sw-raid, squeeze, rsyncd-hosts, xinetd-hosts, hasvarlogfs 
contacts: tjrc1, dave smetana: address: 193.62.202.29 parents: gw-sanger hostgroups: computers, porterbox, sw-raid, sparc, wheezy contacts: tjrc1, dave # }}} # {{{ gw-scanplus lobos: address: 212.211.132.250 parents: gw-scanplus-lobos hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula villa: address: 212.211.132.32 parents: gw-scanplus-villa hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula # }}} # {{{ gw-sil beethoven: address: 86.59.118.146 parents: gw-sil hostgroups: computers, hasbootfs, aacraid, service, acpid-hosts, wheezy eder: address: 86.59.118.151 parents: gw-sil hostgroups: computers, porterbox, wheezy, hassrvfs eysler: address: 86.59.118.152 parents: gw-sil hostgroups: computers, buildd, wheezy eberlin: address: 86.59.118.155 parents: gw-sil hostgroups: computers, buildd, wheezy # }}} # {{{ gw-ubcece sw-ubcece: hostgroups: layer2-infrastructure contacts: lfilipoz pingable: false check_command: dsa_check_always_ok sw-ubcece-mcld: hostgroups: layer2-infrastructure parents: sw-ubcece contacts: lfilipoz pingable: false check_command: dsa_check_always_ok sw-ubcece-kais: hostgroups: layer2-infrastructure parents: sw-ubcece contacts: lfilipoz pingable: false check_command: dsa_check_always_ok spontini: address: 206.12.19.14 parents: sw-ubcece-mcld hostgroups: computers, buildd, hasbootfs, hassrvfs, sparc, wheezy contacts: lfilipoz ravel: address: 206.12.19.5 parents: sw-ubcece-kais hostgroups: computers, general, dl385, apache2-hosts, acpid-hosts, hasbootfs, nfs-client, rsyncd-hosts, bind9-hosts, uploadqueue, hasorgfs, heavy-exim, xinetd-hosts, wheezy, autofs dijkstra: address: 206.12.19.218 parents: sw-ubcece-kais hostgroups: computers, bl460, acpid-hosts, service, wheezy, drbd-hosts pasquini: address: 206.12.19.217 parents: sw-ubcece-kais hostgroups: computers, bl460, 
acpid-hosts, service, wheezy, drbd-hosts luchesi: address: 206.12.19.214 parents: sw-ubcece-kais hostgroups: computers, bl460, acpid-hosts, service, wheezy, drbd-hosts tristano: address: 206.12.19.213 parents: sw-ubcece-kais hostgroups: computers, bl460, acpid-hosts, service, wheezy, drbd-hosts boito: address: 206.12.19.216 parents: sw-ubcece-kais hostgroups: computers, bl460, acpid-hosts, service, wheezy, drbd-hosts bertali: address: 206.12.19.212 parents: sw-ubcece-kais hostgroups: computers, bl460, acpid-hosts, service, wheezy, drbd-hosts ganeti2: address: 206.12.19.23 parents: sw-ubcece-kais hostgroups: notacomputer tchaikovsky: address: 206.12.19.118 parents: ganeti2 hostgroups: computers, general, apache2-hosts, hasbootfs, kvmdomains, apache-https, wheezy wolkenstein: address: 206.12.19.116 parents: ganeti2 hostgroups: computers, hasbootfs, hassrvfs, kvmdomains, service, xinetd-hosts, rsyncd-hosts, apache2-hosts, wheezy brahms: address: 206.12.19.115 parents: ganeti2 hostgroups: computers, buildd, hassrvfs, kvmdomains, wheezy geo2: address: 206.12.19.113 parents: ganeti2 hostgroups: computers, service, bind9-hosts, kvmdomains, wheezy stabile: address: 206.12.19.13 parents: sw-ubcece-kais hostgroups: computers, hashomefs, sw-raid, rsyncd-hosts, apache2-hosts, xinetd-hosts, service, nfs-server, squeeze, hassrvfs respighi: address: 206.12.19.11 parents: sw-ubcece-kais hostgroups: computers, hasbootfs, aacraid, hassrvfs, service, apache2-hosts, squeeze # MSA 2000 (2012i) giustini: address: 192.168.2.6 parents: dijkstra hostgroups: notacomputer # unless we implement runfrom for host alive checks pingable: false check_command: dsa_check_always_ok falla: address: 206.12.19.117 parents: ganeti2 hostgroups: computers, freebsd, hassrvfs, porterbox, wheezy fano: address: 206.12.19.110 parents: ganeti2 hostgroups: computers, freebsd, wheezy, buildd, hassrvfs contacts: christoph finzi: address: 206.12.19.111 parents: ganeti2 hostgroups: computers, freebsd, wheezy, buildd, 
hassrvfs contacts: christoph fischer: address: 206.12.19.112 parents: ganeti2 hostgroups: computers, freebsd, hassrvfs, porterbox, wheezy gabrielli: address: 206.12.19.17 parents: sw-ubcece-kais hostgroups: computers, porterbox, wheezy corelli: address: 206.12.19.16 parents: sw-ubcece-kais hostgroups: computers, buildd, wheezy lucatelli: address: 206.12.19.15 parents: sw-ubcece-kais hostgroups: computers, buildd, wheezy rossini: address: 206.12.19.19 parents: sw-ubcece-kais hostgroups: computers, dl585, acpid-hosts, service, wheezy salieri: address: 206.12.19.20 parents: sw-ubcece-kais hostgroups: computers, dl585, acpid-hosts, service, wheezy traetta: address: 206.12.19.21 parents: sw-ubcece-kais hostgroups: computers, dl585, acpid-hosts, service, wheezy # locke: # address: 206.12.19.120 # parents: sw-ubcece-kais # hostgroups: computers, service, hasbootfs, kvmdomains, squeeze, hasvicepa lotti: address: 206.12.19.121 parents: sw-ubcece-kais hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hassrvfs quantz: address: 206.12.19.122 parents: traetta hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, hassrvfs, nfs-client, xinetd-hosts, heavy-exim, apache2-hosts, autofs nono: address: 206.12.19.123 parents: traetta hostgroups: computers, service, kvmdomains, wheezy, heavy-exim, xinetd-hosts, apache2-hosts, apache-https, broken_https_default_vhost reger: address: 206.12.19.124 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, apache-https, heavy-exim danzi: address: 206.12.19.125 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, postgres91-hosts, xinetd-hosts glinka: address: 206.12.19.126 parents: traetta hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, nfs-client, autofs, xinetd-hosts tye: address: 206.12.19.129 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, heavy-exim, apache2-hosts, nfs-client, autofs, hassrvfs elgar: address: 206.12.19.130 parents: 
salieri hostgroups: computers, service, kvmdomains, wheezy gombert: address: 206.12.19.132 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, heavy-exim, apache2-hosts jenkins: address: 206.12.19.133 parents: salieri hostgroups: computers, service, kvmdomains, wheezy blavet: address: 206.12.19.134 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, xinetd-hosts, nfs-client, autofs barriere: address: 206.12.19.135 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, porterbox diabelli: address: 206.12.19.136 parents: traetta hostgroups: computers, service, hasbootfs, kvmdomains, wheezy, apache2-hosts, apache-https, broken_https_default_vhost bizet: address: 206.12.19.137 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, no-bacula lilburn: address: 206.12.19.138 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, nfs-client, autofs popov: address: 206.12.19.119 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, nfs-client, autofs, heavy-exim beach: address: 206.12.19.140 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, apache2-hosts, xinetd-hosts, hassrvfs, nfs-server, rsyncd-hosts, no-bacula, apache-https ullmann: address: 206.12.19.141 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, postgres91-hosts, nfs-client, apache2-hosts, autofs, apache-https sonntag: address: 206.12.19.142 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, nfs-client, autofs menotti: address: 206.12.19.143 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, hassrvfs, apache2-hosts, apache-https muffat: address: 206.12.19.146 parents: ganeti2 hostgroups: computers, service, kvmdomains, wheezy, spamd, heavy-exim, mail-relay # }}} # {{{ gw-ugent ancina: address: 157.193.39.13 parents: gw-ugent hostgroups: computers, buildd, hassrvfs, hasbootfs, 
incomingmailrelayed2025, xinetd-hosts, wheezy contacts: luk # }}} # {{{ gw-umn saens: address: 128.101.240.212 parents: gw-umn hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, hasvarfs, hasusrfs, hasorgfs, xinetd-hosts, wheezy, security_mirror, no-bacula # }}} # {{{ gw-utwente klecker: address: 130.89.148.10 parents: gw-utwente hostgroups: computers, service, apache2-hosts, rsyncd-hosts, dl380, acpid-hosts, xinetd-hosts, wheezy, incomingmailrelayed2025, hassrvfs klecker-ftp: address: 130.89.148.12 parents: klecker hostgroups: secondary-IPs klecker-archive: address: 130.89.148.13 parents: klecker hostgroups: secondary-IPs klecker-static: address: 130.89.148.14 parents: klecker hostgroups: secondary-IPs # }}} # {{{ gw-ynic hildegard: address: 144.32.168.74 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow, buildd howells: address: 144.32.168.75 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow, buildd hummel: address: 144.32.168.76 parents: gw-ynic hostgroups: computers, hasbootfs, hassrvfs, armhf, wheezy, deadslow, buildd porpora: address: 144.32.168.78 parents: gw-ynic hostgroups: computers, buildd, sw-raid, hassrvfs, wheezy poulenc: address: 144.32.168.77 parents: gw-ynic hostgroups: computers, buildd, sw-raid, hassrvfs, wheezy # }}} # {{{ gw-zivit zandonai: address: 80.245.147.46 parents: gw-zivit hostgroups: computers, buildd, hassrvfs, wheezy zelenka: address: 80.245.147.40 parents: gw-zivit hostgroups: computers, porterbox, hassrvfs, wheezy # }}} # }}} ############################# # host groups # # hostgroups ircd and all are automatically defined # ############################# hostgroups: computers: alias: computers private: 1 layer2-infrastructure: alias: Layer 2 Devices extinfo-icon_image: base/switch40.png extinfo-icon_image_alt: switch layer3-infrastructure: alias: Layer 3 Devices extinfo-icon_image: base/switch40.png extinfo-icon_image_alt: router notacomputer: 
alias: Systems that are not really systems. Yeah :) private: 1 deadslow: alias: Systems too slow to run any real checks freebsd: alias: freebsd private: 1 armhf: alias: armhf private: 1 sparc: alias: sparc private: 1 porterbox: alias: developer accessible porter machines extinfo-icon_image: base/debian.png extinfo-icon_image_alt: Debian GNU/Linux extinfo-notes_url: http://db.debian.org/machines.cgi?host=%s service: alias: machines running services extinfo-icon_image: base/debian.png extinfo-icon_image_alt: Debian GNU/Linux extinfo-notes_url: http://db.debian.org/machines.cgi?host=%s buildd: alias: buildd systems extinfo-icon_image: base/debian.png extinfo-icon_image_alt: Debian GNU/Linux extinfo-notes_url: http://db.debian.org/machines.cgi?host=%s general: alias: general purpose developer accessible machines extinfo-icon_image: base/debian.png extinfo-icon_image_alt: Debian GNU/Linux extinfo-notes_url: http://db.debian.org/machines.cgi?host=%s dl380: alias: HP DL380 hosts private: 1 dl385: alias: HP DL385 hosts private: 1 dl360: alias: HP DL360 hosts private: 1 bl460: alias: HP BL460 blades private: 1 bm-bl: alias: HP blades at bytemark private: 1 dl585: alias: HP DL385 hosts private: 1 sw-raid: alias: Hosts with Linux software raid private: 1 aacraid: alias: Hosts with Adaptec AACraid private: 1 # megactl: # alias: Hosts with LSI Logic MegaRAID, but not usable with megaraid check # private: 1 megaraid: alias: Hosts with LSI Logic MegaRAID private: 1 mptraid: alias: Hosts with LSI Logic Fusion-MPT private: 1 squeeze: alias: Hosts running squeeze wheezy: alias: Hosts running wheezy kvmdomains: alias: Hosts that are KVM domains private: 1 drbd-hosts: alias: hosts running drbd postfix-hosts: alias: hosts running postfix instead of exim private: 1 heavy-exim: alias: "hosts running the full mail stuff, including clamav and postgrey" private: 1 mail-relay: alias: "relays usually are hosts with more exim processes" private: 1 spamd: alias: "hosts running spamassassin as 
daemon" private: 1 heavy-postfix: alias: "postfix hosts running the full mail stuff, including clamav, SA, postgrey, policyd-weight" private: 1 apache2-hosts: alias: hosts running apache2 private: 1 jetty-hosts: alias: hosts running jetty private: 1 varnish-hosts: alias: hosts running varnish private: 1 bind9-hosts: alias: hosts running bind9 private: 1 # once every host runs unbound, do away with this group and check "computers" instead unbound-hosts: alias: hosts running unbound private: 1 amavis-hosts: alias: hosts running amavis private: 1 #tftpd-hosts: # alias: hosts running a tftpd (tftpd-hpa as a daemon) # private: 1 rsyncd-hosts: alias: hosts providing rsync services via xinetd private: 1 xinetd-hosts: alias: hosts providing services via xinetd private: 1 #postgres81-hosts: # alias: hosts running postgres81 # private: 1 postgres91-hosts: alias: hosts running postgres91 private: 1 no-ulogd: alias: hosts not running ulogd private: 1 acpid-hosts: alias: hosts running acpid private: 1 uploadqueue: alias: hosts that are an anonymous ftp uploadqueue private: 1 bosserver: alias: hosts running bosserver private: 1 apache-https: alias: hosts with https services private: 1 no-bacula: alias: hosts which are not being backed up with bacula private: 1 nfs-client: alias: hosts mounting filesystems using NFS private: 1 nfs-server: alias: hosts serving filesystems using NFS private: 1 autofs: alias: hosts running the automounter private: 1 highload: alias: "hosts on which high load is normal" private: 1 secondary-IPs: alias: secondary IP addresses private: 1 hasbootfs: alias: hosts with a /boot filesystem private: 1 hassrvfs: alias: hosts with a /srv filesystem private: 1 hasorgfs: alias: hosts with a /org filesystem private: 1 hashomefs: alias: hosts with a /home filesystem private: 1 hasvarfs: alias: hosts with a /var filesystem private: 1 hasvarlogfs: alias: hosts with a /var/log filesystem private: 1 hasusrfs: alias: hosts with a /usr filesystem private: 1 # hasvicepa: 
#    alias: hosts with a /vicepa
#    private: 1
  # Hosts that do not accept mail on port 25; the services list probes them
  # on the submission port (587) instead.
  incomingmailrelayed:
    alias: incoming mail needs to go through a mail relay  # i.e. no port 25
    private: 1
  # Same situation, but the services list probes these hosts on port 2025.
  incomingmailrelayed2025:
    alias: incoming mail needs to go through a mail relay  # i.e. no port 25; checked on port 2025
    private: 1
  # Excluded from the "network service - ntp" check.
  ntpsuckers:
    alias: "hosts whose ntp offset is often unknown"
    private: 1
  # Excluded from every samhain process/status check.
  brokensamhain:
    alias: machines that can not run samhain
    private: 1
  # Gets its own PING service with relaxed round-trip thresholds.
  high-RTT:
    alias: machines with high round trip times
    private: 1
  security_mirror:
    alias: hosts that are security mirrors
    private: 1

#############################
# servicegroups
#############################
# Each service below may name one of these groups in its "servicegroups" key.
servicegroups:
  diskspace:
    alias: diskusage checks
  buildd:
    alias: buildd checks
  raid:
    alias: raid checks
  backup:
    alias: backup checks
  kernel:
    alias: kernel checks
  apt:
    alias: apt upgrade status
  samhain:
    alias: samhain integrity status
  time:
    alias: time stuff
  # Umbrella group: pulls in the members of apt, kernel and samhain.
  security:
    alias: security
    servicegroup_members: apt, kernel, samhain

#############################
# services
#############################
services:
  # Three PING variants with progressively looser limits; a host matches
  # exactly one of them through hostgroups/excludehostgroups.
  # NOTE(review): the two check_ping arguments look like
  # "warning!critical" as "rtt-ms,packet-loss%" - confirm against the
  # check_ping command definition.
  -
    name: PING
    check: "check_ping!350.0,20%!600.0,40%"
    hostgroups: pingable
    excludehostgroups: layer3-infrastructure, high-RTT
    normal_check_interval: 5
    max_check_attempts: 4
    retry_check_interval: 1
  -
    name: PING
    check: "check_ping!600.0,20%!900.0,40%"
    hostgroups: high-RTT
    normal_check_interval: 5
    max_check_attempts: 4
    retry_check_interval: 1
  -
    name: PING
    check: "check_ping!2000.0,60%!3000.0,80%"
    hostgroups: layer3-infrastructure
    normal_check_interval: 5
    max_check_attempts: 4
    retry_check_interval: 1

  ############ Services ############
  ###

  ############ Disk Usage ############
  ####
  # check_disk is called in two forms here:
  #   -w N% -c N%   limits on the percentage of space still FREE
  #   WARN CRIT     two bare numbers: limits on the percentage of space USED
  # In the bare-number form the first (warning) value must be the smaller
  # one, otherwise the critical state is reached before the warning state.
  -
    name: disk usage - all
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk -w 5% -c 2% -A -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs --ignore-eregi-path='/home/buildd/build-tr|/var/lib/schroot/mount'"
    hostgroups: computers
    excludehosts: sibelius,stabile
  -
    name: disk usage - all
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk -w 5% -c 3% -A -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs --ignore-eregi-path=/srv/snapshot.debian.org"
    hosts: stabile
  -
    name: disk usage - all
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk -X devpts -X proc -X linprocfs -X devfs -X fdescfs -X sysfs -X nfs 95 98"
    hosts: sibelius
  -
    name: disk usage on /
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 90 95 /"
    hostgroups: computers
    excludehosts: spohr
  -
    name: disk usage on /
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 90 93 /"
    hosts: spohr
  -
    name: disk usage on /boot
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 85 /boot"
    hostgroups: hasbootfs
  -
    name: disk usage on /var
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var"
    hostgroups: hasvarfs
  -
    name: disk usage on /org
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 80 90 /org"
    hostgroups: hasorgfs
  -
    name: disk usage on /srv
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv"
    hostgroups: hassrvfs
  -
    name: disk usage on /tmp
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 60 80 /tmp"
    hosts: saens
  -
    name: disk usage on /usr
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /usr"
    hostgroups: hasusrfs
  -
    name: disk usage on /home
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /home"
    hostgroups: hashomefs
  -
    name: disk usage on /var/lib/postgresql
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/lib/postgresql"
    hosts: sibelius, busoni, buxtehude
  -
    name: disk usage on /var/log
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/log"
    hostgroups: hasvarlogfs
  -
    name: disk usage on /var/spool/postfix
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 90 /var/spool/postfix"
    hosts: bendel
  -
    name: disk usage on /srv/mirrors
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 95 98 /srv/mirrors"
    hosts: beethoven, sibelius
  -
    name: disk usage on /srv/snapshot.debian.org
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 98 99 /srv/snapshot.debian.org"
    hosts: stabile
  -
    name: disk usage on /srv/snapshot.debian.org
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 90 94 /srv/snapshot.debian.org"
    hosts: sibelius
  -
    name: disk usage on /srv/farm-snapshot/farm-misc
    servicegroups: diskspace
    # warning (95% used) has to come before critical (97% used)
    nrpe: "/usr/lib/nagios/plugins/check_disk 95 97 /srv/farm-snapshot/farm-misc"
    hosts: sibelius
  -
    name: disk usage on /var/lib/postgresql/9.1
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 85 /var/lib/postgresql/9.1"
    hosts: franck
  -
    name: disk usage on /srv/ftp-master.debian.org
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/ftp-master.debian.org"
    hosts: franck
  -
    name: disk usage on /srv/pgbackup
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 75 85 /srv/pgbackup"
    hosts: franck
  -
    name: disk usage on /srv/pgbackup
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/pgbackup"
    hosts: beethoven
  -
    name: disk usage on /srv/git-backup
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/git-backup"
    hosts: beethoven
  -
    name: disk usage on /srv/da-backup
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/da-backup"
    hosts: beethoven
  -
    name: disk usage on /srv/bacula
    servicegroups: diskspace
    nrpe: "/usr/lib/nagios/plugins/check_disk 85 95 /srv/bacula"
    hosts: beethoven

  ############ All Computers ############
  ####
  -
    name: apt - security updates
    servicegroups: apt
    nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/apt"
    hostgroups: computers
    normal_check_interval: 60
    retry_check_interval: 15
  ####
  -
    name: backup
    servicegroups: backup
    nrpe: "sudo /usr/lib/nagios/plugins/dsa-check-dabackup"
    hostgroups: computers
    excludehosts: backuphost
normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 - name: backup server config servicegroups: backup nrpe: "/usr/lib/nagios/plugins/dsa-check-dabackup-server" hosts: beethoven, backuphost normal_check_interval: 60 max_check_attempts: 2 retry_check_interval: 5 - name: backup - bacula - last backup servicegroups: backup remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula $HOSTNAME$.debian.org" runfrom: dinis hostgroups: computers excludehostgroups: buildd, porterbox, no-bacula normal_check_interval: 60 retry_check_interval: 15 - name: backup - bacula - last full backup servicegroups: backup remotecheck: "/usr/lib/nagios/plugins/dsa-check-bacula -w 1080 -c 1560 $HOSTNAME$.debian.org F" runfrom: dinis hostgroups: computers excludehostgroups: buildd, porterbox, no-bacula normal_check_interval: 60 retry_check_interval: 15 - name: process - bacula-fd servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u bacula -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: computers excludehostgroups: freebsd - name: process - bacula-fd servicegroups: backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C bacula-fd -a '/usr/sbin/bacula-fd -c /etc/bacula/bacula-fd.conf'" hostgroups: freebsd #### - name: running kernel servicegroups: kernel nrpe: "/usr/lib/nagios/plugins/dsa-check-running-kernel" hostgroups: computers normal_check_interval: 60 retry_check_interval: 5 #### # - name: afs - space # hostgroups: bosserver # nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-space -H localhost" # normal_check_interval: 60 # max_check_attempts: 2 # retry_check_interval: 5 # # - name: afs - bos # hostgroups: bosserver # nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-bos -H localhost" # normal_check_interval: 60 # max_check_attempts: 2 # retry_check_interval: 5 # # - name: afs - waiting connections # hostgroups: bosserver # nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-rxdebug -H localhost" # 
normal_check_interval: 60 # max_check_attempts: 2 # retry_check_interval: 5 # #- name: afs - udebug # hostgroups: bosserver # nrpe: "/usr/lib/nagios/plugins/dsa-check-afs-udebug -H localhost" # normal_check_interval: 60 # max_check_attempts: 2 # retry_check_interval: 5 #### #- # name: puppet # nrpe: "/usr/lib/nagios/plugins/dsa-check-file_age -i 540 -f /var/lib/puppet/state/state.yaml" # hostgroups: computers #### - name: installed firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/ferm.conf" hostgroups: computers excludehostgroups: freebsd - name: puppetized firewall nrpe: "/usr/lib/nagios/plugins/dsa-check-file -w -f /etc/ferm/conf.d/defs.conf" hostgroups: computers excludehostgroups: freebsd #### - name: ganeti - job watcher paused nrpe: "/usr/lib/nagios/plugins/negate /usr/lib/nagios/plugins/dsa-check-file -f /var/lib/ganeti/watcher.pause" hostgroups: computers #### - name: process - samhain nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C samhain -a '/usr/sbin/samhain'" hostgroups: computers excludehostgroups: brokensamhain - name: samhain servicegroups: samhain nrpe: "/usr/lib/nagios/plugins/dsa-check-statusfile /var/cache/dsa/nagios/samhain" hostgroups: computers depends: process - samhain normal_check_interval: 60 retry_check_interval: 5 excludehostgroups: brokensamhain #### - name: process - acc.umu.se backup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -a 'dsmc'" hosts: sibelius #### - name: users nrpe: "/usr/lib/nagios/plugins/check_users 30 35" hostgroups: computers #### - name: load nrpe: "/usr/lib/nagios/plugins/check_load -w 30,28,26 -c 50,45,50" hostgroups: computers excludehostgroups: highload - name: load nrpe: "/usr/lib/nagios/plugins/check_load -w 140,120,100 -c 240,220,200" hostgroups: highload #### - name: uptime check nrpe: "/usr/lib/nagios/plugins/dsa-check-uptime" hostgroups: computers #### - name: processes - samhain zombies nrpe: "/usr/lib/nagios/plugins/check_procs 3 6 -s Z -u root 
-a samhain" event_handler: dsa_event_handler_restart_samhain hostgroups: computers excludehostgroups: brokensamhain - name: processes - zombies nrpe: "/usr/lib/nagios/plugins/check_procs 5 10 -s Z" hostgroups: computers #### - name: processes - total nrpe: "/usr/lib/nagios/plugins/check_procs 620 700" hostgroups: computers #### - name: swap usage - percent nrpe: "/usr/lib/nagios/plugins/check_swap -w 20% -c 10%" hostgroups: computers #### - name: swap usage - mb nrpe: "/usr/lib/nagios/plugins/check_swap -w 20000 -c 5000" hostgroups: computers #### - name: process - getty nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:8 -c 1: -u root -C getty -a /sbin/getty" hostgroups: computers excludehosts: zelenka, zandonai #### - name: process - sshd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:20 -c 1: -u root -C sshd -a '/usr/sbin/sshd'" hostgroups: computers - name: "network service - sshd" check: dsa_check_ssh hostgroups: computers depends: process - sshd normal_check_interval: 60 notification_interval: 1440 #### - name: network service - nrpe check: check_tcp!5666 hostgroups: computers max_check_attempts: -2 notification_interval: 1440 - name: process - nrpe nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u nagios -C nrpe -a '/usr/sbin/nrpe -c /etc/nagios/nrpe.cfg -d'" hostgroups: computers max_check_attempts: -1 depends: network service - nrpe ### - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a '/usr/sbin/munin-node'" hostgroups: computers excludehostgroups: freebsd, armhf - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C perl -a '/usr/bin/perl -wT /usr/sbin/munin-node'" hostgroups: freebsd - name: process - munin-node nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C munin-node -a 'munin-node'" hostgroups: wheezy excludehostgroups: freebsd - name: network service - munin-node check: check_tcp!4949 hostgroups: computers depends: 
process - munin-node ### - name: process - ntpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -p 1 -C ntpd -a '/usr/sbin/ntpd -p /var/run/ntpd.pid'" hostgroups: computers servicegroups: time - name: network service - ntp check: dsa_check_ntp hostgroups: computers depends: process - ntpd excludehosts: ancina excludehostgroups: ntpsuckers, deadslow servicegroups: time # - name: network service - time check: dsa_check_time hosts: ancina depends: process - xinetd servicegroups: time ### - name: process - atd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C atd -a /usr/sbin/atd" hostgroups: computers ### - name: process - cron nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u root -C cron -a /usr/sbin/cron" hostgroups: computers ### - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: computers excludehostgroups: freebsd - name: process - syslog-ng nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:2 -c 2: -u root -C syslog-ng -a '/sbin/syslog-ng -p /var/run/syslog-ng.pid'" hostgroups: freebsd - name: remote logging on lotti remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" runfrom: lotti hostgroups: computers - name: remote logging on lully remotecheck: "/usr/lib/nagios/plugins/dsa-check-log-age-loghost $HOSTNAME$" runfrom: lully hostgroups: computers - name: MQ connection on rainier remotecheck: "/usr/lib/nagios/plugins/dsa-check-mq-connection $HOSTNAME$ ud dsa" runfrom: rainier hostgroups: computers normal_check_interval: 60 retry_check_interval: 15 - name: MQ connection on rapoport remotecheck: "/usr/lib/nagios/plugins/dsa-check-mq-connection $HOSTNAME$ ud dsa" runfrom: rapoport hostgroups: computers normal_check_interval: 60 retry_check_interval: 15 ### MAIL STUFF ### - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd 
-q'" hostgroups: computers excludehostgroups: postfix-hosts, mail-relay excludehosts: master, busoni, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:25 -c 1: -u Debian-exim -C exim4 -a '/usr/sbin/exim4 -bd -q'" hostgroups: mail-relay - name: process - exim - total nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1: -C exim4" hostgroups: computers excludehostgroups: postfix-hosts excludehosts: master, busoni, quantz, buxtehude - name: process - exim nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:300 -c 1:500 -C exim4 -a '/usr/sbin/exim4'" hosts: master, busoni, quantz, buxtehude - name: mail queue nrpe: "/usr/lib/nagios/plugins/check_mailq -M exim -w 1000 -c 2000" hostgroups: heavy-exim ### - name: process - clamav - clamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:2 -c 1: -u clamav -C clamd -a '/usr/sbin/clamd'" hostgroups: heavy-exim, heavy-postfix - name: service - clamav nrpe: "/usr/lib/nagios/plugins/check_clamd -H /var/run/clamav/clamd.ctl" hostgroups: heavy-exim, heavy-postfix depends: process - clamav - clamd - name: process - clamav - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u clamav -C freshclam -a '/usr/bin/freshclam -d --quiet'" hostgroups: heavy-exim, heavy-postfix - name: unwanted process - clamav nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C clamd" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix, deadslow - name: unwanted process - freshclam nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C freshclam" hostgroups: computers excludehostgroups: heavy-exim, heavy-postfix, deadslow ### - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hostgroups: spamd excludehosts: picconi excludehostgroups: deadslow - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u 
root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 20 --min-spare=5 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hosts: picconi - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C spamd -a '/usr/sbin/spamd --create-prefs --max-children 10 --helper-home-dir -d --pidfile=/var/run/spamd.pid'" hosts: bendel - name: process - spamd - child nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:11 -c 1: -C spamd -a 'spamd child'" hosts: bendel hostgroups: spamd depends: process - spamd - master # - name: process - spamd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u debbugs -C spamd -a '/usr/sbin/spamd -d '" hosts: buxtehude - name: process - spamd - child nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u debbugs -C spamd -a 'spamd child'" hosts: buxtehude # - name: unwanted process - spamd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C spamd" hostgroups: computers excludehostgroups: spamd, deadslow excludehosts: bendel, busoni, buxtehude ### #- # name: process - greylistd # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u greylist -C greylistd -a '/usr/bin/python /usr/sbin/greylistd'" # hostgroups: heavy-exim # - name: unwanted process - greylistd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C greylistd" hostgroups: computers excludehostgroups: deadslow ### - name: process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --unix=/var/run/postgrey/socket --retry-window=4 --auto-whitelist-clients=10 --exim'" hostgroups: heavy-exim - name: process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgrey -a '/usr/sbin/postgrey --pidfile=/var/run/postgrey.pid --daemonize --inet=127.0.0.1:60000'" hostgroups: heavy-postfix # - name: unwanted process - postgrey nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C postgrey" hostgroups: computers 
excludehostgroups: heavy-postfix, heavy-exim, deadslow ### - name: process - amavis - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u amavis -a 'amavisd-new (master)'" hostgroups: amavis-hosts - name: process - amavis - all nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1:10 -u amavis -a 'amavisd-new '" hostgroups: amavis-hosts depends: process - amavis - master # - name: unwanted process - amavis nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C amavisd-new" hostgroups: computers excludehostgroups: amavis-hosts, deadslow ### - name: process - weightd - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u polw -a 'policyd-weight (master)'" hostgroups: heavy-postfix - name: process - weightd - cache nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u polw -a 'policyd-weight (cache)'" hostgroups: heavy-postfix depends: process - weightd - master - name: process - weightd - child nrpe: "/usr/lib/nagios/plugins/check_procs -w 2:50 -c 1: -u polw -a 'policyd-weight (child)'" hostgroups: heavy-postfix depends: process - weightd - master ### - name: unwanted process - policyd-weight nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C policyd-weight" hostgroups: computers excludehostgroups: heavy-postfix, deadslow ### - name: process - postfix - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C master -a '/usr/lib/postfix/master'" hostgroups: postfix-hosts - name: process - postfix - qmgr nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C qmgr -a 'qmgr -l -t fifo -u'" hostgroups: postfix-hosts depends: process - postfix - master #- # name: process - postfix - tlsmgr # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C tlsmgr -a 'tlsmgr -l -t fifo -u'" # hostgroups: postfix-hosts # depends: process - postfix - master - name: process - postfix - pickup nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postfix -C pickup -a 'pickup -l -t fifo -u -c'" 
hostgroups: postfix-hosts depends: process - postfix - master - name: process - postfix - anvil nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:1 -c 0: -u postfix -C anvil -a 'anvil -l -t unix -u'" hostgroups: postfix-hosts depends: process - postfix - master - name: process - postfix - trivial-rewrite nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:10 -c 0:15 -u postfix -C trivial-rewrite -a 'trivial-rewrite -n rewrite -t unix -u -c'" hostgroups: postfix-hosts depends: process - postfix - master - name: process - postfix - proxymap nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:10 -c 0:15 -u postfix -C proxymap -a 'proxymap -t unix -u'" hostgroups: postfix-hosts depends: process - postfix - master - name: process - postfix - cleanup nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:30 -c 0:50 -u postfix -C cleanup -a 'cleanup -z -t unix -u -c'" hostgroups: postfix-hosts depends: process - postfix - master - name: process - postfix - local nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:30 -c 0:50 -u postfix -C local -a 'local -t unix'" hostgroups: postfix-hosts depends: process - postfix - master - name: unwanted process - openvpn nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C openvpn" hostgroups: computers normal_check_interval: 120 ### - name: network service - smtp check: dsa_check_smtp hostgroups: computers excludehostgroups: postfix-hosts, incomingmailrelayed, incomingmailrelayed2025 depends: process - exim - name: network service - smtp check: dsa_check_smtp hostgroups: postfix-hosts depends: process - postfix - master - name: network service - submission check: dsa_check_smtp_port!587 hostgroups: incomingmailrelayed depends: process - exim - name: network service - smtp 2025 check: dsa_check_smtp_port!2025 hostgroups: incomingmailrelayed2025 depends: process - exim - name: network service local - smtps cert nrpe: "/usr/lib/nagios/plugins/check_http -H localhost -p 465 -S -C 14 -t 45" hostgroups: postfix-hosts depends: process - postfix - master 
normal_check_interval: 120 - name: setup - dsa config nrpe: "/usr/lib/nagios/plugins/dsa-check-config" hostgroups: computers normal_check_interval: 60 - name: setup - local hostname etc-hosts nrpe: 'if getent ahosts `hostname` | grep -q 127.0; then echo "Warning: local hostname resolves to 127/8 address"; exit 1; else echo "OK: Hostname resolves to non-127/8 address."; exit 0; fi' hostgroups: computers normal_check_interval: 60 - name: system - available entropy nrpe: "/usr/lib/nagios/plugins/dsa-check-entropy" event_handler: dsa_event_handler_restart_ekey hostgroups: computers excludehostgroups: freebsd - name: system - filesystem check nrpe: "/usr/bin/sudo /usr/lib/nagios/plugins/dsa-check-filesystems" normal_check_interval: 60 retry_check_interval: 15 hostgroups: computers ### - name: local resolver nrpe: "/usr/lib/nagios/plugins/dsa-check-resolver www.debian.org www.google.com" hostgroups: computers normal_check_interval: 60 - name: process - unbound nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u unbound -C unbound -a '/usr/sbin/unbound'" hostgroups: unbound-hosts, squeeze, wheezy ### - name: process - uptimed nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u daemon -C uptimed -a '/usr/sbin/uptimed'" hostgroups: computers ### - name: unwanted process - irqbalance nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C irqbalance" hostgroups: computers excludehostgroups: deadslow #### ### #- # name: unwanted process - system-tools-backends # nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C system-tools-ba" # hostgroups: computers #- # name: unwanted process - dbus-daemon # nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C dbus-daemon" # hostgroups: computers - name: unwanted process - gkrellmd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C gkrellmd" hostgroups: computers excludehostgroups: deadslow - name: unwanted process - rpc.statd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C rpc.statd" hostgroups: computers 
excludehostgroups: nfs-client, nfs-server, deadslow - name: unwanted process - inetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C inetd" hostgroups: computers excludehosts: abel, alwyn excludehostgroups: deadslow - name: unwanted process - snmpd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C snmpd" hostgroups: computers excludehostgroups: deadslow #### - name: "host SSL cert" nrpe: "if [ -e /etc/ssl/certs/thishost.pem ]; then /usr/lib/nagios/plugins/dsa-check-cert-expire /etc/ssl/certs/thishost.pem; else echo 'No thishost.pem on this host.'; fi" hostgroups: computers ############ Processes/Services that only run on some computers ############ #### ### - name: process - rngd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rngd -a '/usr/sbin/rngd -r /dev/hwrng'" hostgroups: dl385 ### - name: process - mdadm monitor servicegroups: raid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /var/run/mdadm/monitor.pid --daemonise --scan'" hostgroups: sw-raid excludehostgroups: wheezy - # wheezy: name: process - mdadm monitor servicegroups: raid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C mdadm -a '/sbin/mdadm --monitor --pid-file /run/mdadm/monitor.pid --daemonise --scan'" hostgroups: sw-raid excludehostgroups: squeeze - name: RAID - sw raid servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-sw" hostgroups: sw-raid ### - name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C ud-replicated -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: computers excludehostgroups: squeeze,freebsd - name: process - ud-replicated nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C python2.7 -a '/usr/bin/python /usr/bin/ud-replicated'" hostgroups: freebsd - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/sbin/monit -d 300 -I -c 
/etc/monit/monitrc -s /var/lib/monit/monit.state'" hostgroups: squeeze - name: process - monit nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C monit -a '/usr/bin/monit -d 300 -I -c /etc/monit/monitrc -s /var/lib/monit/monit.state'" hostgroups: computers excludehostgroups: squeeze - name: HW - hpacucli status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460 excludehosts: schein, rietz - name: HW - hpacucli status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-controller-ok --ignore-controller='P700m'" normal_check_interval: 120 hostgroups: bm-bl - name: HW - hpacucli status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --no-battery" normal_check_interval: 120 hosts: schein, rietz - name: HW - hpacucli enclosure status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli-enclosure 1 1E:1" normal_check_interval: 120 hosts: franck - name: HW - hpacucli status servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-hpacucli --ignore-transfer-speed=1I:1:1 --ignore-transfer-speed=1I:1:2" normal_check_interval: 120 hostgroups: dl585 ### - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm" normal_check_interval: 120 hostgroups: dl385, dl380, dl360, bl460, dl585, bm-bl excludehosts: villa, lobos, senfl, schein - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --ps-no-redundant" normal_check_interval: 120 hosts: villa, lobos - name: HW - hpasmcli status nrpe: "/usr/lib/nagios/plugins/dsa-check-hpasm --fan-no-redundant" normal_check_interval: 120 hosts: senfl, schein ### - name: RAID - 3ware servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-3ware" hosts: powell ### - name: RAID - aacraid servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-aacraid" hostgroups: aacraid ### - name: RAID - megaraid servicegroups: raid nrpe: 
"/usr/lib/nagios/plugins/dsa-check-raid-megaraid" hostgroups: megaraid ### #- # name: RAID - 3ware # servicegroups: raid # nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-3ware" # hosts: puccini ### - name: RAID - MPT servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-mpt" hostgroups: mptraid ### # - # name: RAID - megactl # servicegroups: raid # nrpe: "/usr/lib/nagios/plugins/dsa-check-raid-megactl" # hostgroups: megactl ### - name: RAID - DRBD servicegroups: raid nrpe: "/usr/lib/nagios/plugins/dsa-check-drbd -d All" hostgroups: drbd-hosts ### - name: process - slapd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:20 -c 1:50 -u openldap -C slapd -a '/usr/sbin/slapd -h ldap:/// ldaps:/// -g openldap -u openldap'" hosts: draghi - name: network service - ldaps cert check: dsa_check_cert!636 depends: process - slapd normal_check_interval: 60 hosts: draghi ### - name: process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C ulogd -a '/usr/sbin/ulogd -d'" hostgroups: computers excludehostgroups: freebsd, sparc - name: unexpected process - ulogd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C ulogd" hostgroups: freebsd, sparc ### - name: process - udevd nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -p 1 -C udevd -a 'udevd'" hostgroups: computers excludehostgroups: freebsd - name: unexpected process - udev nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C udevd" hostgroups: freebsd ### - name: process - acpid nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C acpid -a '/usr/sbin/acpid'" hostgroups: acpid-hosts - name: unexpected process - acpid nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C acpid" hostgroups: computers excludehostgroups: acpid-hosts, kvmdomains ### # - # name: process - bosserver # nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C bosserver -a '/usr/sbin/bosserver'" # hostgroups: bosserver # ### - name: process - xinetd nrpe: 
"/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C xinetd -a '/usr/sbin/xinetd -pidfile /var/run/xinetd.pid -stayalive'" hostgroups: xinetd-hosts - name: unwanted process - xinetd nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C xinetd" hostgroups: computers excludehostgroups: xinetd-hosts, deadslow ### - name: network service - finger check: check_tcp!79 hosts: draghi depends: process - xinetd ### - name: network service - rsync check: check_tcp!873 hostgroups: rsyncd-hosts depends: process - xinetd excludehosts: rietz - name: network service - rsync check: check_tcp!873 hosts: rietz2 depends: rietz:process - xinetd - name: network service - rsync check: check_tcp!873 hosts: milanollo2 depends: milanollo:process - xinetd ### - name: process - icinga # there is always one extra process per check currently running.. nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:30 -c 1: -u nagios -C icinga -a '/usr/sbin/icinga -d /etc/icinga/icinga.cfg'" hosts: tchaikovsky ### - name: process - jetty - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -a 'jsvc.exec'" hostgroups: jetty-hosts - name: process - jetty - worker nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1:100 -u jetty -a 'jsvc.exec -user jetty'" hostgroups: jetty-hosts depends: process - jetty - master ### - name: process - apache2 - master nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -a /usr/sbin/apache2" hostgroups: apache2-hosts - name: process - apache2 - worker nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:50 -c 1:100 -u www-data -a /usr/sbin/apache2" hostgroups: apache2-hosts depends: process - apache2 - master - name: unwanted process - apache2 nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C apache2" hostgroups: computers excludehostgroups: apache2-hosts, deadslow - name: network service - http check: check_http hostgroups: apache2-hosts excludehosts: klecker depends: process - apache2 - master - name: network service - http check: 
check_http depends: klecker:process - apache2 - master hosts: klecker-ftp

  # keyserver on kaufmann (HTTP check against port 11371)
  - name: "network service - http keyserver"
    check: "dsa_check_http_port!11371"
    hosts: "kaufmann"
    depends: "process - apache2 - master"

  # https on various hosts
  # The apache-https group gets check_https, except for handel and menotti
  # and the broken_https_default_vhost group, which have their own entries.
  - name: "network service - https"
    check: "check_https"
    hostgroups: "apache-https"
    excludehosts: "handel,menotti"
    excludehostgroups: "broken_https_default_vhost"
    depends: "process - apache2 - master"
    normal_check_interval: 120
  - name: "network service - https"
    check: "dsa_check_https_want_auth"
    hosts: "handel,menotti"
    depends: "process - apache2 - master"
    normal_check_interval: 120
  - name: "network service - https"
    check: "dsa_check_https_any_status"
    hostgroups: "broken_https_default_vhost"
    depends: "process - apache2 - master"
    normal_check_interval: 120
  - name: "network service - https cert"
    check: "dsa_check_cert!443"
    hostgroups: "apache-https"
    depends: "network service - https"
    normal_check_interval: 60
  # apache2-hosts that are not in apache-https are checked with
  # dsa_check_port_closed on port 443.
  - name: "unwanted network service - https"
    check: "dsa_check_port_closed!443"
    hostgroups: "apache2-hosts"
    excludehostgroups: "apache-https, deadslow"
    # ravel does ssh on port 443
    excludehosts: "ravel"
    normal_check_interval: 60

  ###
  # varnish: root-owned master process, nobody-owned worker, and HTTP
  - name: "process - varnish - master"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u root -C varnishd -a '/usr/sbin/varnishd -P /var/run/varnishd.pid -a :80 -T localhost:6082 -f /etc/varnish/default.vcl'"
    hostgroups: "varnish-hosts"
  - name: "process - varnish - worker"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1:1 -u nobody -C varnishd -a '/usr/sbin/varnishd -P /var/run/varnishd.pid -a :80 -T localhost:6082 -f /etc/varnish/default.vcl'"
    hostgroups: "varnish-hosts"
    depends: "process - varnish - master"
  - name: "network service - http"
    check: "check_http"
    hostgroups: "varnish-hosts"
    depends: "process - varnish - master"
  ###

  ####
  # bind9: named must run on bind9-hosts and nowhere else
  - name: "process - named"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:15 -c 1: -u bind -C named -a '/usr/sbin/named -u bind'"
    hostgroups: "bind9-hosts"
  - name: "network service - dns"
    check: "check_dns"
    hostgroups: "bind9-hosts"
    depends: "process - named"
  - name: "unwanted process - named"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 0:0 -C named"
    hostgroups: "computers"
    excludehostgroups: "bind9-hosts, deadslow"

  ####
  # ftp: klecker is excluded from the group check and is covered through
  # the separate klecker-ftp host entry instead
  - name: "network service - ftp"
    check: "check_ftp"
    hostgroups: "uploadqueue, security_mirror"
    excludehosts: "klecker"
  - name: "network service - ftp"
    check: "check_ftp"
    hosts: "klecker-ftp"
    depends: "klecker:process - xinetd"

  ####
  # upload queue daemon; the variant matching user dak is disabled
  #-
  #  name: process - debianqueued
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u dak -C debianqueued"
  - name: "process - debianqueued"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:3 -c 1: -u dak-unpriv -C debianqueued"
    hostgroups: "uploadqueue"

  ###
  # postgresql 8.1 checks (all disabled)
  #-
  #  name: process - postgresql81 - master
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a '/usr/lib/postgresql/8.1/bin/postmaster -D /var/lib/postgresql/8.1/main -c config_file=/etc/postgresql/8.1/main/postgresql.conf'"
  #  hostgroups: postgres81-hosts
  #-
  #  name: process - postgresql81 - writer
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: writer process'"
  #  hostgroups: postgres81-hosts
  #  depends: process - postgresql81 - master
  #-
  #  name: process - postgresql81 - buffer
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats buffer process'"
  #  hostgroups: postgres81-hosts
  #  depends: process - postgresql81 - master
  #-
  #  name: process - postgresql81 - collector
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u postgres -C postmaster -a 'postgres: stats collector process'"
  #  hostgroups: postgres81-hosts
  #  depends: process - postgresql81 - master

  ####
  # postgresql: unwanted outside postgres91-hosts; 9.0 binaries unwanted
  # on every host in the computers group
  - name: "unwanted process - postgresql"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres"
    hostgroups: "computers"
    excludehostgroups: "postgres91-hosts, deadslow"
  - name: "unwanted process - postgresql 9.0"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C postgres -a '9.0/bin/postgres'"
    hostgroups: "computers"
  - name: "process - postgresql91 - master"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u postgres -C postgres -a '/usr/lib/postgresql/9.1/bin/postgres'"
    hostgroups: "postgres91-hosts"
  - name: "postgresql backups"
    nrpe: "/usr/bin/sudo -u debbackup /usr/lib/nagios/plugins/dsa-check-backuppg"
    #hosts: beethoven
    hosts: "backuphost"
  ####

  ####
  # stunnel4 instance started with puppet-ekeyd.conf
  - name: "process - stunnel4 - puppet-ekeyd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:6 -c 1: -u stunnel4 -C stunnel4 -a '/usr/bin/stunnel4 /etc/stunnel/puppet-ekeyd.conf'"
    hostgroups: "squeeze, wheezy"
    excludehostgroups: "freebsd"

  ####
  # UPS (nut) processes and power state, all on franck
  - name: "process - UPS - nut usbhid-ups - ups1"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C usbhid-ups -a '/lib/nut/usbhid-ups -a ups1'"
    hosts: "franck"
  - name: "process - UPS - nut upsd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C upsd -a '/sbin/upsd'"
    hosts: "franck"
  - name: "process - UPS - nut upsmon master"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C upsmon -a '/sbin/upsmon'"
    hosts: "franck"
  - name: "process - UPS - nut upsmon worker"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u nut -C upsmon -a '/sbin/upsmon'"
    hosts: "franck"
    depends: "process - UPS - nut upsmon master"
  - name: "UPS - on line power"
    nrpe: "/usr/lib/nagios/plugins/dsa-check-ups"
    hosts: "franck"
    depends: "process - UPS - nut upsd"

  ###
  # buildd: fano, finzi, fils and fayrfax are matched on command name
  # "perl"; every other host in the buildd group on command name "buildd"
  - name: "process - buildd"
    servicegroups: "buildd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C perl -a '/usr/bin/buildd'"
    hosts: "fano, finzi, fils, fayrfax"
    contact_groups: "buildd"
  - name: "process - buildd"
    servicegroups: "buildd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:5 -u buildd -C buildd -a '/usr/bin/buildd'"
    hostgroups: "buildd"
    excludehosts: "fano, finzi, fils, fayrfax"
    contact_groups: "buildd"
  - name: "processes - zombie schroot"
    #nrpe: "/usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0"
    nrpe: "(/usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0 > /dev/null || /usr/lib/nagios/plugins/check_procs -a schroot -s Zs -c 0) && /usr/lib/nagios/plugins/check_procs -a schroot -s ZNs -c 0"
    hostgroups: "buildd"
    contact_groups: "+buildd"
    normal_check_interval: 5
    max_check_attempts: 24
    retry_check_interval: 5
  - name: "processes - lvcreate"
    nrpe: "/usr/lib/nagios/plugins/check_procs -m 'ELAPSED' -c 500 -C lvcreate -u root -a 'lvcreate'"
    hostgroups: "buildd"
    contact_groups: "+buildd"

  ####
  # gobby: TCP port 6523 on gombert
  - name: "network service - gobby"
    check: "check_tcp!6523"
    hosts: "gombert"
    contact_groups: "gobby"

  ####
  # tftpd check (disabled)
  #-
  #  name: process - tftpd
  #  nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C in.tftpd -a '/usr/sbin/in.tftpd -l -B 1450 -s /var/lib/tftpboot'"
  #  hostgroups: tftpd-hosts
  ###

  ############ NFS Stuff ############
  ####
  - name: "process - statd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u statd -C rpc.statd -a '/sbin/rpc.statd'"
    hostgroups: "nfs-client, nfs-server"
  - name: "process - nfsd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:10 -c 1: -u root -C nfsd -a '[nfsd]'"
    hostgroups: "nfs-server"
  - name: "process - lockd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C lockd -a '[lockd]'"
    hostgroups: "nfs-server"
  - name: "process - mountd"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C rpc.mountd -a '/sbin/rpc.mountd'"
    hostgroups: "nfs-server"
  # quantz pings 192.168.2.76 through its local nrpe agent
  - name: "nfs server glinka reachable"
    nrpe: "/usr/lib/nagios/plugins/check_ping -H 192.168.2.76 -w 50,10% -c 200,30%"
    hosts: "quantz"

  #
  # automount: wanted on the autofs group, unwanted on other computers
  - name: "process - automount"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 1:1 -c 1: -u root -C automount -a '/usr/sbin/automount'"
    hostgroups: "autofs"
  - name: "unwanted process - automount"
    nrpe: "/usr/lib/nagios/plugins/check_procs -w 0 -C automount"
    hostgroups: "computers"
    excludehostgroups: "autofs, deadslow"

  ############ MISC OTHER Stuff ############
  #####
  - name: "puppetmaster cert"
    nrpe: "/usr/lib/nagios/plugins/dsa-check-cert-expire /var/lib/puppet/ssl/certs/ca.pem"
    hosts: "handel"
    normal_check_interval: 60
    max_check_attempts: 2
    retry_check_interval: 5

  # mirror sync skew checks, attached to the "global" pseudo host
  - name: "mirror sync - bugs"
    check: "dsa_check_mirrorsync_skew!bugs.debian.org!project/trace/bugs-master.debian.org!120:600"
    hosts: "global"
  - name: "mirror sync - security"
    check: "dsa_check_mirrorsync_skew!security-nagios.debian.org!project/trace/security-master.debian.org!150:3600"
    hosts: "global"
  - name: "mirror sync - packages"
    check: "dsa_check_mirrorsync_skew!packages.debian.org!Pics/.trace!3600:57600"
    hosts: "global"
    normal_check_interval: 15
    max_check_attempts: 5
    retry_check_interval: 5
  - name: "mirror sync - snapshot"
    check: "dsa_check_mirrorsync_skew!snapshot.debian.org!project/trace/snapshot-master.debian.org!3600:28800"
    hosts: "global"
    normal_check_interval: 15
    max_check_attempts: 5
    retry_check_interval: 5

  # DNS SOA sync checks, one per zone
  - name: "DNS SOA sync - debian.org"
    check: "dsa_check_soas_add!denis.debian.org!debian.org"
    hosts: "global"
  - name: "DNS SOA sync - debian.net"
    check: "dsa_check_soas_add!denis.debian.org!debian.net"
    hosts: "global"
  - name: "DNS SOA sync - debian.com"
    check: "dsa_check_soas_add!denis.debian.org!debian.com"
    hosts: "global"
  - name: "DNS SOA sync - mirror.debian.net"
    check: "dsa_check_soas_add!denis.debian.org!mirror.debian.net"
    hosts: "global"
  - name: "DNS SOA sync - 144-28.118.59.86.in-addr.arpa"
    check: "dsa_check_soas_add!denis.debian.org!144-28.118.59.86.in-addr.arpa"
    hosts: "global"
  - name: "DNS SOA sync - alioth.debian.org"
    check: "dsa_check_soas_add!alioth.debian.org!alioth.debian.org"
    hosts: "global"

  # DNS checks executed from denis (runfrom) on behalf of "global"
  - name: "DNS - delegation and signature expiry"
    hosts: "global"
    remotecheck: "/usr/lib/nagios/plugins/dsa-check-zone-rrsig-expiration-many --warn 20d --critical 7d --geozonedir /srv/dns.debian.org/repositories/auto-dns/zones /srv/dns.debian.org/repositories/domains"
    runfrom: "denis"
  - name: "DNS - security delegations"
    hosts: "global"
    remotecheck: "/usr/lib/nagios/plugins/dsa-check-dnssec-delegation --dir /srv/dns.debian.org/repositories/domains --dir /srv/dns.debian.org/repositories/auto-dns/zones check-header"
    runfrom: "denis"
  - name: "DNS - key coverage"
    hosts: "global"
    remotecheck: "/usr/lib/nagios/plugins/dsa-check-statusfile /srv/dns.debian.org/var/nagios/coverage"
    runfrom: "denis"
  - name: "DNS - DS expiry"
    hosts: "global"
    remotecheck: "/usr/lib/nagios/plugins/dsa-check-statusfile /srv/dns.debian.org/var/nagios/ds"
    runfrom: "denis"

  ############
  # giustini: checks executed from dijkstra (runfrom)
  - name: "ping alive check"
    remotecheck: "/usr/lib/nagios/plugins/check_ping -H $HOSTADDRESS$ -w 50,10% -c 200,30%"
    runfrom: "dijkstra"
    hosts: "giustini"
    normal_check_interval: 5
    max_check_attempts: 4
    retry_check_interval: 1
  - name: "Overall Unit Status"
    remotecheck: "/usr/lib/nagios/plugins/check_snmp -H $HOSTADDRESS$ -C public -P 2c -o connUnitStatus -n -c 3 -w 3"
    runfrom: "dijkstra"
    hosts: "giustini"
  - name: "event log"
    remotecheck: "/usr/lib/nagios/plugins/dsa-check-msa-eventlog --start=7778 $HOSTADDRESS$ public"
    runfrom: "dijkstra"
    hosts: "giustini"

  ############
  - name: "current chroots"
    nrpe: "/usr/lib/nagios/plugins/dsa-check-dchroots-current"
    hostgroups: "porterbox"
    normal_check_interval: 60
    retry_check_interval: 15

# vim: set ts=2 sw=2 et ai si fdm=marker: