From: Matt Birkholz Date: Sun, 18 Jan 2026 23:29:40 +0000 (-0700) Subject: Add Munin and NAGIOS monitoring for Ord Mantell. X-Git-Url: https://birchwood-abbey.net/git?a=commitdiff_plain;h=6feec433c046c4c58a6fc2c709768d35248a9755;p=Network.git Add Munin and NAGIOS monitoring for Ord Mantell. --- diff --git a/README.org b/README.org index 7dfdfc4..cb49a9b 100644 --- a/README.org +++ b/README.org @@ -1417,10 +1417,11 @@ fi *** Configure NAGIOS Monitoring of The Cloister -The abbey adds monitoring for more servers: Dantooine and Kessel. -They are ~abbey-cloister~ servers, so they are configured as small -institute ~campus~ servers, like Gate, with an NRPE (a NAGIOS Remote -Plugin Executor) server and an ~inst_sensors~ command. +The abbey adds monitoring for more servers: Dantooine, Kessel and Ord +Mantell. They are ~abbey-cloister~ servers, so they are configured as +small institute ~campus~ servers, like Gate, with an NRPE (a NAGIOS +Remote Plugin Executor) server and an ~inst_sensors~ or +~abbey_pisensors~ command. The configurations for these servers are very similar to Gate's, but are idiosyncratically in flux. @@ -1436,6 +1437,7 @@ included in =private/vars-abbey.yml=. --- dantooine_addr: 10.84.138.8 kessel_addr: 10.84.138.10 +ord_mantell_addr: 10.84.138.12 #+END_SRC **** Install NAGIOS Configurations @@ -1450,7 +1452,7 @@ The following task installs each host's NAGIOS configuration. template: src: nagios-{{ item }}.cfg dest: /etc/nagios4/conf.d/{{ item }}.cfg - loop: [ dantooine, kessel ] + loop: [ dantooine, kessel, ord-mantell ] notify: Reload NAGIOS4. #+END_SRC @@ -1567,6 +1569,59 @@ define service { } #+END_SRC +**** NAGIOS Monitoring of Ord-Mantell + +#+CAPTION: [[file:roles_t/abbey-core/templates/nagios-ord-mantell.cfg][=roles_t/abbey-core/templates/nagios-ord-mantell.cfg=]] +#+BEGIN_SRC conf :tangle roles_t/abbey-core/templates/nagios-ord-mantell.cfg +define host { + use linux-server + host_name ord-mantell + address {{ ord_mantell_addr }} +} + +define service { + use generic-service + host_name ord-mantell + service_description Root Partition + check_command check_nrpe!inst_root +} + +# define service { +# use generic-service +# host_name ord-mantell +# service_description Current Load +# check_command check_nrpe!check_load +# } + +define service { + use generic-service + host_name ord-mantell + service_description Zombie Processes + check_command check_nrpe!check_zombie_procs +} + +# define service { +# use generic-service +# host_name ord-mantell +# service_description Total Processes +# check_command check_nrpe!check_total_procs +# } + +define service { + use generic-service + host_name ord-mantell + service_description Swap Usage + check_command check_nrpe!inst_swap +} + +define service { + use generic-service + host_name ord-mantell + service_description Temperature Sensors + check_command check_nrpe!abbey_pisensors +} +#+END_SRC + ** Install Munin The abbey is experimenting with Munin. NAGIOS is all about notifying @@ -1620,6 +1675,9 @@ trends in resource usage. [kessel.birchwood.private] address {{ kessel_addr }} + + [ord-mantell.birchwood.private] + address {{ ord_mantell_addr }} dest: /etc/munin/munin-conf.d/zzz-site.cfg notify: Restart Munin. diff --git a/private_ex/vars-abbey.yml b/private_ex/vars-abbey.yml index 036e5c5..9ddfe89 100644 --- a/private_ex/vars-abbey.yml +++ b/private_ex/vars-abbey.yml @@ -1,3 +1,4 @@ --- dantooine_addr: 10.84.138.8 kessel_addr: 10.84.138.10 +ord_mantell_addr: 10.84.138.12 diff --git a/roles_t/abbey-core/tasks/main.yml b/roles_t/abbey-core/tasks/main.yml index 316f850..5d4f04f 100644 --- a/roles_t/abbey-core/tasks/main.yml +++ b/roles_t/abbey-core/tasks/main.yml @@ -283,7 +283,7 @@ template: src: nagios-{{ item }}.cfg dest: /etc/nagios4/conf.d/{{ item }}.cfg - loop: [ dantooine, kessel ] + loop: [ dantooine, kessel, ord-mantell ] notify: Reload NAGIOS4. - name: Install Munin. @@ -330,6 +330,9 @@ [kessel.birchwood.private] address {{ kessel_addr }} + + [ord-mantell.birchwood.private] + address {{ ord_mantell_addr }} dest: /etc/munin/munin-conf.d/zzz-site.cfg notify: Restart Munin. diff --git a/roles_t/abbey-core/templates/nagios-ord-mantell.cfg b/roles_t/abbey-core/templates/nagios-ord-mantell.cfg new file mode 100644 index 0000000..bf3e7d8 --- /dev/null +++ b/roles_t/abbey-core/templates/nagios-ord-mantell.cfg @@ -0,0 +1,47 @@ +define host { + use linux-server + host_name ord-mantell + address {{ ord_mantell_addr }} +} + +define service { + use generic-service + host_name ord-mantell + service_description Root Partition + check_command check_nrpe!inst_root +} + +# define service { +# use generic-service +# host_name ord-mantell +# service_description Current Load +# check_command check_nrpe!check_load +# } + +define service { + use generic-service + host_name ord-mantell + service_description Zombie Processes + check_command check_nrpe!check_zombie_procs +} + +# define service { +# use generic-service +# host_name ord-mantell +# service_description Total Processes +# check_command check_nrpe!check_total_procs +# } + +define service { + use generic-service + host_name ord-mantell + service_description Swap Usage + check_command check_nrpe!inst_swap +} + +define service { + use generic-service + host_name ord-mantell + service_description Temperature Sensors + check_command check_nrpe!abbey_pisensors +}