#check_by_ssh check_disk on lxg0447 (special command because of a path to check_disk on lxg0447)
define command {
command_name check_disk_by_ssh_lxg0447
- command_line /usr/local/nagios/libexec/check_by_ssh -H $HOSTADDRESS$ -C "/misc/hadaq/nagios/nagios-plugins-1.4.5/plugins/check_disk -w $ARG1$ -c $ARG2$ -p $ARG3$"
+ command_line /usr/local/nagios/libexec/check_by_ssh -H $HOSTADDRESS$ -C "/misc/hadaq/nagios/plugins/check_disk -w $ARG1$ -c $ARG2$ -p $ARG3$"
}
#check_by_ssh check_disk on lxg0451 (special command because of a path to check_disk on lxg0451)
define command {
command_name check_disk_by_ssh_lxg0451
- command_line /usr/local/nagios/libexec/check_by_ssh -H $HOSTADDRESS$ -C "/misc/hadaq/nagios/nagios-plugins-1.4.5/plugins/check_disk -w $ARG1$ -c $ARG2$ -p $ARG3$"
+ command_line /usr/local/nagios/libexec/check_by_ssh -H $HOSTADDRESS$ -C "/misc/hadaq/nagios/plugins/check_disk -w $ARG1$ -c $ARG2$ -p $ARG3$"
}
#check_by_ssh check_disk
define hostgroup{
hostgroup_name hadeb-group
alias EB Servers
-# contact_groups <edit-this> ; This needs to be the same value as the value located in service.cfg file. Nagios 2.5 produces an error if you define this.
- members hadeb01,hadeb03,hadeb04,hadeb05,hadeb06a,hadeb07,lxhadesdaq
+# contact_groups <edit-this>
+ members hadeb01,hadeb04,hadeb05,hadeb06a,hadeb07,lxhadesdaq
}
-# lxg-hosts group definition
+#--- lxg-hosts group (in the experimental area, counting house)
define hostgroup{
hostgroup_name lxg-group
alias lxg hosts
-# contact_groups <edit-this> ; This needs to be the same value as the value located in service.cfg file. Nagios 2.5 produces an error if you define this.
- members lxg0447,lxg0411,lxg0451,lxg0434,lxg0440,lxg0441,lxg0442,lxg0443,lxg0444,lxg0430,lxg0438,lxg0449,lxg0450
+# contact_groups <edit-this>
+ members lxg0430,lxg0434,lxg0438,lxg0440,lxg0441,lxg0442,lxg0443,lxg0444,lxg0447,lxg0449,lxg0450,lxg0451,lxg0452
}
-# hades-hosts group definition
+#--- desktop group: personal desktop PCs (host aliases "desktop PC (<user>)")
+#    Picked up by the common PING and SSH services through hostgroup_name.
+#    NOTE(review): lxg0452 is also a member of lxg-group and its host alias is
+#    "RPC PC", not "desktop PC (...)" -- confirm it really belongs in this group.
+define hostgroup{
+ hostgroup_name desktop-group
+ alias lxg desktop hosts
+# contact_groups <edit-this>
+ members lxg0429,lxg0433,lxg0435,lxg0437,lxg0439,lxg0445,lxg0446,lxg0448,lxg0452,lxg0453,lxg0454,lxg0455
+ }
+
+#--- night-queue hosts group
+#    Hosts that receive the LUSTRE mount check (the LUSTRE service is attached
+#    via hostgroup_name nightqueue-group). The lustre-group servicegroup lists
+#    the same hosts one by one, so keep both member lists in sync.
+define hostgroup{
+ hostgroup_name nightqueue-group
+ alias night-queue hosts
+# contact_groups <edit-this>
+ members lxg0429,lxg0433,lxg0435,lxg0437,lxg0439,lxg0440,lxg0441,lxg0442,lxg0443,lxg0444,lxg0445,lxg0446,lxg0447,lxg0448,lxg0452,lxg0453,lxg0454,lxg0455
+ }
+
+#--- hades-hosts group
define hostgroup{
hostgroup_name hades-group
alias hades hosts
-# contact_groups <edit-this> ; This needs to be the same value as the value located in service.cfg file. Nagios 2.5 produces an error if you define this.
+# contact_groups <edit-this>
members hades25,hades17,hades27
}
define hostgroup{
hostgroup_name scs-group
alias scs hosts
-# contact_groups <edit-this> ; This needs to be the same value as the value located in service.cfg file. Nagios 2.5 produces an error if you define this.
+# contact_groups <edit-this>
members hadsc1
}
register 1
}
-# hadeb03 host definition
-define host{
- name hadeb03
- use hadeb-host ; Name of host template to use
- host_name hadeb03
- alias backup server
- address 140.181.97.118
- register 1
- }
-
# hadeb04 host definition
define host{
name hadeb04
register 1
}
-#lxg0411
-define host{
- name lxg0411
- use lxg-host ; Name of host template to use
- host_name lxg0411
- alias QA Server (Go4)
- address 140.181.74.222
- register 1
- }
-
-#lxg0447
+#lxg0429
define host{
- name lxg0447
+ name lxg0429
use lxg-host ; Name of host template to use
- host_name lxg0447
- alias QA RAM-Disk
- address 140.181.92.234
+ host_name lxg0429
+ alias desktop PC (A.Sadovsky)
+ address 140.181.115.110
register 1
}
register 1
}
+#lxg0433: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0433
+ use lxg-host ; Name of host template to use
+ host_name lxg0433
+ alias desktop PC (M.Sudol)
+ address 140.181.84.30
+ register 1
+ }
+
#lxg0434
define host{
name lxg0434
register 1
}
+#lxg0435: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0435
+ use lxg-host ; Name of host template to use
+ host_name lxg0435
+ alias desktop PC (K.Teilab)
+ address 140.181.69.119
+ register 1
+ }
+
+#lxg0437: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0437
+ use lxg-host ; Name of host template to use
+ host_name lxg0437
+ alias desktop PC (R.Holzmann)
+ address 140.181.84.38
+ register 1
+ }
+
#lxg0438
define host{
name lxg0438
register 1
}
+#lxg0439: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0439
+ use lxg-host ; Name of host template to use
+ host_name lxg0439
+ alias desktop PC (A.Schmah)
+ address 140.181.67.194
+ register 1
+ }
#lxg0440
define host{
name lxg0440
use lxg-host ; Name of host template to use
host_name lxg0440
- alias RICH acc PC
+ alias RICH PC
address 140.181.92.220
register 1
}
name lxg0441
use lxg-host ; Name of host template to use
host_name lxg0441
- alias MDC acc PC
+ alias MDC PC
address 140.181.92.222
register 1
}
name lxg0442
use lxg-host ; Name of host template to use
host_name lxg0442
- alias Start/Veto/Trigger acc PC
+ alias Start/Veto/Trigger PC
address 140.181.92.224
register 1
}
name lxg0443
use lxg-host ; Name of host template to use
host_name lxg0443
- alias TOF/TOFino acc PC
+ alias TOF/TOFino PC
address 140.181.92.226
register 1
}
name lxg0444
use lxg-host ; Name of host template to use
host_name lxg0444
- alias Shower acc PC
+ alias Shower PC
address 140.181.92.228
register 1
}
+#lxg0445: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0445
+ use lxg-host ; Name of host template to use
+ host_name lxg0445
+ alias desktop PC (I.Koenig)
+ address 140.181.85.49
+ register 1
+ }
+
+#lxg0446: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0446
+ use lxg-host ; Name of host template to use
+ host_name lxg0446
+ alias desktop PC (T.Galatyuk)
+ address 140.181.92.232
+ register 1
+ }
+
+#lxg0447: QA RAM-Disk host; listed in hostgroups lxg-group and nightqueue-group.
+#         The dedicated command check_disk_by_ssh_lxg0447 exists for this host.
+define host{
+ name lxg0447
+ use lxg-host ; Name of host template to use
+ host_name lxg0447
+ alias QA RAM-Disk
+ address 140.181.92.234
+ register 1
+ }
+
+#lxg0448: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0448
+ use lxg-host ; Name of host template to use
+ host_name lxg0448
+ alias desktop PC (Y.Pachmayer)
+ address 140.181.92.236
+ register 1
+ }
+
#lxg0449
define host{
name lxg0449
register 1
}
+#lxg0452: RPC PC; listed in hostgroups lxg-group, desktop-group and nightqueue-group.
+#         NOTE(review): the alias is "RPC PC", yet the host is also in
+#         desktop-group -- confirm that membership is intended.
+define host{
+ name lxg0452
+ use lxg-host ; Name of host template to use
+ host_name lxg0452
+ alias RPC PC
+ address 140.181.106.208
+ register 1
+ }
+
+#lxg0453: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0453
+ use lxg-host ; Name of host template to use
+ host_name lxg0453
+ alias desktop PC (J.Markert)
+ address 140.181.86.57
+ register 1
+ }
+
+#lxg0454: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0454
+ use lxg-host ; Name of host template to use
+ host_name lxg0454
+ alias desktop PC (A.Rustamov)
+ address 140.181.106.214
+ register 1
+ }
+
+#lxg0455: desktop PC; listed in hostgroups desktop-group and nightqueue-group
+define host{
+ name lxg0455
+ use lxg-host ; Name of host template to use
+ host_name lxg0455
+ alias desktop PC (M.Lorenz)
+ address 140.181.112.116
+ register 1
+ }
+
#hades25
define host{
name hades25
-# SOUND SERVER service group
+#--- SOUND SERVER service group
define servicegroup{
servicegroup_name soundserver-group
alias SOUND SERVER
members hadesdaq,SOUND_SERVER,lxhadesdaq,SOUND_SERVER,hadc08,SOUND_SERVER;
}
-# HARD DISK TEST service group
+#--- HARD DISK TEST service group
define servicegroup{
servicegroup_name harddisk-group
alias DISK TEST
members hadesdaq,DISK TEST,hadesdaq,RAID1,hadeb07,DISK_AB TEST,hadeb07,DISK_CD TEST,hades17,DISK TEST,hades17,RAID1,hades25,DISK TEST,hades25,RAID1,hades27,DISK TEST,hades27,RAID1;
}
+#--- Lustre mount: groups the LUSTRE service of every night-queue host
+#    members is a flat list of host,service_description pairs; the hosts
+#    match the members of hostgroup nightqueue-group, so keep both in sync.
+define servicegroup{
+ servicegroup_name lustre-group
+ alias Lustre mount
+ members lxg0429,LUSTRE,lxg0433,LUSTRE,lxg0435,LUSTRE,lxg0437,LUSTRE,lxg0439,LUSTRE,lxg0440,LUSTRE,lxg0441,LUSTRE,lxg0442,LUSTRE,lxg0443,LUSTRE,lxg0444,LUSTRE,lxg0445,LUSTRE,lxg0446,LUSTRE,lxg0447,LUSTRE,lxg0448,LUSTRE,lxg0452,LUSTRE,lxg0453,LUSTRE,lxg0454,LUSTRE,lxg0455,LUSTRE;
+ }
+
# online QA/DST service group
#define servicegroup{
# servicegroup_name onlinedst-group
# alias online QA/DST
-# members lxg0411,updateQA,lxg0411,updateDST,lxg0430,runPairDST,lxg0440,runPairDST,lxg0441,runPairDST,lxg0442,runPairDST,lxg0443,runPairDST,lxg0444,runPairDST,lxg0451,runQA,lxg0452,runPairDST;
+# members lxg0411,updateQA,lxg0430,runPairDST,lxg0440,runPairDST,lxg0441,runPairDST,lxg0442,runPairDST,lxg0443,runPairDST,lxg0444,runPairDST,lxg0451,runQA,lxg0452,runPairDST;
# }
\ No newline at end of file
hostgroups *
register 0
- }
+ }
+
+# LUSTRE-SERVICE template for lxg hosts (register 0: not instantiated itself;
+# the LUSTRE service pulls it in with "use lustre-service-lxg").
+# NOTE(review): normal_check_interval and notification_interval are counted in
+# interval_length units (60 s unless overridden), so 600 would mean 10 hours --
+# confirm that is intended.
+define service{
+ use generic-service
+ name lustre-service-lxg
+ is_volatile 0
+ check_period 24x7
+ max_check_attempts 3
+ normal_check_interval 600
+ retry_check_interval 1
+ contact_groups linux-admins
+ notification_interval 600
+ notification_period 24x7
+ notification_options c,r
+ hostgroups *
+
+ register 0
+ }
# PING
define service{
}
############# COMMON SERVICES FOR LXG04**
-# PING
+#--- PING
define service{
use ping-service-lxg ; Name of service template to use
- hostgroup_name lxg-group,hades-group
+ hostgroup_name lxg-group,desktop-group,hades-group
# host_name *
service_description PING
check_command check_ping!100.0,20%!500.0,60%
}
-# SSH
+#--- SSH
define service{
use ssh-service-lxg
# host_name *
- hostgroup_name lxg-group,hades-group
+ hostgroup_name lxg-group,desktop-group,hades-group
service_description SSH
check_command check_ssh!2
}
+#--- Lustre mount check, applied to every host in nightqueue-group
+#    service_description LUSTRE is the name referenced by the lustre-group
+#    servicegroup members list.
+#    NOTE(review): check_proc_status is defined outside this excerpt; the
+#    meaning of its arguments (50502, check_lustre) should be confirmed there.
+define service{
+ use lustre-service-lxg
+# host_name *
+ hostgroup_name nightqueue-group
+ service_description LUSTRE
+ check_command check_proc_status!50502!check_lustre!
+}
+
####################### hadesdaq ##########################
# local raid
define service{
# check_command check_disk_by_ssh!20%!10%!/var!
# }
-####################### hadeb03 ###########################
-# remote disk check
-define service{
- use generic-service
- host_name hadeb03
- service_description /D/HADEB03
- is_volatile 0
- check_period 24x7
- max_check_attempts 3
- normal_check_interval 60
- retry_check_interval 1
- contact_groups linux-admins
- notification_interval 120
- notification_period 24x7
- notification_options c,r
- check_command check_disk_by_ssh!20%!10%!/d/hadeb03!
- }
-
-# remote disk check
-define service{
- use generic-service
- host_name hadeb03
- service_description /D/HADEB03B
- is_volatile 0
- check_period 24x7
- max_check_attempts 3
- normal_check_interval 60
- retry_check_interval 1
- contact_groups linux-admins
- notification_interval 120
- notification_period 24x7
- notification_options c,r
- check_command check_disk_by_ssh!20%!10%!/d/hadeb03b!
- }
-
-# remote raid check
-define service{
- use generic-service
- host_name hadeb03
- service_description RAID1
- is_volatile 0
- check_period 24x7
- max_check_attempts 3
- normal_check_interval 60
- retry_check_interval 1
- contact_groups linux-admins
- notification_interval 120
- notification_period 24x7
- notification_options c,r
- check_command check_raid_by_ssh
- }
-
####################### hadeb04 ###########################
# remote disk check
define service{