Hosts randomly disappearing
Thomas Donnelly
tad1214 at aol.com
Mon Dec 8 21:39:30 CET 2008
Hello All,
I have about 115 hosts in my Nagios pool, and I recently added a group of
7 UPSs. I wrote my own check, using check_snmp, to monitor the load
percentage. The funny thing is, sometimes they show up in the host detail
and sometimes they do not. Refreshing a few times will get them to
show, then another refresh usually causes them to disappear. Opening one
of the hosts usually results in the message: "Error: Host Status
Information Not Found!" A few more refreshes get the host state to become
viewable. I see this behavior only with the 7 hosts I just added. The
config file is:
#cat ups.cfg
#UPS1
define host{
host_name ups-r1.hou.example.com
alias UPS Rack 1
address 192.168.96.8
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r1.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r1.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r1.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
#UPS2
define host{
host_name ups-r2.hou.example.com
alias UPS Rack 2
address 192.168.96.9
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r2.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r2.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r2.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
#UPS3
define host{
host_name ups-r3.hou.example.com
alias UPS Rack 3
address 192.168.96.10
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r3.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r3.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r3.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
#UPS5
define host{
host_name ups-r5.hou.example.com
alias UPS Rack 5
address 192.168.96.12
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r5.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r5.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r5.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
#UPS6
define host{
host_name ups-r6.hou.example.com
alias UPS Rack 6
address 192.168.96.13
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r6.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r6.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r6.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
#UPS7
define host{
host_name ups-r7.hou.example.com
alias UPS Rack 7
address 192.168.96.11
check_command check-host-alive
max_check_attempts 10
process_perf_data 1
retain_status_information 1
retain_nonstatus_information 0
contact_groups web-admins
notification_options d,r
notification_interval 30
notification_period 24x7
parents co1.hou.example.com
}
define hostextinfo{
host_name ups-r7.hou.example.com
icon_image www.jpg
statusmap_image www.gd2
}
define service{
host_name ups-r7.hou.example.com
service_description check_ping
check_command check_ping!140,25%!180,50%
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
define service{
host_name ups-r7.hou.example.com
service_description check_ups_load
check_command check_ups_load!84!89
max_check_attempts 10
normal_check_interval 5
retry_check_interval 3
check_period 24x7
notification_interval 30
notification_period 24x7
notification_options w,c,r
contact_groups web-admins
}
Any and all help is greatly appreciated!
Thanks!!!
-=Tom
------------------------------------------------------------------------------
SF.Net email is Sponsored by MIX09, March 18-20, 2009 in Las Vegas, Nevada.
The future of the web can't happen without you. Join us at MIX09 to help
pave the way to the Next Web now. Learn more and register at
http://ad.doubleclick.net/clk;208669438;13503038;i?http://2009.visitmix.com/
_______________________________________________
Nagios-users mailing list
Nagios-users at lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/nagios-users
::: Please include Nagios version, plugin version (-v) and OS when reporting any issue.
::: Messages without supporting info will risk being sent to /dev/null
More information about the Users
mailing list