Hosts randomly disappearing

Thomas Donnelly tad1214 at aol.com
Mon Dec 8 21:39:30 CET 2008


Hello All,

I have about 115 hosts in my Nagios pool and I recently added a group of 
7 UPSs. I made my own check using check_snmp to check the load 
percentage. Funny thing is, sometimes they show up in the host detail 
and sometimes they do not. Refreshing a few times will get them to 
show, then another refresh usually causes them to disappear. Opening one 
of the hosts usually results in the message: "Error: Host Status 
Information Not Found!" A few refreshes get the host state to become 
viewable. I find this behavior only with the 7 hosts I just added. The 
config file is:

#cat ups.cfg

# UPS1 - host object for the rack 1 UPS (192.168.96.8).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r1.hou.example.com
        alias                           UPS Rack 1
        address                         192.168.96.8
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r1: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r1.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r1. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r1.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r1. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r1.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS2 - host object for the rack 2 UPS (192.168.96.9).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r2.hou.example.com
        alias                           UPS Rack 2
        address                         192.168.96.9
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r2: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r2.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r2. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r2.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r2. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r2.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS3 - host object for the rack 3 UPS (192.168.96.10).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r3.hou.example.com
        alias                           UPS Rack 3
        address                         192.168.96.10
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r3: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r3.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r3. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r3.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r3. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r3.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS5 - host object for the rack 5 UPS (192.168.96.12).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r5.hou.example.com
        alias                           UPS Rack 5
        address                         192.168.96.12
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r5: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r5.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r5. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r5.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r5. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r5.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS6 - host object for the rack 6 UPS (192.168.96.13).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r6.hou.example.com
        alias                           UPS Rack 6
        address                         192.168.96.13
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r6: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r6.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r6. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r6.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r6. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r6.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS7 - host object for the rack 7 UPS (192.168.96.11).
# Directives are grouped as: identity/topology, host check, notifications,
# performance-data and retention flags.
define host{
        host_name                       ups-r7.hou.example.com
        alias                           UPS Rack 7
        address                         192.168.96.11
        parents                         co1.hou.example.com
        check_command                   check-host-alive
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            d,r
        process_perf_data               1
        retain_status_information       1
        retain_nonstatus_information    0
}
# Extended host info for ups-r7: sets the icon_image and statusmap_image
# used for this host.
define hostextinfo{
        host_name                       ups-r7.hou.example.com
        statusmap_image                 www.gd2
        icon_image                      www.jpg
}


# Ping service for ups-r7. check_ping is called with the arguments
# "140,25%" and "180,50%" (presumably warning and critical thresholds; the
# check_ping command definition is not part of this file - confirm there).
define service{
        service_description             check_ping
        host_name                       ups-r7.hou.example.com
        check_command                   check_ping!140,25%!180,50%
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

# UPS load service for ups-r7. The custom check_ups_load command is called
# with the arguments 84 and 89 (presumably warning and critical load
# percentages; the command definition is not shown here - confirm there).
define service{
        service_description             check_ups_load
        host_name                       ups-r7.hou.example.com
        check_command                   check_ups_load!84!89
        check_period                    24x7
        normal_check_interval           5
        retry_check_interval            3
        max_check_attempts              10
        contact_groups                  web-admins
        notification_period             24x7
        notification_interval           30
        notification_options            w,c,r
}

Any and all help is greatly appreciated!

Thanks!!!
-=Tom


------------------------------------------------------------------------------
SF.Net email is Sponsored by MIX09, March 18-20, 2009 in Las Vegas, Nevada.
The future of the web can't happen without you.  Join us at MIX09 to help
pave the way to the Next Web now. Learn more and register at
http://ad.doubleclick.net/clk;208669438;13503038;i?http://2009.visitmix.com/
_______________________________________________
Nagios-users mailing list
Nagios-users at lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/nagios-users
::: Please include Nagios version, plugin version (-v) and OS when reporting any issue. 
::: Messages without supporting info will risk being sent to /dev/null





More information about the Users mailing list