Nagios 3.1.1 eats cpu like mad

Marc Powell marc at ena.com
Sat Jul 18 00:40:13 CEST 2009


On Jul 15, 2009, at 2:10 PM, Hiren Patel wrote:

> Ricardo Maraschini wrote:
>> Hi,
>>
>> ----- "Ethan Galstad" <egalstad at nagios.org> escreveu:
>>> Patch is in CVS now.  Can someone who was experiencing scheduling
>>> problems with the 3.0.6 release test the latest 3.1.2 release?
>>
>> Just to let you know that the original scheduler bug remains there
>> on Nagios release 3.1.2, but now when something goes wrong with
>> service scheduling Nagios writes a log line saying:
>>
>> Warning: Check of service 'fake-test' on host 'localhost' could not  
>> be rescheduled properly.  Scheduling check for next week...
>>
>> We need to look more closely at the problem.
> could you provide a simple configuration that can be used to replicate
> the problem on 3.1.2? thanks.

Using -HEAD from a few days ago. I see this as well, but most of my  
checks are passive only. I use the old trick of enabling active checks  
but with check_period none to keep the GUI clean. It's happening for  
many (all?) of my passive checks. I'm just upgrading to -3x so I'm not  
sure it's really a problem per se, given that these are related to  
passive-only services, but at the least it's annoying... Here's an  
example, pulled from objects.cache on the host receiving the passive  
checks. I do not see the error on the actual polling machines.

--
Marc


[1247869976] Warning: Check of service '5 MIN CPU UTIL' on host 'eakin-es.davidson.tn.ena.net' could not be rescheduled properly.  Scheduling check for next week...
[1247870015] Warning: Check of service 'PING' on host 'eakin-es.davidson.tn.ena.net' could not be rescheduled properly.  Scheduling check for next week...

define host {
         host_name       eakin-es.davidson.tn.ena.net
         alias   Eakin Elementary - 2557
         address 172.31.35.124
         check_period    none
         contact_groups  tnops,stupid,86389,74350,87857,15386,66918,89727,71056,66875,15384,61345,85030,15443,60214,35512,59110,68542,56158,72073,87697,85424,48295,85956,80685,81285,15441,53052,48298,48299,78367,82123,79800,75220,15475,56022,82718,15387,62143,19519,53051,67449,52243,56980,67888,10656,86063,87457,79510,55494,56023,52963,80647,55508,56021,16330,63894
         notification_period     none
         initial_state   o
         check_interval  5.000000
         retry_interval  1.000000
         max_check_attempts      1
         active_checks_enabled   1
         passive_checks_enabled  1
         obsess_over_host        1
         event_handler_enabled   0
         low_flap_threshold      0.000000
         high_flap_threshold     0.000000
         flap_detection_enabled  1
         flap_detection_options  o,d,u
         freshness_threshold     0
         check_freshness 0
         notification_options    n
         notifications_enabled   1
         notification_interval   10080.000000
         first_notification_delay        0.000000
         stalking_options        n
         process_perf_data       0
         failure_prediction_enabled      1
         retain_status_information       1
         retain_nonstatus_information    1
         }

define service {
         host_name       eakin-es.davidson.tn.ena.net
         service_description     5 MIN CPU UTIL
         check_period    none
         check_command   check_cisco_cpu_5
         contact_groups  tnops,stupid,86389,74350,87857,15386,66918,89727,71056,66875,15384,61345,85030,15443,60214,35512,59110,68542,56158,72073,87697,85424,48295,85956,80685,81285,15441,53052,48298,48299,78367,82123,79800,75220,15475,56022,82718,15387,62143,19519,53051,67449,52243,56980,67888,10656,86063,87457,79510,55494,56023,52963,80647,55508,56021,16330,63894
         notification_period     24x7
         initial_state   o
         check_interval  5.000000
         retry_interval  3.000000
         max_check_attempts      3
         is_volatile     0
         parallelize_check       1
         active_checks_enabled   1
         passive_checks_enabled  1
         obsess_over_service     0
         event_handler_enabled   0
         low_flap_threshold      0.000000
         high_flap_threshold     0.000000
         flap_detection_enabled  1
         flap_detection_options  o,w,u,c
         freshness_threshold     0
         check_freshness 0
         notification_options    c,r
         notifications_enabled   1
         notification_interval   10080.000000
         first_notification_delay        0.000000
         stalking_options        n
         process_perf_data       0
         failure_prediction_enabled      1
         retain_status_information       1
         retain_nonstatus_information    1
         }

define service {
         host_name       eakin-es.davidson.tn.ena.net
         service_description     PING
         check_period    none
         check_command   check_ping
         contact_groups  tnops,stupid,86389,74350,87857,15386,66918,89727,71056,66875,15384,61345,85030,15443,60214,35512,59110,68542,56158,72073,87697,85424,48295,85956,80685,81285,15441,53052,48298,48299,78367,82123,79800,75220,15475,56022,82718,15387,62143,19519,53051,67449,52243,56980,67888,10656,86063,87457,79510,55494,56023,52963,80647,55508,56021,16330,63894
         notification_period     24x7
         initial_state   o
         check_interval  5.000000
         retry_interval  3.000000
         max_check_attempts      3
         is_volatile     0
         parallelize_check       1
         active_checks_enabled   1
         passive_checks_enabled  1
         obsess_over_service     0
         event_handler_enabled   0
         low_flap_threshold      0.000000
         high_flap_threshold     0.000000
         flap_detection_enabled  1
         flap_detection_options  o,w,u,c
         freshness_threshold     0
         check_freshness 0
         notification_options    c,r
         notifications_enabled   1
         notification_interval   10080.000000
         first_notification_delay        0.000000
         stalking_options        n
         process_perf_data       0
         failure_prediction_enabled      1
         retain_status_information       1
         retain_nonstatus_information    1
         }




------------------------------------------------------------------------------
Enter the BlackBerry Developer Challenge  
This is your chance to win up to $100,000 in prizes! For a limited time, 
vendors submitting new applications to BlackBerry App World(TM) will have
the opportunity to enter the BlackBerry Developer Challenge. See full prize  
details at: http://p.sf.net/sfu/Challenge




More information about the Developers mailing list