/*****************************************************************************
*
* Nagios check_nagios plugin
*
* Copyright (c) 1999-2007 Nagios Plugins Development Team
*
* Last Modified: $Date$
*
* This file contains the check_nagios plugin
*
* This plugin checks the status of the Nagios process on the local machine.
* The plugin will check to make sure the Nagios status log is no older than
* the number of minutes specified by the expires option.
* It also checks the process table for a process matching the command
* argument.
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
*****************************************************************************/
/*
 * Plugin identity strings.  progname and revision are handed to
 * print_revision(); copyright and email fill in the COPYRIGHT banner
 * printed by the help screen; progname also appears in the usage line.
 */
const char *progname = "check_nagios";
const char *revision = "$Revision$";
const char *copyright = "1999-2007";
const char *email = "nagiosplug-devel@lists.sourceforge.net";
/* Forward declarations for the helpers defined later in this file. */
int process_arguments (int argc, char **argv);
void print_help (void);
void print_usage (void);

/*
 * Settings filled in by process_arguments() and read by main().
 */
char *status_log = NULL;      /* path of the status log (-F / --filename) */
char *process_string = NULL;  /* substring looked for in process arguments (-C / --command) */
int expire_minutes = 0;       /* maximum accepted age of the status log, in minutes (-e / --expires) */
58 main (int argc
, char **argv
)
60 int result
= STATE_UNKNOWN
;
61 char input_buffer
[MAX_INPUT_BUFFER
];
62 unsigned long latest_entry_time
= 0L;
63 unsigned long temp_entry_time
= 0L;
75 #ifdef PS_USES_PROCETIME
76 char procetime
[MAX_INPUT_BUFFER
];
77 #endif /* PS_USES_PROCETIME */
78 char procprog
[MAX_INPUT_BUFFER
];
81 int expected_cols
= PS_COLS
- 1;
82 const char *zombie
= "Z";
84 output chld_out
, chld_err
;
87 setlocale (LC_ALL
, "");
88 bindtextdomain (PACKAGE
, LOCALEDIR
);
91 if (process_arguments (argc
, argv
) == ERROR
)
92 usage_va(_("Could not parse arguments"));
94 /* Set signal handling and alarm timeout */
95 if (signal (SIGALRM
, timeout_alarm_handler
) == SIG_ERR
) {
96 usage_va(_("Cannot catch SIGALRM"));
99 /* handle timeouts gracefully... */
100 alarm (timeout_interval
);
102 /* open the status log */
103 fp
= fopen (status_log
, "r");
105 die (STATE_CRITICAL
, "NAGIOS %s: %s\n", _("CRITICAL"), _("Cannot open status log for reading!"));
108 /* get the date/time of the last item updated in the log */
109 while (fgets (input_buffer
, MAX_INPUT_BUFFER
- 1, fp
)) {
110 if ((temp_ptr
= strstr (input_buffer
, "created=")) != NULL
) {
111 temp_entry_time
= strtoul (temp_ptr
+ 8, NULL
, 10);
112 latest_entry_time
= temp_entry_time
;
114 } else if ((temp_ptr
= strtok (input_buffer
, "]")) != NULL
) {
115 temp_entry_time
= strtoul (temp_ptr
+ 1, NULL
, 10);
116 if (temp_entry_time
> latest_entry_time
)
117 latest_entry_time
= temp_entry_time
;
123 printf("command: %s\n", PS_COMMAND
);
125 /* run the command to check for the Nagios process.. */
126 if((result
= np_runcmd(PS_COMMAND
, &chld_out
, &chld_err
, 0)) != 0)
127 result
= STATE_WARNING
;
129 /* count the number of matching Nagios processes... */
130 for(i
= 0; i
< chld_out
.lines
; i
++) {
131 cols
= sscanf (chld_out
.line
[i
], PS_FORMAT
, PS_VARLIST
);
132 /* Zombie processes do not give a procprog command */
133 if ( cols
== (expected_cols
- 1) && strstr(procstat
, zombie
) ) {
134 cols
= expected_cols
;
135 /* Set some value for procargs for the strip command further below
136 * Seen to be a problem on some Solaris 7 and 8 systems */
137 chld_out
.line
[i
][pos
] = '\n';
138 chld_out
.line
[i
][pos
+1] = 0x0;
140 if ( cols
>= expected_cols
) {
141 asprintf (&procargs
, "%s", chld_out
.line
[i
] + pos
);
144 /* Some ps return full pathname for command. This removes path */
145 temp_string
= strtok ((char *)procprog
, "/");
146 while (temp_string
) {
147 strcpy(procprog
, temp_string
);
148 temp_string
= strtok (NULL
, "/");
151 /* May get empty procargs */
152 if (!strstr(procargs
, argv
[0]) && strstr(procargs
, process_string
) && strcmp(procargs
,"")) {
155 printf (_("Found process: %s %s\n"), procprog
, procargs
);
161 /* If we get anything on stderr, at least set warning */
163 result
= max_state (result
, STATE_WARNING
);
165 /* reset the alarm handler */
168 if (proc_entries
== 0) {
169 die (STATE_CRITICAL
, "NAGIOS %s: %s\n", _("CRITICAL"), _("Could not locate a running Nagios process!"));
172 if (latest_entry_time
== 0L) {
173 die (STATE_CRITICAL
, "NAGIOS %s: %s\n", _("CRITICAL"), _("Cannot parse Nagios log file for valid time"));
176 time (¤t_time
);
177 if ((int)(current_time
- latest_entry_time
) > (expire_minutes
* 60)) {
178 result
= STATE_WARNING
;
183 printf ("NAGIOS %s: ", (result
== STATE_OK
) ? _("OK") : _("WARNING"));
184 printf (ngettext ("%d process", "%d processes", proc_entries
), proc_entries
);
187 ngettext ("status log updated %d second ago",
188 "status log updated %d seconds ago",
189 (int) (current_time
- latest_entry_time
) ),
190 (int) (current_time
- latest_entry_time
) );
198 /* process command-line arguments */
200 process_arguments (int argc
, char **argv
)
205 static struct option longopts
[] = {
206 {"filename", required_argument
, 0, 'F'},
207 {"expires", required_argument
, 0, 'e'},
208 {"command", required_argument
, 0, 'C'},
209 {"version", no_argument
, 0, 'V'},
210 {"help", no_argument
, 0, 'h'},
211 {"verbose", no_argument
, 0, 'v'},
218 if (!is_option (argv
[1])) {
219 status_log
= argv
[1];
220 if (is_intnonneg (argv
[2]))
221 expire_minutes
= atoi (argv
[2]);
224 _("Expiration time must be an integer (seconds)\n"));
225 process_string
= argv
[3];
230 c
= getopt_long (argc
, argv
, "+hVvF:C:e:", longopts
, &option
);
232 if (c
== -1 || c
== EOF
|| c
== 1)
239 case 'V': /* version */
240 print_revision (progname
, revision
);
242 case 'F': /* status log */
245 case 'C': /* command */
246 process_string
= optarg
;
248 case 'e': /* expiry time */
249 if (is_intnonneg (optarg
))
250 expire_minutes
= atoi (optarg
);
253 _("Expiration time must be an integer (seconds)\n"));
258 default: /* print short usage_va statement if args not parsable */
264 if (status_log
== NULL
)
265 die (STATE_UNKNOWN
, _("You must provide the status_log\n"));
267 if (process_string
== NULL
)
268 die (STATE_UNKNOWN
, _("You must provide a process string\n"));
278 print_revision (progname
, revision
);
280 printf (_(COPYRIGHT
), copyright
, email
);
282 printf ("%s\n", _("This plugin checks the status of the Nagios process on the local machine"));
283 printf ("%s\n", _("The plugin will check to make sure the Nagios status log is no older than"));
284 printf ("%s\n", _("the number of minutes specified by the expires option."));
285 printf ("%s\n", _("It also checks the process table for a process matching the command argument."));
291 printf (_(UT_HELP_VRSN
));
293 printf (" %s\n", "-F, --filename=FILE");
294 printf (" %s\n", _("Name of the log file to check"));
295 printf (" %s\n", "-e, --expires=INTEGER");
296 printf (" %s\n", _("Minutes aging after which logfile is considered stale"));
297 printf (" %s\n", "-C, --command=STRING");
298 printf (" %s\n", _("Substring to search for in process arguments"));
299 printf (_(UT_VERBOSE
));
301 printf ("%s\n", _("Examples:"));
302 printf (" %s\n", "check_nagios -e 5 -F /usr/local/nagios/var/status.log -C /usr/local/nagios/bin/nagios");
303 printf (_(UT_SUPPORT
));
311 printf (_("Usage:"));
312 printf ("%s -F <status log file> -e <expire_minutes> -C <process_string>\n", progname
);