X-Git-Url: https://git.tokkee.org/?a=blobdiff_plain;f=plugins%2Fcheck_procs.c;h=5742b72799545cfd583841f9a07ffc1d96753b58;hb=5e3fc41c6143676cf01b7aad789fc5f2cae5ce84;hp=5313b977e0e0760759775aac59b916ad6e318c8d;hpb=f4f92be60c94fd4e0dd4b2b4b3101543eedb706a;p=nagiosplug.git diff --git a/plugins/check_procs.c b/plugins/check_procs.c index 5313b97..5742b72 100644 --- a/plugins/check_procs.c +++ b/plugins/check_procs.c @@ -14,21 +14,25 @@ along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + $Id$ + ******************************************************************************/ const char *progname = "check_procs"; const char *revision = "$Revision$"; -const char *copyright = "2000-2003"; +const char *copyright = "2000-2004"; const char *email = "nagiosplug-devel@lists.sourceforge.net"; #include "common.h" #include "popen.h" #include "utils.h" + #include int process_arguments (int, char **); int validate_arguments (void); int check_thresholds (int); +int convert_to_seconds (char *); void print_help (void); void print_usage (void); @@ -47,14 +51,15 @@ int options = 0; /* bitmask of filter criteria to test against */ #define VSZ 64 #define RSS 128 #define PCPU 256 - +#define ELAPSED 512 /* Different metrics */ char *metric_name; enum metric { METRIC_PROCS, METRIC_VSZ, METRIC_RSS, - METRIC_CPU + METRIC_CPU, + METRIC_ELAPSED }; enum metric metric = METRIC_PROCS; @@ -73,22 +78,23 @@ char tmp[MAX_INPUT_BUFFER]; - - - int main (int argc, char **argv) { - char input_buffer[MAX_INPUT_BUFFER]; + char *input_buffer; + char *input_line; + char *procprog; int procuid = 0; int procppid = 0; int procvsz = 0; int procrss = 0; + int procseconds = 0; float procpcpu = 0; char procstat[8]; - char procprog[MAX_INPUT_BUFFER]; + char procetime[MAX_INPUT_BUFFER]; char *procargs; + char *temp_string; const char *zombie = "Z"; @@ -97,17 +103,31 @@ main (int argc, char **argv) int procs = 0; /* counter for number of processes meeting filter criteria */ int pos; /* number of spaces before 'args' in `ps` output */ int cols; /* number of columns in ps output */ + int expected_cols = PS_COLS - 1; int warn = 0; /* number of processes in warn state */ int crit = 0; /* number of processes in crit state */ int i = 0; int result = STATE_UNKNOWN; + setlocale (LC_ALL, ""); + bindtextdomain (PACKAGE, LOCALEDIR); + textdomain (PACKAGE); + + input_buffer = malloc (MAX_INPUT_BUFFER); + procprog = malloc (MAX_INPUT_BUFFER); + asprintf (&metric_name, "PROCS"); metric = METRIC_PROCS; - if (process_arguments (argc, argv) == ERROR) - usage (_("Unable to parse command line\n")); + if (process_arguments (argc, argv) != TRUE) + usage4 (_("Could not parse arguments")); + + /* Set signal handling and alarm timeout */ + if (signal (SIGALRM, popen_timeout_alarm_handler) == SIG_ERR) { + usage4 (_("Cannot catch SIGALRM")); + } + alarm (timeout_interval); if (verbose >= 2) printf (_("CMD: %s\n"), PS_COMMAND); @@ -122,27 +142,56 @@ main (int argc, char **argv) if (child_stderr == NULL) printf (_("Could not open stderr for %s\n"), PS_COMMAND); + /* flush first line */ fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process); + while ( input_buffer[strlen(input_buffer)-1] != '\n' ) + fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process); while (fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process)) { + asprintf (&input_line, "%s", input_buffer); + while ( input_buffer[strlen(input_buffer)-1] != '\n' ) { + fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process); + asprintf (&input_line, "%s%s", input_line, input_buffer); + } + + if (verbose >= 3) + printf ("%s", input_line); + strcpy (procprog, ""); asprintf (&procargs, "%s", ""); - cols = sscanf (input_buffer, PS_FORMAT, PS_VARLIST); + cols = sscanf (input_line, PS_FORMAT, PS_VARLIST); /* Zombie processes do not give a procprog command */ - if ( cols == 6 && strstr(procstat, zombie) ) { - cols = 7; - /* Set some value for procargs for the strip command further below - Seen to be a problem on some Solaris 7 and 8 systems */ - input_buffer[pos] = '\n'; - input_buffer[pos+1] = 0x0; + if ( cols == (expected_cols - 1) && strstr(procstat, zombie) ) { + cols = expected_cols; } - if ( cols >= 7 ) { + if ( cols >= expected_cols ) { resultsum = 0; - asprintf (&procargs, "%s", input_buffer + pos); + asprintf (&procargs, "%s", input_line + pos); strip (procargs); + /* Some ps return full pathname for command. This removes path */ + temp_string = strtok ((char *)procprog, "/"); + while (temp_string) { + strcpy(procprog, temp_string); + temp_string = strtok (NULL, "/"); + } + + /* we need to convert the elapsed time to seconds */ + procseconds = convert_to_seconds(procetime); + + if (verbose >= 3) + printf ("%d %d %d %d %d %.2f %s %s %s %s\n", + procs, procuid, procvsz, procrss, + procppid, procpcpu, procstat, + procetime, procprog, procargs); + + /* Ignore self */ + if (strcmp (procprog, progname) == 0) { + continue; + } + if ((options & STAT) && (strstr (statopts, procstat))) resultsum |= STAT; if ((options & ARGS) && procargs && (strstr (procargs, args) != NULL)) @@ -160,15 +209,6 @@ main (int argc, char **argv) if ((options & PCPU) && (procpcpu >= pcpu)) resultsum |= PCPU; - if (verbose >= 3) - printf ("%d %d %d %d %d %.2f %s %s %s\n", - procs, procuid, procvsz, procrss, - procppid, procpcpu, procstat, procprog, procargs); - - /* Ignore self */ - if (strcmp (procprog, progname) == 0) - continue; - found++; /* Next line if filters not matched */ @@ -184,17 +224,20 @@ main (int argc, char **argv) /* TODO? float thresholds for --metric=CPU */ else if (metric == METRIC_CPU) i = check_thresholds ((int)procpcpu); + else if (metric == METRIC_ELAPSED) + i = check_thresholds (procseconds); if (metric != METRIC_PROCS) { if (i == STATE_WARNING) { warn++; - asprintf (&fails, "%s%s%s", fails, (fails == "" ? "" : ", "), procprog); + asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog); + result = max_state (result, i); } if (i == STATE_CRITICAL) { crit++; - asprintf (&fails, "%s%s%s", fails, (fails == "" ? "" : ", "), procprog); + asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog); + result = max_state (result, i); } - result = max_state (result, i); } } /* This should not happen */ @@ -233,33 +276,25 @@ main (int argc, char **argv) } if ( result == STATE_OK ) { - printf (_("%s OK: %d process%s"), - metric_name, procs, ( procs != 1 ? "es" : "") ); + printf ("%s %s: ", metric_name, _("OK")); } else if (result == STATE_WARNING) { - if ( metric == METRIC_PROCS ) { - printf (_("PROCS WARNING: %d process%s"), procs, - ( procs != 1 ? "es" : "")); - } else { - printf (_("%s WARNING: %d warn out of %d process%s"), - metric_name, warn, procs, - ( procs != 1 ? "es" : "")); + printf ("%s %s: ", metric_name, _("WARNING")); + if ( metric != METRIC_PROCS ) { + printf (_("%d warn out of "), warn); } } else if (result == STATE_CRITICAL) { - if (metric == METRIC_PROCS) { - printf (_("PROCS CRITICAL: %d process%s"), procs, - ( procs != 1 ? "es" : "")); - } else { - printf (_("%s CRITICAL: %d crit, %d warn out of %d process%s"), - metric_name, crit, warn, procs, - ( procs != 1 ? "es" : "")); + printf ("%s %s: ", metric_name, _("CRITICAL")); + if (metric != METRIC_PROCS) { + printf (_("%d crit, %d warn out of "), crit, warn); } } + printf ("%d %s", procs, procs == 1 ? _("process") : _("processes")); - if (fmt != "") { - printf (" with %s", fmt); + if (strcmp(fmt,"") != 0) { + printf (_(" with %s"), fmt); } - if ( verbose >= 1 && fails != "" ) + if ( verbose >= 1 && strcmp(fails,"") ) printf (" [%s]", fails); printf ("\n"); @@ -268,9 +303,6 @@ main (int argc, char **argv) - - - /* process command-line arguments */ int process_arguments (int argc, char **argv) @@ -290,6 +322,7 @@ process_arguments (int argc, char **argv) {"vsz", required_argument, 0, 'z'}, {"rss", required_argument, 0, 'r'}, {"pcpu", required_argument, 0, 'P'}, + {"elapsed", required_argument, 0, 'e'}, {"argument-array", required_argument, 0, 'a'}, {"help", no_argument, 0, 'h'}, {"version", no_argument, 0, 'V'}, @@ -310,6 +343,7 @@ process_arguments (int argc, char **argv) switch (c) { case '?': /* help */ + printf (_("%s: Unknown argument: %s\n\n"), progname, optarg); print_usage (); exit (STATE_UNKNOWN); case 'h': /* help */ @@ -320,7 +354,7 @@ process_arguments (int argc, char **argv) exit (STATE_OK); case 't': /* timeout period */ if (!is_integer (optarg)) - usage (_("Timeout Interval must be an integer!\n\n")); + usage2 (_("Timeout interval must be a positive integer"), optarg); else timeout_interval = atoi (optarg); break; @@ -336,7 +370,7 @@ process_arguments (int argc, char **argv) else usage (_("Critical Process Count must be an integer!\n\n")); break; - case 'w': /* warning time threshold */ + case 'w': /* warning threshold */ if (is_integer (optarg)) wmax = atoi (optarg); else if (sscanf (optarg, ":%d", &wmax) == 1) @@ -346,24 +380,21 @@ process_arguments (int argc, char **argv) else if (sscanf (optarg, "%d:", &wmin) == 1) break; else - usage (_("%s: Warning Process Count must be an integer!\n\n")); + usage (_("Warning Process Count must be an integer!\n\n")); break; case 'p': /* process id */ if (sscanf (optarg, "%d%[^0-9]", &ppid, tmp) == 1) { - asprintf (&fmt, "%s%sPPID = %d", fmt, (options ? ", " : ""), ppid); + asprintf (&fmt, "%s%sPPID = %d", (fmt ? fmt : "") , (options ? ", " : ""), ppid); options |= PPID; break; } - printf (_("%s: Parent Process ID must be an integer!\n\n"), - progname); - print_usage (); - exit (STATE_UNKNOWN); + usage2 (_("%s: Parent Process ID must be an integer!\n\n"), progname); case 's': /* status */ if (statopts) break; else statopts = optarg; - asprintf (&fmt, _("%s%sSTATE = %s"), fmt, (options ? ", " : ""), statopts); + asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts); options |= STAT; break; case 'u': /* user or user id */ @@ -371,76 +402,63 @@ process_arguments (int argc, char **argv) uid = atoi (optarg); pw = getpwuid ((uid_t) uid); /* check to be sure user exists */ - if (pw == NULL) { - printf (_("UID %d was not found\n"), uid); - print_usage (); - exit (STATE_UNKNOWN); - } + if (pw == NULL) + usage2 (_("UID %s was not found\n"), optarg); } else { pw = getpwnam (optarg); /* check to be sure user exists */ - if (pw == NULL) { - printf (_("User name %s was not found\n"), optarg); - print_usage (); - exit (STATE_UNKNOWN); - } + if (pw == NULL) + usage2 (_("User name %s was not found\n"), optarg); /* then get uid */ uid = pw->pw_uid; } user = pw->pw_name; - asprintf (&fmt, _("%s%sUID = %d (%s)"), fmt, (options ? ", " : ""), + asprintf (&fmt, _("%s%sUID = %d (%s)"), (fmt ? fmt : ""), (options ? ", " : ""), uid, user); options |= USER; break; case 'C': /* command */ + /* TODO: allow this to be passed in with --metric */ if (prog) break; else prog = optarg; - asprintf (&fmt, _("%s%scommand name '%s'"), fmt, (options ? ", " : ""), + asprintf (&fmt, _("%s%scommand name '%s'"), (fmt ? fmt : ""), (options ? ", " : ""), prog); options |= PROG; break; case 'a': /* args (full path name with args) */ + /* TODO: allow this to be passed in with --metric */ if (args) break; else args = optarg; - asprintf (&fmt, _("%s%sargs '%s'"), fmt, (options ? ", " : ""), args); + asprintf (&fmt, _("%s%sargs '%s'"), (fmt ? fmt : ""), (options ? ", " : ""), args); options |= ARGS; break; case 'r': /* RSS */ if (sscanf (optarg, "%d%[^0-9]", &rss, tmp) == 1) { - asprintf (&fmt, _("%s%sRSS >= %d"), fmt, (options ? ", " : ""), rss); + asprintf (&fmt, _("%s%sRSS >= %d"), (fmt ? fmt : ""), (options ? ", " : ""), rss); options |= RSS; break; } - printf (_("%s: RSS must be an integer!\n\n"), - progname); - print_usage (); - exit (STATE_UNKNOWN); + usage2 (_("%s: RSS must be an integer!\n\n"), progname); case 'z': /* VSZ */ if (sscanf (optarg, "%d%[^0-9]", &vsz, tmp) == 1) { - asprintf (&fmt, _("%s%sVSZ >= %d"), fmt, (options ? ", " : ""), vsz); + asprintf (&fmt, _("%s%sVSZ >= %d"), (fmt ? fmt : ""), (options ? ", " : ""), vsz); options |= VSZ; break; } - printf (_("%s: VSZ must be an integer!\n\n"), - progname); - print_usage (); - exit (STATE_UNKNOWN); + usage2 (_("%s: VSZ must be an integer!\n\n"), progname); case 'P': /* PCPU */ /* TODO: -P 1.5.5 is accepted */ if (sscanf (optarg, "%f%[^0-9.]", &pcpu, tmp) == 1) { - asprintf (&fmt, _("%s%sPCPU >= %.2f"), fmt, (options ? ", " : ""), pcpu); + asprintf (&fmt, _("%s%sPCPU >= %.2f"), (fmt ? fmt : ""), (options ? ", " : ""), pcpu); options |= PCPU; break; } - printf (_("%s: PCPU must be a float!\n\n"), - progname); - print_usage (); - exit (STATE_UNKNOWN); + usage2 (_("%s: PCPU must be a float!\n\n"), progname); case 'm': asprintf (&metric_name, "%s", optarg); if ( strcmp(optarg, "PROCS") == 0) { @@ -459,7 +477,12 @@ process_arguments (int argc, char **argv) metric = METRIC_CPU; break; } - printf (_("%s: metric must be one of PROCS, VSZ, RSS, CPU!\n\n"), + else if ( strcmp(optarg, "ELAPSED") == 0) { + metric = METRIC_ELAPSED; + break; + } + + printf (_("%s: metric must be one of PROCS, VSZ, RSS, CPU, ELAPSED!\n\n"), progname); print_usage (); exit (STATE_UNKNOWN); @@ -476,7 +499,7 @@ process_arguments (int argc, char **argv) cmax = atoi (argv[c++]); if (statopts == NULL && argv[c]) { asprintf (&statopts, "%s", argv[c++]); - asprintf (&fmt, _("%s%sSTATE = %s"), fmt, (options ? ", " : ""), statopts); + asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts); options |= STAT; } @@ -485,7 +508,6 @@ process_arguments (int argc, char **argv) - int validate_arguments () { @@ -533,9 +555,6 @@ validate_arguments () - - - /* Check thresholds against value */ int check_thresholds (int value) @@ -571,15 +590,77 @@ check_thresholds (int value) +/* convert the elapsed time to seconds */ +int +convert_to_seconds(char *etime) { + + char *ptr; + int total; + + int hyphcnt; + int coloncnt; + int days; + int hours; + int minutes; + int seconds; + + hyphcnt = 0; + coloncnt = 0; + days = 0; + hours = 0; + minutes = 0; + seconds = 0; + + for (ptr = etime; *ptr != '\0'; ptr++) { + + if (*ptr == '-') { + hyphcnt++; + continue; + } + if (*ptr == ':') { + coloncnt++; + continue; + } + } + + if (hyphcnt > 0) { + sscanf(etime, "%d-%d:%d:%d", + &days, &hours, &minutes, &seconds); + /* linux 2.6.5/2.6.6 reporting some processes with infinite + * elapsed times for some reason */ + if (days == 49710) { + return 0; + } + } else { + if (coloncnt == 2) { + sscanf(etime, "%d:%d:%d", + &hours, &minutes, &seconds); + } else if (coloncnt == 1) { + sscanf(etime, "%d:%d", + &minutes, &seconds); + } + } + + total = (days * 86400) + + (hours * 3600) + + (minutes * 60) + + seconds; + + if (verbose >= 3) { + printf("seconds: %d\n", total); + } + return total; +} + + - void print_help (void) { print_revision (progname, revision); - printf (_("Copyright (c) 1999 Ethan Galstad ")); - printf (_(COPYRIGHT), copyright, email); + printf ("Copyright (c) 1999 Ethan Galstad "); + printf (COPYRIGHT, copyright, email); printf(_("\ Checks all processes and generates WARNING or CRITICAL states if the specified\n\ @@ -599,10 +680,18 @@ Required Arguments:\n\ Optional Arguments:\n\ -m, --metric=TYPE\n\ Check thresholds against metric. Valid types:\n\ - PROCS - number of processes (default)\n\ - VSZ - virtual memory size\n\ - RSS - resident set memory size\n\ - CPU - percentage cpu\n\ + PROCS - number of processes (default)\n\ + VSZ - virtual memory size\n\ + RSS - resident set memory size\n\ + CPU - percentage cpu\n")); +/* only linux etime is support currently */ +#if defined( __linux__ ) + printf(_("\ + ELAPSED - time elapsed in seconds\n")); +#endif /* defined(__linux__) */ + printf (_(UT_TIMEOUT), DEFAULT_SOCKET_TIMEOUT); + + printf(_("\ -v, --verbose\n\ Extra information. Up to 3 verbosity levels\n")); @@ -627,7 +716,7 @@ Optional Filters:\n\ -a, --argument-array=STRING\n\ Only scan for processes with args that contain STRING.\n\ -C, --command=COMMAND\n\ - Only scan for exact matches to the named COMMAND.\n")); + Only scan for exact matches of COMMAND (without path).\n")); printf(_("\n\ RANGEs are specified 'min:max' or 'min:' or ':max' (or 'max'). If\n\ @@ -650,7 +739,9 @@ Examples:\n\ Warning alert if > 10 processes with command arguments containing \n\ '/usr/local/bin/perl' and owned by root\n\n\ check_procs -w 50000 -c 100000 --metric=VSZ\n\ - Alert if vsz of any processes over 50K or 100K\n\n")); + Alert if vsz of any processes over 50K or 100K\n\ + check_procs -w 10 -c 20 --metric=CPU\n\ + Alert if cpu of any processes over 10%% or 20%%\n\n")); printf (_(UT_SUPPORT)); } @@ -660,8 +751,6 @@ print_usage (void) { printf ("\ Usage: %s -w -c [-m metric] [-s state] [-p ppid]\n\ - [-u user] [-r rss] [-z vsz] [-P %%cpu] [-a argument-array]\n\ - [-C command] [-v]\n", progname); - printf (_(UT_HLP_VRS), progname, progname); + [-u user] [-r rss] [-z vsz] [-P %%cpu] [-a argument-array]\n\ + [-C command] [-t timeout] [-v]\n", progname); } -