X-Git-Url: https://git.tokkee.org/?a=blobdiff_plain;f=plugins%2Fcheck_procs.c;h=8655f6a31fab244a632f8a2d216cc9ecfda256e2;hb=884aee06674755ef44e4042803ae84a0faac5b10;hp=0b0a3c138f674d999b4e8774899e926a3fffd712;hpb=aa01859947d82ea8df23a9258fbbbb21dae7f76e;p=nagiosplug.git diff --git a/plugins/check_procs.c b/plugins/check_procs.c index 0b0a3c1..8655f6a 100644 --- a/plugins/check_procs.c +++ b/plugins/check_procs.c @@ -1,369 +1,407 @@ -/****************************************************************************** -* -* CHECK_PROCS.C -* -* Program: Process plugin for Nagios +/***************************************************************************** +* +* Nagios check_procs plugin +* * License: GPL -* Copyright (c) 1999 Ethan Galstad (nagios@nagios.org) -* -* $Id$ -* +* Copyright (c) 2000-2008 Nagios Plugins Development Team +* * Description: -* -* This plugin checks the number of currently running processes and -* generates WARNING or CRITICAL states if the process count is outside -* the specified threshold ranges. The process count can be filtered by -* process owner, parent process PID, current state (e.g., 'Z'), or may -* be the total number of running processes -* -* License Information: -* -* This program is free software; you can redistribute it and/or modify +* +* This file contains the check_procs plugin +* +* Checks all processes and generates WARNING or CRITICAL states if the +* specified metric is outside the required threshold ranges. The metric +* defaults to number of processes. Search filters can be applied to limit +* the processes to check. +* +* +* This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by -* the Free Software Foundation; either version 2 of the License, or +* the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. -* -* This program is distributed in the hope that it will be useful, but -* WITHOUT ANY WARRANTY; without even the implied warranty of -* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU -* General Public License for more details. -* +* +* This program is distributed in the hope that it will be useful, +* but WITHOUT ANY WARRANTY; without even the implied warranty of +* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +* GNU General Public License for more details. +* * You should have received a copy of the GNU General Public License -* along with this program; if not, write to the Free Software -* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. -* -******************************************************************************/ - -#define PROGNAME "check_snmp" -#define REVISION "$Revision$" -#define COPYRIGHT "1999-2002" -#define AUTHOR "Ethan Galstad" -#define EMAIL "nagios@nagios.org" -#define SUMMARY "Check the number of currently running processes and generates WARNING or\n\ -CRITICAL states if the process count is outside the specified threshold\n\ -ranges. The process count can be filtered by process owner, parent process\n\ -PID, current state (e.g., 'Z'), or may be the total number of running\n\ -processes\n" - -#include "config.h" -#include +* along with this program. If not, see . +* +* +*****************************************************************************/ + +const char *progname = "check_procs"; +const char *program_name = "check_procs"; /* Required for coreutils libs */ +const char *copyright = "2000-2008"; +const char *email = "nagiosplug-devel@lists.sourceforge.net"; + #include "common.h" -#include "popen.h" #include "utils.h" +#include "utils_cmd.h" +#include "regex.h" + +#include int process_arguments (int, char **); int validate_arguments (void); -void print_usage (void); +int check_thresholds (int); +int convert_to_seconds (char *); void print_help (void); +void print_usage (void); int wmax = -1; int cmax = -1; int wmin = -1; int cmin = -1; -int options = 0; +int options = 0; /* bitmask of filter criteria to test against */ #define ALL 1 #define STAT 2 #define PPID 4 #define USER 8 #define PROG 16 #define ARGS 32 - -int verbose = FALSE; +#define VSZ 64 +#define RSS 128 +#define PCPU 256 +#define ELAPSED 512 +#define EREG_ARGS 1024 +/* Different metrics */ +char *metric_name; +enum metric { + METRIC_PROCS, + METRIC_VSZ, + METRIC_RSS, + METRIC_CPU, + METRIC_ELAPSED +}; +enum metric metric = METRIC_PROCS; + +int verbose = 0; int uid; -int ppid; -char *statopts = NULL; -char *prog = NULL; -char *args = NULL; -char *fmt = NULL; +pid_t ppid; +int vsz; +int rss; +float pcpu; +char *statopts; +char *prog; +char *args; +char *input_filename = NULL; +regex_t re_args; +char *fmt; +char *fails; char tmp[MAX_INPUT_BUFFER]; +FILE *ps_input = NULL; + + int main (int argc, char **argv) { - char input_buffer[MAX_INPUT_BUFFER]; + char *input_buffer; + char *input_line; + char *procprog; + pid_t mypid = 0; int procuid = 0; - int procppid = 0; + pid_t procpid = 0; + pid_t procppid = 0; + int procvsz = 0; + int procrss = 0; + int procseconds = 0; + float procpcpu = 0; char procstat[8]; - char procprog[MAX_INPUT_BUFFER]; + char procetime[MAX_INPUT_BUFFER] = { '\0' }; char *procargs; - int resultsum = 0; - int found = 0; - int procs = 0; - int pos; - + const char *zombie = "Z"; + + int resultsum = 0; /* bitmask of the filter criteria met by a process */ + int found = 0; /* counter for number of lines returned in `ps` output */ + int procs = 0; /* counter for number of processes meeting filter criteria */ + int pos; /* number of spaces before 'args' in `ps` output */ + int cols; /* number of columns in ps output */ + int expected_cols = PS_COLS - 1; + int warn = 0; /* number of processes in warn state */ + int crit = 0; /* number of processes in crit state */ + int i = 0, j = 0; int result = STATE_UNKNOWN; + output chld_out, chld_err; - procargs = malloc (MAX_INPUT_BUFFER); + setlocale (LC_ALL, ""); + bindtextdomain (PACKAGE, LOCALEDIR); + textdomain (PACKAGE); + setlocale(LC_NUMERIC, "POSIX"); + + input_buffer = malloc (MAX_INPUT_BUFFER); + procprog = malloc (MAX_INPUT_BUFFER); + + asprintf (&metric_name, "PROCS"); + metric = METRIC_PROCS; + + /* Parse extra opts if any */ + argv=np_extra_opts (&argc, argv, progname); if (process_arguments (argc, argv) == ERROR) - usage ("Unable to parse command line\n"); - - /* run the command */ - if (verbose) - printf ("%s\n", PS_COMMAND); - child_process = spopen (PS_COMMAND); - if (child_process == NULL) { - printf ("Could not open pipe: %s\n", PS_COMMAND); - return STATE_UNKNOWN; + usage4 (_("Could not parse arguments")); + + /* get our pid */ + mypid = getpid(); + + /* Set signal handling and alarm timeout */ + if (signal (SIGALRM, timeout_alarm_handler) == SIG_ERR) { + die (STATE_UNKNOWN, _("Cannot catch SIGALRM")); } + (void) alarm ((unsigned) timeout_interval); - child_stderr = fdopen (child_stderr_array[fileno (child_process)], "r"); - if (child_stderr == NULL) - printf ("Could not open stderr for %s\n", PS_COMMAND); - - fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process); - - while (fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process)) { - if ( -#ifdef USE_PS_VARS - sscanf (input_buffer, PS_FORMAT, PS_VARLIST) >= 4 -#else - sscanf (input_buffer, PS_FORMAT, procstat, &procuid, &procppid, &pos, - procprog) >= 4 -#endif - ) { - found++; + if (verbose >= 2) + printf (_("CMD: %s\n"), PS_COMMAND); + + if (input_filename == NULL) { + result = cmd_run( PS_COMMAND, &chld_out, &chld_err, 0); + if (chld_err.lines > 0) { + printf ("%s: %s", _("System call sent warnings to stderr"), chld_err.line[0]); + exit(STATE_WARNING); + } + } else { + result = cmd_file_read( input_filename, &chld_out, 0); + } + + /* flush first line: j starts at 1 */ + for (j = 1; j < chld_out.lines; j++) { + input_line = chld_out.line[j]; + + if (verbose >= 3) + printf ("%s", input_line); + + strcpy (procprog, ""); + asprintf (&procargs, "%s", ""); + + cols = sscanf (input_line, PS_FORMAT, PS_VARLIST); + + /* Zombie processes do not give a procprog command */ + if ( cols < expected_cols && strstr(procstat, zombie) ) { + cols = expected_cols; + } + if ( cols >= expected_cols ) { resultsum = 0; - procargs = strcpy (procargs, &input_buffer[pos]); + asprintf (&procargs, "%s", input_line + pos); strip (procargs); + + /* Some ps return full pathname for command. This removes path */ + strcpy(procprog, base_name(procprog)); + + /* we need to convert the elapsed time to seconds */ + procseconds = convert_to_seconds(procetime); + + if (verbose >= 3) + printf ("proc#=%d uid=%d vsz=%d rss=%d pid=%d ppid=%d pcpu=%.2f stat=%s etime=%s prog=%s args=%s\n", + procs, procuid, procvsz, procrss, + procpid, procppid, procpcpu, procstat, + procetime, procprog, procargs); + + /* Ignore self */ + if (mypid == procpid) continue; + if ((options & STAT) && (strstr (statopts, procstat))) resultsum |= STAT; - if ((options & ARGS) && (strstr (procargs, args) == procargs)) + if ((options & ARGS) && procargs && (strstr (procargs, args) != NULL)) resultsum |= ARGS; - if ((options & PROG) && (strcmp (prog, procprog) == 0)) + if ((options & EREG_ARGS) && procargs && (regexec(&re_args, procargs, (size_t) 0, NULL, 0) == 0)) + resultsum |= EREG_ARGS; + if ((options & PROG) && procprog && (strcmp (prog, procprog) == 0)) resultsum |= PROG; if ((options & PPID) && (procppid == ppid)) resultsum |= PPID; if ((options & USER) && (procuid == uid)) resultsum |= USER; -#ifdef DEBUG1 - if (procargs == NULL) - printf ("%d %d %d %s %s\n", procs, procuid, procppid, procstat, - procprog); - else - printf ("%d %d %d %s %s %s\n", procs, procuid, procppid, procstat, - procprog, procargs); -#endif - if (options == resultsum) - procs++; - } - } + if ((options & VSZ) && (procvsz >= vsz)) + resultsum |= VSZ; + if ((options & RSS) && (procrss >= rss)) + resultsum |= RSS; + if ((options & PCPU) && (procpcpu >= pcpu)) + resultsum |= PCPU; - /* If we get anything on STDERR, at least set warning */ - while (fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_stderr)) { - if (verbose) - printf ("STDERR: %s", input_buffer); - /*Cannot use max() any more as STATE_UNKNOWN is gt STATE_CRITICAL - result = max (result, STATE_WARNING); */ - if ( !(result == STATE_CRITICAL) ) { - result = STATE_WARNING; - } - printf ("System call sent warnings to stderr\n"); - } - -/* if (result == STATE_UNKNOWN || result == STATE_WARNING) - printf ("System call sent warnings to stderr\n"); -*/ - (void) fclose (child_stderr); - - /* close the pipe */ - if (spclose (child_process)) { - printf ("System call returned nonzero status\n"); - if ( !(result == STATE_CRITICAL) ) { - return STATE_WARNING; - } - else { - return result ; + found++; + + /* Next line if filters not matched */ + if (!(options == resultsum || options == ALL)) + continue; + + procs++; + if (verbose >= 2) { + printf ("Matched: uid=%d vsz=%d rss=%d pid=%d ppid=%d pcpu=%.2f stat=%s etime=%s prog=%s args=%s\n", + procuid, procvsz, procrss, + procpid, procppid, procpcpu, procstat, + procetime, procprog, procargs); + } + + if (metric == METRIC_VSZ) + i = check_thresholds (procvsz); + else if (metric == METRIC_RSS) + i = check_thresholds (procrss); + /* TODO? float thresholds for --metric=CPU */ + else if (metric == METRIC_CPU) + i = check_thresholds ((int)procpcpu); + else if (metric == METRIC_ELAPSED) + i = check_thresholds (procseconds); + + if (metric != METRIC_PROCS) { + if (i == STATE_WARNING) { + warn++; + asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog); + result = max_state (result, i); + } + if (i == STATE_CRITICAL) { + crit++; + asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog); + result = max_state (result, i); + } + } + } + /* This should not happen */ + else if (verbose) { + printf(_("Not parseable: %s"), input_buffer); } } - if (options == ALL) - procs = found; - if (found == 0) { /* no process lines parsed so return STATE_UNKNOWN */ - printf ("Unable to read output\n"); - - return result; + printf (_("Unable to read output\n")); + return STATE_UNKNOWN; } - if (verbose && (options & STAT)) - printf ("%s ", statopts); - if (verbose && (options & PROG)) - printf ("%s ", prog); - if (verbose && (options & PPID)) - printf ("%d ", ppid); - if (verbose && (options & USER)) - printf ("%d ", uid); + if ( result == STATE_UNKNOWN ) + result = STATE_OK; - if (wmax == -1 && cmax == -1 && wmin == -1 && cmin == -1) { - if (result == STATE_UNKNOWN) - result = STATE_OK; - printf (fmt, "OK", procs); - return result; - } - else if (cmax >= 0 && cmin >= 0 && cmax < cmin) { - if (procs > cmax && procs < cmin) { - printf (fmt, "CRITICAL", procs); - return STATE_CRITICAL; - } - } - else if (cmax >= 0 && procs > cmax) { - printf (fmt, "CRITICAL", procs); - return STATE_CRITICAL; - } - else if (cmin >= 0 && procs < cmin) { - printf (fmt, "CRITICAL", procs); - return STATE_CRITICAL; + /* Needed if procs found, but none match filter */ + if ( metric == METRIC_PROCS ) { + result = max_state (result, check_thresholds (procs) ); } - if (wmax >= 0 && wmin >= 0 && wmax < wmin) { - if (procs > wmax && procs < wmin) { - printf (fmt, "CRITICAL", procs); - return STATE_CRITICAL; + if ( result == STATE_OK ) { + printf ("%s %s: ", metric_name, _("OK")); + } else if (result == STATE_WARNING) { + printf ("%s %s: ", metric_name, _("WARNING")); + if ( metric != METRIC_PROCS ) { + printf (_("%d warn out of "), warn); } - } - else if (wmax >= 0 && procs > wmax) { - printf (fmt, "WARNING", procs); - if ( !(result == STATE_CRITICAL) ) { - return STATE_WARNING; + } else if (result == STATE_CRITICAL) { + printf ("%s %s: ", metric_name, _("CRITICAL")); + if (metric != METRIC_PROCS) { + printf (_("%d crit, %d warn out of "), crit, warn); } - else { - return result ; - } - /*return max (result, STATE_WARNING); */ - } - else if (wmin >= 0 && procs < wmin) { - printf (fmt, "WARNING", procs); - if ( !(result == STATE_CRITICAL) ) { - return STATE_WARNING; - } - else { - return result ; - } - /*return max (result, STATE_WARNING); */ + } + printf (ngettext ("%d process", "%d processes", (unsigned long) procs), procs); + + if (strcmp(fmt,"") != 0) { + printf (_(" with %s"), fmt); } - printf (fmt, "OK", procs); - if ( result == STATE_UNKNOWN ) { - result = STATE_OK; - } + if ( verbose >= 1 && strcmp(fails,"") ) + printf (" [%s]", fails); + + printf ("\n"); return result; } + + /* process command-line arguments */ int process_arguments (int argc, char **argv) { - int c, i = 1; + int c = 1; char *user; struct passwd *pw; -#ifdef HAVE_GETOPT_H - int option_index = 0; - static struct option long_options[] = { + int option = 0; + int err; + int cflags = REG_NOSUB | REG_EXTENDED; + char errbuf[MAX_INPUT_BUFFER]; + static struct option longopts[] = { {"warning", required_argument, 0, 'w'}, {"critical", required_argument, 0, 'c'}, + {"metric", required_argument, 0, 'm'}, {"timeout", required_argument, 0, 't'}, {"status", required_argument, 0, 's'}, {"ppid", required_argument, 0, 'p'}, {"command", required_argument, 0, 'C'}, + {"vsz", required_argument, 0, 'z'}, + {"rss", required_argument, 0, 'r'}, + {"pcpu", required_argument, 0, 'P'}, + {"elapsed", required_argument, 0, 'e'}, {"argument-array", required_argument, 0, 'a'}, {"help", no_argument, 0, 'h'}, {"version", no_argument, 0, 'V'}, {"verbose", no_argument, 0, 'v'}, + {"ereg-argument-array", required_argument, 0, CHAR_MAX+1}, + {"input-file", required_argument, 0, CHAR_MAX+2}, {0, 0, 0, 0} }; -#endif - - asprintf (&fmt, ""); for (c = 1; c < argc; c++) if (strcmp ("-to", argv[c]) == 0) strcpy (argv[c], "-t"); while (1) { -#ifdef HAVE_GETOPT_H - c = getopt_long (argc, argv, "Vvht:c:w:p:s:u:C:a:", long_options, &option_index); -#else - c = getopt (argc, argv, "Vvht:c:w:p:s:u:C:a:"); -#endif + c = getopt_long (argc, argv, "Vvht:c:w:p:s:u:C:a:z:r:m:P:", + longopts, &option); + if (c == -1 || c == EOF) break; switch (c) { case '?': /* help */ - print_usage (); - exit (STATE_UNKNOWN); + usage5 (); case 'h': /* help */ print_help (); exit (STATE_OK); case 'V': /* version */ - print_revision (PROGNAME, REVISION); + print_revision (progname, NP_VERSION); exit (STATE_OK); case 't': /* timeout period */ - if (!is_integer (optarg)) { - printf ("%s: Timeout Interval must be an integer!\n\n", - my_basename (argv[0])); - print_usage (); - exit (STATE_UNKNOWN); - } - timeout_interval = atoi (optarg); + if (!is_integer (optarg)) + usage2 (_("Timeout interval must be a positive integer"), optarg); + else + timeout_interval = atoi (optarg); break; case 'c': /* critical threshold */ - if (is_integer (optarg)) { + if (is_integer (optarg)) cmax = atoi (optarg); + else if (sscanf (optarg, ":%d", &cmax) == 1) break; - } - else if (sscanf (optarg, ":%d", &cmax) == 1) { + else if (sscanf (optarg, "%d:%d", &cmin, &cmax) == 2) break; - } - else if (sscanf (optarg, "%d:%d", &cmin, &cmax) == 2) { + else if (sscanf (optarg, "%d:", &cmin) == 1) break; - } - else if (sscanf (optarg, "%d:", &cmin) == 1) { - break; - } - else { - printf ("%s: Critical Process Count must be an integer!\n\n", - my_basename (argv[0])); - print_usage (); - exit (STATE_UNKNOWN); - } - case 'w': /* warning time threshold */ - if (is_integer (optarg)) { + else + usage4 (_("Critical Process Count must be an integer!")); + break; + case 'w': /* warning threshold */ + if (is_integer (optarg)) wmax = atoi (optarg); + else if (sscanf (optarg, ":%d", &wmax) == 1) break; - } - else if (sscanf (optarg, ":%d", &wmax) == 1) { + else if (sscanf (optarg, "%d:%d", &wmin, &wmax) == 2) break; - } - else if (sscanf (optarg, "%d:%d", &wmin, &wmax) == 2) { + else if (sscanf (optarg, "%d:", &wmin) == 1) break; - } - else if (sscanf (optarg, "%d:", &wmin) == 1) { - break; - } - else { - printf ("%s: Warning Process Count must be an integer!\n\n", - my_basename (argv[0])); - print_usage (); - exit (STATE_UNKNOWN); - } + else + usage4 (_("Warning Process Count must be an integer!")); + break; case 'p': /* process id */ if (sscanf (optarg, "%d%[^0-9]", &ppid, tmp) == 1) { - asprintf (&fmt, "%s%sPPID = %d", (options ? ", " : ""), ppid); + asprintf (&fmt, "%s%sPPID = %d", (fmt ? fmt : "") , (options ? ", " : ""), ppid); options |= PPID; break; } - printf ("%s: Parent Process ID must be an integer!\n\n", - my_basename (argv[0])); - print_usage (); - exit (STATE_UNKNOWN); + usage4 (_("Parent Process ID must be an integer!")); case 's': /* status */ - asprintf (&statopts, "%s", optarg); - asprintf (&fmt, "%s%sSTATE = %s", fmt, (options ? ", " : ""), statopts); + if (statopts) + break; + else + statopts = optarg; + asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts); options |= STAT; break; case 'u': /* user or user id */ @@ -371,41 +409,101 @@ process_arguments (int argc, char **argv) uid = atoi (optarg); pw = getpwuid ((uid_t) uid); /* check to be sure user exists */ - if (pw == NULL) { - printf ("UID %d was not found\n", uid); - print_usage (); - exit (STATE_UNKNOWN); - } + if (pw == NULL) + usage2 (_("UID was not found"), optarg); } else { pw = getpwnam (optarg); /* check to be sure user exists */ - if (pw == NULL) { - printf ("User name %s was not found\n", optarg); - print_usage (); - exit (STATE_UNKNOWN); - } + if (pw == NULL) + usage2 (_("User name was not found"), optarg); /* then get uid */ uid = pw->pw_uid; } user = pw->pw_name; - asprintf (&fmt, "%s%sUID = %d (%s)", (options ? ", " : ""), fmt, + asprintf (&fmt, "%s%sUID = %d (%s)", (fmt ? fmt : ""), (options ? ", " : ""), uid, user); options |= USER; break; case 'C': /* command */ - asprintf (&prog, "%s", optarg); - asprintf (&fmt, "%s%scommand name %s", fmt, (options ? ", " : ""), + /* TODO: allow this to be passed in with --metric */ + if (prog) + break; + else + prog = optarg; + asprintf (&fmt, _("%s%scommand name '%s'"), (fmt ? fmt : ""), (options ? ", " : ""), prog); options |= PROG; break; case 'a': /* args (full path name with args) */ - asprintf (&args, "%s", optarg); - asprintf (&fmt, "%s%sargs %s", fmt, (options ? ", " : ""), args); + /* TODO: allow this to be passed in with --metric */ + if (args) + break; + else + args = optarg; + asprintf (&fmt, "%s%sargs '%s'", (fmt ? fmt : ""), (options ? ", " : ""), args); options |= ARGS; break; + case CHAR_MAX+1: + err = regcomp(&re_args, optarg, cflags); + if (err != 0) { + regerror (err, &re_args, errbuf, MAX_INPUT_BUFFER); + die (STATE_UNKNOWN, "PROCS %s: %s - %s\n", _("UNKNOWN"), _("Could not compile regular expression"), errbuf); + } + asprintf (&fmt, "%s%sregex args '%s'", (fmt ? fmt : ""), (options ? ", " : ""), optarg); + options |= EREG_ARGS; + break; + case 'r': /* RSS */ + if (sscanf (optarg, "%d%[^0-9]", &rss, tmp) == 1) { + asprintf (&fmt, "%s%sRSS >= %d", (fmt ? fmt : ""), (options ? ", " : ""), rss); + options |= RSS; + break; + } + usage4 (_("RSS must be an integer!")); + case 'z': /* VSZ */ + if (sscanf (optarg, "%d%[^0-9]", &vsz, tmp) == 1) { + asprintf (&fmt, "%s%sVSZ >= %d", (fmt ? fmt : ""), (options ? ", " : ""), vsz); + options |= VSZ; + break; + } + usage4 (_("VSZ must be an integer!")); + case 'P': /* PCPU */ + /* TODO: -P 1.5.5 is accepted */ + if (sscanf (optarg, "%f%[^0-9.]", &pcpu, tmp) == 1) { + asprintf (&fmt, "%s%sPCPU >= %.2f", (fmt ? fmt : ""), (options ? ", " : ""), pcpu); + options |= PCPU; + break; + } + usage4 (_("PCPU must be a float!")); + case 'm': + asprintf (&metric_name, "%s", optarg); + if ( strcmp(optarg, "PROCS") == 0) { + metric = METRIC_PROCS; + break; + } + else if ( strcmp(optarg, "VSZ") == 0) { + metric = METRIC_VSZ; + break; + } + else if ( strcmp(optarg, "RSS") == 0 ) { + metric = METRIC_RSS; + break; + } + else if ( strcmp(optarg, "CPU") == 0 ) { + metric = METRIC_CPU; + break; + } + else if ( strcmp(optarg, "ELAPSED") == 0) { + metric = METRIC_ELAPSED; + break; + } + + usage4 (_("Metric must be one of PROCS, VSZ, RSS, CPU, ELAPSED!")); case 'v': /* command */ - verbose = TRUE; + verbose++; + break; + case CHAR_MAX+2: + input_filename = optarg; break; } } @@ -417,7 +515,7 @@ process_arguments (int argc, char **argv) cmax = atoi (argv[c++]); if (statopts == NULL && argv[c]) { asprintf (&statopts, "%s", argv[c++]); - asprintf (&fmt, "%s%sSTATE = %s", fmt, (options ? ", " : ""), statopts); + asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts); options |= STAT; } @@ -425,21 +523,22 @@ process_arguments (int argc, char **argv) } + int validate_arguments () { -if (wmax >= 0 && wmin == -1) + if (wmax >= 0 && wmin == -1) wmin = 0; if (cmax >= 0 && cmin == -1) cmin = 0; if (wmax >= wmin && cmax >= cmin) { /* standard ranges */ if (wmax > cmax && cmax != -1) { - printf ("wmax (%d) cannot be greater than cmax (%d)\n", wmax, cmax); + printf (_("wmax (%d) cannot be greater than cmax (%d)\n"), wmax, cmax); return ERROR; } if (cmin > wmin && wmin != -1) { - printf ("wmin (%d) cannot be less than cmin (%d)\n", wmin, cmin); + printf (_("wmin (%d) cannot be less than cmin (%d)\n"), wmin, cmin); return ERROR; } } @@ -449,57 +548,217 @@ if (wmax >= 0 && wmin == -1) /* return ERROR; */ /* } */ - if (options == 0) { - options = 1; - asprintf (&fmt, "%%s - %%d processes running\n"); + if (options == 0) + options = ALL; + + if (statopts==NULL) + statopts = strdup(""); + + if (prog==NULL) + prog = strdup(""); + + if (args==NULL) + args = strdup(""); + + if (fmt==NULL) + fmt = strdup(""); + + if (fails==NULL) + fails = strdup(""); + + return options; +} + + + +/* Check thresholds against value */ +int +check_thresholds (int value) +{ + if (wmax == -1 && cmax == -1 && wmin == -1 && cmin == -1) { + return OK; + } + else if (cmax >= 0 && cmin >= 0 && cmax < cmin) { + if (value > cmax && value < cmin) + return STATE_CRITICAL; + } + else if (cmax >= 0 && value > cmax) { + return STATE_CRITICAL; } - else { - asprintf (&fmt, "%%s - %%d processes running with %s\n", fmt); + else if (cmin >= 0 && value < cmin) { + return STATE_CRITICAL; } - return options; + if (wmax >= 0 && wmin >= 0 && wmax < wmin) { + if (value > wmax && value < wmin) { + return STATE_WARNING; + } + } + else if (wmax >= 0 && value > wmax) { + return STATE_WARNING; + } + else if (wmin >= 0 && value < wmin) { + return STATE_WARNING; + } + return STATE_OK; +} + + +/* convert the elapsed time to seconds */ +int +convert_to_seconds(char *etime) { + + char *ptr; + int total; + + int hyphcnt; + int coloncnt; + int days; + int hours; + int minutes; + int seconds; + + hyphcnt = 0; + coloncnt = 0; + days = 0; + hours = 0; + minutes = 0; + seconds = 0; + + for (ptr = etime; *ptr != '\0'; ptr++) { + + if (*ptr == '-') { + hyphcnt++; + continue; + } + if (*ptr == ':') { + coloncnt++; + continue; + } + } + + if (hyphcnt > 0) { + sscanf(etime, "%d-%d:%d:%d", + &days, &hours, &minutes, &seconds); + /* linux 2.6.5/2.6.6 reporting some processes with infinite + * elapsed times for some reason */ + if (days == 49710) { + return 0; + } + } else { + if (coloncnt == 2) { + sscanf(etime, "%d:%d:%d", + &hours, &minutes, &seconds); + } else if (coloncnt == 1) { + sscanf(etime, "%d:%d", + &minutes, &seconds); + } + } + + total = (days * 86400) + + (hours * 3600) + + (minutes * 60) + + seconds; + + if (verbose >= 3 && metric == METRIC_ELAPSED) { + printf("seconds: %d\n", total); + } + return total; } void print_help (void) { - print_revision (PROGNAME, REVISION); - printf - ("Copyright (c) %s %s <%s>\n\n%s\n", - COPYRIGHT, AUTHOR, EMAIL, SUMMARY); + print_revision (progname, NP_VERSION); + + printf ("Copyright (c) 1999 Ethan Galstad \n"); + printf (COPYRIGHT, copyright, email); + + printf ("%s\n", _("Checks all processes and generates WARNING or CRITICAL states if the specified")); + printf ("%s\n", _("metric is outside the required threshold ranges. The metric defaults to number")); + printf ("%s\n", _("of processes. Search filters can be applied to limit the processes to check.")); + + printf ("\n\n"); + print_usage (); - printf - ("\nRequired Arguments:\n" - " -w, --warning=RANGE\n" - " generate warning state if process count is outside this range\n" - " -c, --critical=RANGE\n" - " generate critical state if process count is outside this range\n\n" - "Optional Filters:\n" - " -s, --state=STATUSFLAGS\n" - " Only scan for processes that have, in the output of `ps`, one or\n" - " more of the status flags you specify (for example R, Z, S, RS,\n" - " RSZDT, plus others based on the output of your 'ps' command).\n" - " -p, --ppid=PPID\n" - " Only scan for children of the parent process ID indicated.\n" - " -u, --user=USER\n" - " Only scan for proceses with user name or ID indicated.\n" - " -a, --argument-array=STRING\n" - " Only scan for ARGS that match up to the length of the given STRING\n" - " -C, --command=COMMAND\n" - " Only scan for exact matches to the named COMMAND.\n\n" - "RANGEs are specified 'min:max' or 'min:' or ':max' (or 'max'). If\n" - "specified 'max:min', a warning status will be generated if the\n" - - "count is inside the specified range\n");} + printf (UT_HELP_VRSN); + printf (UT_EXTRA_OPTS); + printf (" %s\n", "-w, --warning=RANGE"); + printf (" %s\n", _("Generate warning state if metric is outside this range")); + printf (" %s\n", "-c, --critical=RANGE"); + printf (" %s\n", _("Generate critical state if metric is outside this range")); + printf (" %s\n", "-m, --metric=TYPE"); + printf (" %s\n", _("Check thresholds against metric. Valid types:")); + printf (" %s\n", _("PROCS - number of processes (default)")); + printf (" %s\n", _("VSZ - virtual memory size")); + printf (" %s\n", _("RSS - resident set memory size")); + printf (" %s\n", _("CPU - percentage CPU")); +/* only linux etime is support currently */ +#if defined( __linux__ ) + printf (" %s\n", _("ELAPSED - time elapsed in seconds")); +#endif /* defined(__linux__) */ + printf (UT_TIMEOUT, DEFAULT_SOCKET_TIMEOUT); + + printf (" %s\n", "-v, --verbose"); + printf (" %s\n", _("Extra information. Up to 3 verbosity levels")); + + printf ("\n"); + printf ("%s\n", "Filters:"); + printf (" %s\n", "-s, --state=STATUSFLAGS"); + printf (" %s\n", _("Only scan for processes that have, in the output of `ps`, one or")); + printf (" %s\n", _("more of the status flags you specify (for example R, Z, S, RS,")); + printf (" %s\n", _("RSZDT, plus others based on the output of your 'ps' command).")); + printf (" %s\n", "-p, --ppid=PPID"); + printf (" %s\n", _("Only scan for children of the parent process ID indicated.")); + printf (" %s\n", "-z, --vsz=VSZ"); + printf (" %s\n", _("Only scan for processes with VSZ higher than indicated.")); + printf (" %s\n", "-r, --rss=RSS"); + printf (" %s\n", _("Only scan for processes with RSS higher than indicated.")); + printf (" %s\n", "-P, --pcpu=PCPU"); + printf (" %s\n", _("Only scan for processes with PCPU higher than indicated.")); + printf (" %s\n", "-u, --user=USER"); + printf (" %s\n", _("Only scan for processes with user name or ID indicated.")); + printf (" %s\n", "-a, --argument-array=STRING"); + printf (" %s\n", _("Only scan for processes with args that contain STRING.")); + printf (" %s\n", "--ereg-argument-array=STRING"); + printf (" %s\n", _("Only scan for processes with args that contain the regex STRING.")); + printf (" %s\n", "-C, --command=COMMAND"); + printf (" %s\n", _("Only scan for exact matches of COMMAND (without path).")); + + printf(_("\n\ +RANGEs are specified 'min:max' or 'min:' or ':max' (or 'max'). If\n\ +specified 'max:min', a warning status will be generated if the\n\ +count is inside the specified range\n\n")); + + printf(_("\ +This plugin checks the number of currently running processes and\n\ +generates WARNING or CRITICAL states if the process count is outside\n\ +the specified threshold ranges. The process count can be filtered by\n\ +process owner, parent process PID, current state (e.g., 'Z'), or may\n\ +be the total number of running processes\n\n")); + + printf ("%s\n", _("Examples:")); + printf (" %s\n", "check_procs -w 2:2 -c 2:1024 -C portsentry"); + printf (" %s\n", _("Warning if not two processes with command name portsentry.")); + printf (" %s\n\n", _("Critical if < 2 or > 1024 processes")); + printf (" %s\n", "check_procs -w 10 -a '/usr/local/bin/perl' -u root"); + printf (" %s\n", _("Warning alert if > 10 processes with command arguments containing")); + printf (" %s\n\n", _("'/usr/local/bin/perl' and owned by root")); + printf (" %s\n", "check_procs -w 50000 -c 100000 --metric=VSZ"); + printf (" %s\n\n", _("Alert if VSZ of any processes over 50K or 100K")); + printf (" %s\n", "check_procs -w 10 -c 20 --metric=CPU"); + printf (" %s\n", _("Alert if CPU of any processes over 10%% or 20%%")); + + printf (UT_SUPPORT); +} void print_usage (void) { - printf - ("Usage:\n" - " check_procs -w -c [-s state] [-p ppid] [-u user]\n" - " [-a argument-array] [-C command]\n" - " check_procs --version\n" " check_procs --help\n"); + printf (_("Usage: ")); + printf ("%s -w -c [-m metric] [-s state] [-p ppid]\n", progname); + printf (" [-u user] [-r rss] [-z vsz] [-P %%cpu] [-a argument-array]\n"); + printf (" [-C command] [-t timeout] [-v]\n"); }