diff --git a/plugins/check_procs.c b/plugins/check_procs.c
index 5313b977e0e0760759775aac59b916ad6e318c8d..3f40e087c51ed6f4c92131deb62498a1d9d896f0 100644 (file)
--- a/plugins/check_procs.c
+++ b/plugins/check_procs.c
along with this program; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+ $Id$
+
******************************************************************************/
const char *progname = "check_procs";
const char *revision = "$Revision$";
-const char *copyright = "2000-2003";
+const char *copyright = "2000-2004";
const char *email = "nagiosplug-devel@lists.sourceforge.net";
#include "common.h"
#include "popen.h"
#include "utils.h"
+
#include <pwd.h>
int process_arguments (int, char **);
int validate_arguments (void);
int check_thresholds (int);
+int convert_to_seconds (char *);
void print_help (void);
void print_usage (void);
#define VSZ 64
#define RSS 128
#define PCPU 256
-
+#define ELAPSED 512
/* Different metrics */
char *metric_name;
enum metric {
METRIC_PROCS,
METRIC_VSZ,
METRIC_RSS,
- METRIC_CPU
+ METRIC_CPU,
+ METRIC_ELAPSED
};
enum metric metric = METRIC_PROCS;
-
-
-\f
int
main (int argc, char **argv)
{
- char input_buffer[MAX_INPUT_BUFFER];
+ char *input_buffer;
+ char *input_line;
+ char *procprog;
+ pid_t mypid = 0;
int procuid = 0;
+ int procpid = 0;
int procppid = 0;
int procvsz = 0;
int procrss = 0;
+ int procseconds = 0;
float procpcpu = 0;
char procstat[8];
- char procprog[MAX_INPUT_BUFFER];
+ char procetime[MAX_INPUT_BUFFER] = { '\0' };
char *procargs;
+#ifdef HAVE_BASENAME
+ char *temp_string;
+#endif
const char *zombie = "Z";
int procs = 0; /* counter for number of processes meeting filter criteria */
int pos; /* number of spaces before 'args' in `ps` output */
int cols; /* number of columns in ps output */
+ int expected_cols = PS_COLS - 1;
int warn = 0; /* number of processes in warn state */
int crit = 0; /* number of processes in crit state */
int i = 0;
-
int result = STATE_UNKNOWN;
+ setlocale (LC_ALL, "");
+ bindtextdomain (PACKAGE, LOCALEDIR);
+ textdomain (PACKAGE);
+
+ input_buffer = malloc (MAX_INPUT_BUFFER);
+ procprog = malloc (MAX_INPUT_BUFFER);
+
asprintf (&metric_name, "PROCS");
metric = METRIC_PROCS;
if (process_arguments (argc, argv) == ERROR)
- usage (_("Unable to parse command line\n"));
+ usage4 (_("Could not parse arguments"));
+
+ /* get our pid */
+ mypid = getpid();
+
+ /* Set signal handling and alarm timeout */
+ if (signal (SIGALRM, popen_timeout_alarm_handler) == SIG_ERR) {
+ usage4 (_("Cannot catch SIGALRM"));
+ }
+ alarm (timeout_interval);
if (verbose >= 2)
printf (_("CMD: %s\n"), PS_COMMAND);
if (child_stderr == NULL)
printf (_("Could not open stderr for %s\n"), PS_COMMAND);
+ /* flush first line */
fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process);
+ while ( input_buffer[strlen(input_buffer)-1] != '\n' )
+ fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process);
while (fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process)) {
+ asprintf (&input_line, "%s", input_buffer);
+ while ( input_buffer[strlen(input_buffer)-1] != '\n' ) {
+ fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_process);
+ asprintf (&input_line, "%s%s", input_line, input_buffer);
+ }
+
+ if (verbose >= 3)
+ printf ("%s", input_line);
+
strcpy (procprog, "");
asprintf (&procargs, "%s", "");
- cols = sscanf (input_buffer, PS_FORMAT, PS_VARLIST);
+ cols = sscanf (input_line, PS_FORMAT, PS_VARLIST);
/* Zombie processes do not give a procprog command */
- if ( cols == 6 && strstr(procstat, zombie) ) {
- cols = 7;
- /* Set some value for procargs for the strip command further below
- Seen to be a problem on some Solaris 7 and 8 systems */
- input_buffer[pos] = '\n';
- input_buffer[pos+1] = 0x0;
+ if ( cols == (expected_cols - 1) && strstr(procstat, zombie) ) {
+ cols = expected_cols;
}
- if ( cols >= 7 ) {
+ if ( cols >= expected_cols ) {
resultsum = 0;
- asprintf (&procargs, "%s", input_buffer + pos);
+ asprintf (&procargs, "%s", input_line + pos);
strip (procargs);
+ /* Some ps return full pathname for command. This removes path */
+#ifdef HAVE_BASENAME
+ temp_string = strdup(procprog);
+ procprog = basename(temp_string);
+#endif /* HAVE_BASENAME */
+
+ /* we need to convert the elapsed time to seconds */
+ procseconds = convert_to_seconds(procetime);
+
+ if (verbose >= 3)
+ printf ("%d %d %d %d %d %d %.2f %s %s %s %s\n",
+ procs, procuid, procvsz, procrss,
+ procpid, procppid, procpcpu, procstat,
+ procetime, procprog, procargs);
+
+ /* Ignore self */
+ if (mypid == procpid) continue;
+
if ((options & STAT) && (strstr (statopts, procstat)))
resultsum |= STAT;
if ((options & ARGS) && procargs && (strstr (procargs, args) != NULL))
if ((options & PCPU) && (procpcpu >= pcpu))
resultsum |= PCPU;
- if (verbose >= 3)
- printf ("%d %d %d %d %d %.2f %s %s %s\n",
- procs, procuid, procvsz, procrss,
- procppid, procpcpu, procstat, procprog, procargs);
-
- /* Ignore self */
- if (strcmp (procprog, progname) == 0)
- continue;
-
found++;
/* Next line if filters not matched */
/* TODO? float thresholds for --metric=CPU */
else if (metric == METRIC_CPU)
i = check_thresholds ((int)procpcpu);
+ else if (metric == METRIC_ELAPSED)
+ i = check_thresholds (procseconds);
if (metric != METRIC_PROCS) {
if (i == STATE_WARNING) {
warn++;
- asprintf (&fails, "%s%s%s", fails, (fails == "" ? "" : ", "), procprog);
+ asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog);
+ result = max_state (result, i);
}
if (i == STATE_CRITICAL) {
crit++;
- asprintf (&fails, "%s%s%s", fails, (fails == "" ? "" : ", "), procprog);
+ asprintf (&fails, "%s%s%s", fails, (strcmp(fails,"") ? ", " : ""), procprog);
+ result = max_state (result, i);
}
- result = max_state (result, i);
}
}
/* This should not happen */
/* If we get anything on STDERR, at least set warning */
while (fgets (input_buffer, MAX_INPUT_BUFFER - 1, child_stderr)) {
if (verbose)
- printf (_("STDERR: %s"), input_buffer);
+ printf ("STDERR: %s", input_buffer);
result = max_state (result, STATE_WARNING);
printf (_("System call sent warnings to stderr\n"));
}
}
if ( result == STATE_OK ) {
- printf (_("%s OK: %d process%s"),
- metric_name, procs, ( procs != 1 ? "es" : "") );
+ printf ("%s %s: ", metric_name, _("OK"));
} else if (result == STATE_WARNING) {
- if ( metric == METRIC_PROCS ) {
- printf (_("PROCS WARNING: %d process%s"), procs,
- ( procs != 1 ? "es" : ""));
- } else {
- printf (_("%s WARNING: %d warn out of %d process%s"),
- metric_name, warn, procs,
- ( procs != 1 ? "es" : ""));
+ printf ("%s %s: ", metric_name, _("WARNING"));
+ if ( metric != METRIC_PROCS ) {
+ printf (_("%d warn out of "), warn);
}
} else if (result == STATE_CRITICAL) {
- if (metric == METRIC_PROCS) {
- printf (_("PROCS CRITICAL: %d process%s"), procs,
- ( procs != 1 ? "es" : ""));
- } else {
- printf (_("%s CRITICAL: %d crit, %d warn out of %d process%s"),
- metric_name, crit, warn, procs,
- ( procs != 1 ? "es" : ""));
+ printf ("%s %s: ", metric_name, _("CRITICAL"));
+ if (metric != METRIC_PROCS) {
+ printf (_("%d crit, %d warn out of "), crit, warn);
}
}
+ printf (ngettext ("%d process", "%d processes", (unsigned long) procs), procs);
- if (fmt != "") {
- printf (" with %s", fmt);
+ if (strcmp(fmt,"") != 0) {
+ printf (_(" with %s"), fmt);
}
- if ( verbose >= 1 && fails != "" )
+ if ( verbose >= 1 && strcmp(fails,"") )
printf (" [%s]", fails);
printf ("\n");
-
-
-\f
/* process command-line arguments */
int
process_arguments (int argc, char **argv)
{"vsz", required_argument, 0, 'z'},
{"rss", required_argument, 0, 'r'},
{"pcpu", required_argument, 0, 'P'},
+ {"elapsed", required_argument, 0, 'e'},
{"argument-array", required_argument, 0, 'a'},
{"help", no_argument, 0, 'h'},
{"version", no_argument, 0, 'V'},
switch (c) {
case '?': /* help */
- print_usage ();
- exit (STATE_UNKNOWN);
+ usage2 (_("Unknown argument"), optarg);
case 'h': /* help */
print_help ();
exit (STATE_OK);
exit (STATE_OK);
case 't': /* timeout period */
if (!is_integer (optarg))
- usage (_("Timeout Interval must be an integer!\n\n"));
+ usage2 (_("Timeout interval must be a positive integer"), optarg);
else
timeout_interval = atoi (optarg);
break;
else if (sscanf (optarg, "%d:", &cmin) == 1)
break;
else
- usage (_("Critical Process Count must be an integer!\n\n"));
+ usage4 (_("Critical Process Count must be an integer!"));
break;
- case 'w': /* warning time threshold */
+ case 'w': /* warning threshold */
if (is_integer (optarg))
wmax = atoi (optarg);
else if (sscanf (optarg, ":%d", &wmax) == 1)
else if (sscanf (optarg, "%d:", &wmin) == 1)
break;
else
- usage (_("%s: Warning Process Count must be an integer!\n\n"));
+ usage4 (_("Warning Process Count must be an integer!"));
break;
case 'p': /* process id */
if (sscanf (optarg, "%d%[^0-9]", &ppid, tmp) == 1) {
- asprintf (&fmt, "%s%sPPID = %d", fmt, (options ? ", " : ""), ppid);
+ asprintf (&fmt, "%s%sPPID = %d", (fmt ? fmt : "") , (options ? ", " : ""), ppid);
options |= PPID;
break;
}
- printf (_("%s: Parent Process ID must be an integer!\n\n"),
- progname);
- print_usage ();
- exit (STATE_UNKNOWN);
+ usage4 (_("Parent Process ID must be an integer!"));
case 's': /* status */
if (statopts)
break;
else
statopts = optarg;
- asprintf (&fmt, _("%s%sSTATE = %s"), fmt, (options ? ", " : ""), statopts);
+ asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts);
options |= STAT;
break;
case 'u': /* user or user id */
uid = atoi (optarg);
pw = getpwuid ((uid_t) uid);
/* check to be sure user exists */
- if (pw == NULL) {
- printf (_("UID %d was not found\n"), uid);
- print_usage ();
- exit (STATE_UNKNOWN);
- }
+ if (pw == NULL)
+ usage2 (_("UID %s was not found"), optarg);
}
else {
pw = getpwnam (optarg);
/* check to be sure user exists */
- if (pw == NULL) {
- printf (_("User name %s was not found\n"), optarg);
- print_usage ();
- exit (STATE_UNKNOWN);
- }
+ if (pw == NULL)
+ usage2 (_("User name %s was not found"), optarg);
/* then get uid */
uid = pw->pw_uid;
}
user = pw->pw_name;
- asprintf (&fmt, _("%s%sUID = %d (%s)"), fmt, (options ? ", " : ""),
+ asprintf (&fmt, "%s%sUID = %d (%s)", (fmt ? fmt : ""), (options ? ", " : ""),
uid, user);
options |= USER;
break;
case 'C': /* command */
+ /* TODO: allow this to be passed in with --metric */
if (prog)
break;
else
prog = optarg;
- asprintf (&fmt, _("%s%scommand name '%s'"), fmt, (options ? ", " : ""),
+ asprintf (&fmt, _("%s%scommand name '%s'"), (fmt ? fmt : ""), (options ? ", " : ""),
prog);
options |= PROG;
break;
case 'a': /* args (full path name with args) */
+ /* TODO: allow this to be passed in with --metric */
if (args)
break;
else
args = optarg;
- asprintf (&fmt, _("%s%sargs '%s'"), fmt, (options ? ", " : ""), args);
+ asprintf (&fmt, "%s%sargs '%s'", (fmt ? fmt : ""), (options ? ", " : ""), args);
options |= ARGS;
break;
case 'r': /* RSS */
if (sscanf (optarg, "%d%[^0-9]", &rss, tmp) == 1) {
- asprintf (&fmt, _("%s%sRSS >= %d"), fmt, (options ? ", " : ""), rss);
+ asprintf (&fmt, "%s%sRSS >= %d", (fmt ? fmt : ""), (options ? ", " : ""), rss);
options |= RSS;
break;
}
- printf (_("%s: RSS must be an integer!\n\n"),
- progname);
- print_usage ();
- exit (STATE_UNKNOWN);
+ usage4 (_("RSS must be an integer!"));
case 'z': /* VSZ */
if (sscanf (optarg, "%d%[^0-9]", &vsz, tmp) == 1) {
- asprintf (&fmt, _("%s%sVSZ >= %d"), fmt, (options ? ", " : ""), vsz);
+ asprintf (&fmt, "%s%sVSZ >= %d", (fmt ? fmt : ""), (options ? ", " : ""), vsz);
options |= VSZ;
break;
}
- printf (_("%s: VSZ must be an integer!\n\n"),
- progname);
- print_usage ();
- exit (STATE_UNKNOWN);
+ usage4 (_("VSZ must be an integer!"));
case 'P': /* PCPU */
/* TODO: -P 1.5.5 is accepted */
if (sscanf (optarg, "%f%[^0-9.]", &pcpu, tmp) == 1) {
- asprintf (&fmt, _("%s%sPCPU >= %.2f"), fmt, (options ? ", " : ""), pcpu);
+ asprintf (&fmt, "%s%sPCPU >= %.2f", (fmt ? fmt : ""), (options ? ", " : ""), pcpu);
options |= PCPU;
break;
}
- printf (_("%s: PCPU must be a float!\n\n"),
- progname);
- print_usage ();
- exit (STATE_UNKNOWN);
+ usage4 (_("PCPU must be a float!"));
case 'm':
asprintf (&metric_name, "%s", optarg);
if ( strcmp(optarg, "PROCS") == 0) {
metric = METRIC_CPU;
break;
}
- printf (_("%s: metric must be one of PROCS, VSZ, RSS, CPU!\n\n"),
- progname);
- print_usage ();
- exit (STATE_UNKNOWN);
+ else if ( strcmp(optarg, "ELAPSED") == 0) {
+ metric = METRIC_ELAPSED;
+ break;
+ }
+
+ usage4 (_("Metric must be one of PROCS, VSZ, RSS, CPU, ELAPSED!"));
case 'v': /* command */
verbose++;
break;
cmax = atoi (argv[c++]);
if (statopts == NULL && argv[c]) {
asprintf (&statopts, "%s", argv[c++]);
- asprintf (&fmt, _("%s%sSTATE = %s"), fmt, (options ? ", " : ""), statopts);
+ asprintf (&fmt, _("%s%sSTATE = %s"), (fmt ? fmt : ""), (options ? ", " : ""), statopts);
options |= STAT;
}
-
int
validate_arguments ()
{
-
-
-\f
/* Check thresholds against value */
int
check_thresholds (int value)
}
+/* convert the elapsed time to seconds */
+int
+convert_to_seconds(char *etime) {
+
+ char *ptr;
+ int total;
+
+ int hyphcnt;
+ int coloncnt;
+ int days;
+ int hours;
+ int minutes;
+ int seconds;
+
+ hyphcnt = 0;
+ coloncnt = 0;
+ days = 0;
+ hours = 0;
+ minutes = 0;
+ seconds = 0;
+
+ for (ptr = etime; *ptr != '\0'; ptr++) {
+
+ if (*ptr == '-') {
+ hyphcnt++;
+ continue;
+ }
+ if (*ptr == ':') {
+ coloncnt++;
+ continue;
+ }
+ }
+
+ if (hyphcnt > 0) {
+ sscanf(etime, "%d-%d:%d:%d",
+ &days, &hours, &minutes, &seconds);
+ /* linux 2.6.5/2.6.6 reporting some processes with infinite
+ * elapsed times for some reason */
+ if (days == 49710) {
+ return 0;
+ }
+ } else {
+ if (coloncnt == 2) {
+ sscanf(etime, "%d:%d:%d",
+ &hours, &minutes, &seconds);
+ } else if (coloncnt == 1) {
+ sscanf(etime, "%d:%d",
+ &minutes, &seconds);
+ }
+ }
+
+ total = (days * 86400) +
+ (hours * 3600) +
+ (minutes * 60) +
+ seconds;
+ if (verbose >= 3 && metric == METRIC_ELAPSED) {
+ printf("seconds: %d\n", total);
+ }
+ return total;
+}
-\f
void
print_help (void)
{
print_revision (progname, revision);
- printf (_("Copyright (c) 1999 Ethan Galstad <nagios@nagios.org>"));
- printf (_(COPYRIGHT), copyright, email);
+ printf ("Copyright (c) 1999 Ethan Galstad <nagios@nagios.org>");
+ printf (COPYRIGHT, copyright, email);
printf(_("\
Checks all processes and generates WARNING or CRITICAL states if the specified\n\
Optional Arguments:\n\
-m, --metric=TYPE\n\
Check thresholds against metric. Valid types:\n\
- PROCS - number of processes (default)\n\
- VSZ - virtual memory size\n\
- RSS - resident set memory size\n\
- CPU - percentage cpu\n\
+ PROCS - number of processes (default)\n\
+ VSZ - virtual memory size\n\
+ RSS - resident set memory size\n\
+ CPU - percentage cpu\n"));
+/* only linux etime is support currently */
+#if defined( __linux__ )
+ printf(_("\
+ ELAPSED - time elapsed in seconds\n"));
+#endif /* defined(__linux__) */
+ printf (_(UT_TIMEOUT), DEFAULT_SOCKET_TIMEOUT);
+
+ printf(_("\
-v, --verbose\n\
Extra information. Up to 3 verbosity levels\n"));
-a, --argument-array=STRING\n\
Only scan for processes with args that contain STRING.\n\
-C, --command=COMMAND\n\
- Only scan for exact matches to the named COMMAND.\n"));
+ Only scan for exact matches of COMMAND (without path).\n"));
printf(_("\n\
RANGEs are specified 'min:max' or 'min:' or ':max' (or 'max'). If\n\
Warning alert if > 10 processes with command arguments containing \n\
'/usr/local/bin/perl' and owned by root\n\n\
check_procs -w 50000 -c 100000 --metric=VSZ\n\
- Alert if vsz of any processes over 50K or 100K\n\n"));
+ Alert if vsz of any processes over 50K or 100K\n\
+ check_procs -w 10 -c 20 --metric=CPU\n\
+ Alert if cpu of any processes over 10%% or 20%%\n\n"));
printf (_(UT_SUPPORT));
}
{
printf ("\
Usage: %s -w <range> -c <range> [-m metric] [-s state] [-p ppid]\n\
- [-u user] [-r rss] [-z vsz] [-P %%cpu] [-a argument-array]\n\
- [-C command] [-v]\n", progname);
- printf (_(UT_HLP_VRS), progname, progname);
+ [-u user] [-r rss] [-z vsz] [-P %%cpu] [-a argument-array]\n\
+ [-C command] [-t timeout] [-v]\n", progname);
}
-