aboutsummaryrefslogtreecommitdiff
path: root/plugins/check_overcr.c
diff options
context:
space:
mode:
Diffstat (limited to 'plugins/check_overcr.c')
-rw-r--r--plugins/check_overcr.c489
1 files changed, 489 insertions, 0 deletions
diff --git a/plugins/check_overcr.c b/plugins/check_overcr.c
new file mode 100644
index 00000000..305a8242
--- /dev/null
+++ b/plugins/check_overcr.c
@@ -0,0 +1,489 @@
+/******************************************************************************
+*
+* CHECK_OVERCR.C
+*
+* Program: Over-CR collector plugin for Nagios
+* License: GPL
+* Copyright (c) 1999 Ethan Galstad (nagios@nagios.org)
+*
+* $Id$
+*
+* Description:
+*
+* Notes:
+* - This plugin requires that Eric Molitors' Over-CR collector daemon
+* be running on any UNIX boxes you want to monitor. Over-CR
+* is available from * http://www.molitor.org/overcr/
+*
+* Modifications:
+*
+* 08-11-999 Jacob Lundqvist <jaclu@grm.se>
+* Load was presented as a one digit percentage - changed to two digit
+* value * before load of 11.2 was presented as "1.2%" (not very
+* high). Warning and Critical params were int's, not very good
+* for load, changed to doubles, so we can trap loadlimits like
+* 1.5. Also added more informative LOAD error messages.
+*
+* License Information:
+*
+* This program is free software; you can redistribute it and/or modify
+* it under the terms of the GNU General Public License as published by
+* the Free Software Foundation; either version 2 of the License, or
+* (at your option) any later version.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU General Public License for more details.
+*
+* You should have received a copy of the GNU General Public License
+* along with this program; if not, write to the Free Software
+* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*
+*****************************************************************************/
+
+#include "config.h"
+#include "common.h"
+#include "netutils.h"
+#include "utils.h"
+
+#define CHECK_NONE 0
+#define CHECK_LOAD1 1
+#define CHECK_LOAD5 2
+#define CHECK_LOAD15 4
+#define CHECK_DPU 8
+#define CHECK_PROCS 16
+#define CHECK_NETSTAT 32
+#define CHECK_UPTIME 64
+
+#define PORT 2000
+
+#define PROGNAME "check_overcr"
+
+char *server_address = NULL;
+int server_port = PORT;
+double warning_value = 0L;
+double critical_value = 0L;
+int check_warning_value = FALSE;
+int check_critical_value = FALSE;
+int vars_to_check = CHECK_NONE;
+int cmd_timeout = 1;
+
+int netstat_port = 0;
+char *disk_name = NULL;
+char *process_name = NULL;
+
+int process_arguments (int, char **);
+void print_usage (void);
+void print_help (void);
+
+int
+main (int argc, char **argv)
+{
+ int result;
+ char send_buffer[MAX_INPUT_BUFFER];
+ char recv_buffer[MAX_INPUT_BUFFER];
+ char output_message[MAX_INPUT_BUFFER];
+ char temp_buffer[MAX_INPUT_BUFFER];
+ char *temp_ptr = NULL;
+ int found_disk = FALSE;
+ unsigned long percent_used_disk_space = 100;
+ double load;
+ double load_1min;
+ double load_5min;
+ double load_15min;
+ int port_connections = 0;
+ int processes = 0;
+ double uptime_raw_hours;
+ int uptime_raw_minutes = 0;
+ int uptime_days = 0;
+ int uptime_hours = 0;
+ int uptime_minutes = 0;
+
+ if (process_arguments (argc, argv) == ERROR)
+ usage ("Could not parse arguments\n");
+
+ /* initialize alarm signal handling */
+ signal (SIGALRM, socket_timeout_alarm_handler);
+
+ /* set socket timeout */
+ alarm (socket_timeout);
+
+ result = STATE_OK;
+
+ if (vars_to_check == CHECK_LOAD1 || vars_to_check == CHECK_LOAD5
+ || vars_to_check == CHECK_LOAD15) {
+
+ strcpy (send_buffer, "LOAD\r\nQUIT\r\n");
+ result =
+ process_tcp_request2 (server_address, server_port, send_buffer,
+ recv_buffer, sizeof (recv_buffer));
+ if (result != STATE_OK)
+ return result;
+
+ temp_ptr = (char *) strtok (recv_buffer, "\r\n");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server - no load information\n");
+ return STATE_CRITICAL;
+ }
+ load_1min = strtod (temp_ptr, NULL);
+ temp_ptr = (char *) strtok (NULL, "\r\n");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server after load 1\n");
+ return STATE_CRITICAL;
+ }
+ load_5min = strtod (temp_ptr, NULL);
+ temp_ptr = (char *) strtok (NULL, "\r\n");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server after load 5\n");
+ return STATE_CRITICAL;
+ }
+ load_15min = strtod (temp_ptr, NULL);
+
+
+ switch (vars_to_check) {
+ case CHECK_LOAD1:
+ strcpy (temp_buffer, "1");
+ load = load_1min;
+ break;
+ case CHECK_LOAD5:
+ strcpy (temp_buffer, "5");
+ load = load_5min;
+ break;
+ default:
+ strcpy (temp_buffer, "15");
+ load = load_15min;
+ break;
+ }
+
+ if (check_critical_value == TRUE && (load >= critical_value))
+ result = STATE_CRITICAL;
+ else if (check_warning_value == TRUE && (load >= warning_value))
+ result = STATE_WARNING;
+ sprintf (output_message, "Load %s - %s-min load average = %0.2f",
+ (result == STATE_OK) ? "ok" : "problem", temp_buffer, load);
+ }
+
+
+ else if (vars_to_check == CHECK_DPU) {
+
+ sprintf (send_buffer, "DISKSPACE\r\n");
+ result =
+ process_tcp_request2 (server_address, server_port, send_buffer,
+ recv_buffer, sizeof (recv_buffer));
+ if (result != STATE_OK)
+ return result;
+
+ for (temp_ptr = (char *) strtok (recv_buffer, " "); temp_ptr != NULL;
+ temp_ptr = (char *) strtok (NULL, " ")) {
+
+ if (!strcmp (temp_ptr, disk_name)) {
+ found_disk = TRUE;
+ temp_ptr = (char *) strtok (NULL, "%");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server\n");
+ return STATE_CRITICAL;
+ }
+ percent_used_disk_space = strtoul (temp_ptr, NULL, 10);
+ break;
+ }
+
+ temp_ptr = (char *) strtok (NULL, "\r\n");
+ }
+
+ /* error if we couldn't find the info for the disk */
+ if (found_disk == FALSE) {
+ sprintf (output_message, "Error: Disk '%s' non-existent or not mounted",
+ disk_name);
+ result = STATE_CRITICAL;
+ }
+
+ /* else check the disk space used */
+ else {
+
+ if (check_critical_value == TRUE
+ && (percent_used_disk_space >= critical_value)) result =
+ STATE_CRITICAL;
+ else if (check_warning_value == TRUE
+ && (percent_used_disk_space >= warning_value)) result =
+ STATE_WARNING;
+
+ sprintf (output_message, "Disk %s - %lu%% used on %s",
+ (result == STATE_OK) ? "ok" : "problem",
+ percent_used_disk_space, disk_name);
+ }
+ }
+
+ else if (vars_to_check == CHECK_NETSTAT) {
+
+ sprintf (send_buffer, "NETSTAT %d\r\n", netstat_port);
+ result =
+ process_tcp_request2 (server_address, server_port, send_buffer,
+ recv_buffer, sizeof (recv_buffer));
+ if (result != STATE_OK)
+ return result;
+
+ port_connections = strtod (recv_buffer, NULL);
+
+ if (check_critical_value == TRUE && (port_connections >= critical_value))
+ result = STATE_CRITICAL;
+ else if (check_warning_value == TRUE
+ && (port_connections >= warning_value)) result = STATE_WARNING;
+
+ sprintf (output_message, "Net %s - %d connection%s on port %d",
+ (result == STATE_OK) ? "ok" : "problem", port_connections,
+ (port_connections == 1) ? "" : "s", netstat_port);
+ }
+
+ else if (vars_to_check == CHECK_PROCS) {
+
+ sprintf (send_buffer, "PROCESS %s\r\n", process_name);
+ result =
+ process_tcp_request2 (server_address, server_port, send_buffer,
+ recv_buffer, sizeof (recv_buffer));
+ if (result != STATE_OK)
+ return result;
+
+ temp_ptr = (char *) strtok (recv_buffer, "(");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server\n");
+ return STATE_CRITICAL;
+ }
+ temp_ptr = (char *) strtok (NULL, ")");
+ if (temp_ptr == NULL) {
+ printf ("Invalid response from server\n");
+ return STATE_CRITICAL;
+ }
+ processes = strtod (temp_ptr, NULL);
+
+ if (check_critical_value == TRUE && (processes >= critical_value))
+ result = STATE_CRITICAL;
+ else if (check_warning_value == TRUE && (processes >= warning_value))
+ result = STATE_WARNING;
+
+ sprintf (output_message, "Process %s - %d instance%s of %s running",
+ (result == STATE_OK) ? "ok" : "problem", processes,
+ (processes == 1) ? "" : "s", process_name);
+ }
+
+ else if (vars_to_check == CHECK_UPTIME) {
+
+ sprintf (send_buffer, "UPTIME\r\n");
+ result =
+ process_tcp_request2 (server_address, server_port, send_buffer,
+ recv_buffer, sizeof (recv_buffer));
+ if (result != STATE_OK)
+ return result;
+
+ uptime_raw_hours = strtod (recv_buffer, NULL);
+ uptime_raw_minutes = (unsigned long) (uptime_raw_hours * 60.0);
+
+ if (check_critical_value == TRUE
+ && (uptime_raw_minutes <= critical_value)) result = STATE_CRITICAL;
+ else if (check_warning_value == TRUE
+ && (uptime_raw_minutes <= warning_value)) result = STATE_WARNING;
+
+ uptime_days = uptime_raw_minutes / 1440;
+ uptime_raw_minutes %= 1440;
+ uptime_hours = uptime_raw_minutes / 60;
+ uptime_raw_minutes %= 60;
+ uptime_minutes = uptime_raw_minutes;
+
+ sprintf (output_message, "Uptime %s - Up %d days %d hours %d minutes",
+ (result == STATE_OK) ? "ok" : "problem", uptime_days,
+ uptime_hours, uptime_minutes);
+ }
+
+ else {
+ strcpy (output_message, "Nothing to check!\n");
+ result = STATE_UNKNOWN;
+ }
+
+ /* reset timeout */
+ alarm (0);
+
+ printf ("%s\n", output_message);
+
+ return result;
+}
+
+
+
+
+
+/* process command-line arguments */
+int
+process_arguments (int argc, char **argv)
+{
+ int c;
+
+#ifdef HAVE_GETOPT_H
+ int option_index = 0;
+ static struct option long_options[] = {
+ {"port", required_argument, 0, 'p'},
+ {"timeout", required_argument, 0, 't'},
+ {"critical", required_argument, 0, 'c'},
+ {"warning", required_argument, 0, 'w'},
+ {"variable", required_argument, 0, 'v'},
+ {"hostname", required_argument, 0, 'H'},
+ {"version", no_argument, 0, 'V'},
+ {"help", no_argument, 0, 'h'},
+ {0, 0, 0, 0}
+ };
+#endif
+
+ /* no options were supplied */
+ if (argc < 2)
+ return ERROR;
+
+ /* backwards compatibility */
+ if (!is_option (argv[1])) {
+ server_address = argv[1];
+ argv[1] = argv[0];
+ argv = &argv[1];
+ argc--;
+ }
+
+ for (c = 1; c < argc; c++) {
+ if (strcmp ("-to", argv[c]) == 0)
+ strcpy (argv[c], "-t");
+ else if (strcmp ("-wv", argv[c]) == 0)
+ strcpy (argv[c], "-w");
+ else if (strcmp ("-cv", argv[c]) == 0)
+ strcpy (argv[c], "-c");
+ }
+
+ while (1) {
+#ifdef HAVE_GETOPT_H
+ c =
+ getopt_long (argc, argv, "+hVH:t:c:w:p:v:", long_options,
+ &option_index);
+#else
+ c = getopt (argc, argv, "+hVH:t:c:w:p:v:");
+#endif
+
+ if (c == -1 || c == EOF || c == 1)
+ break;
+
+ switch (c) {
+ case '?': /* print short usage statement if args not parsable */
+ printf ("%s: Unknown argument: %s\n\n", my_basename (argv[0]), optarg);
+ print_usage ();
+ exit (STATE_UNKNOWN);
+ case 'h': /* help */
+ print_help ();
+ exit (STATE_OK);
+ case 'V': /* version */
+ print_revision (my_basename (argv[0]), "$Revision$");
+ exit (STATE_OK);
+ case 'H': /* hostname */
+ server_address = optarg;
+ break;
+ case 'p': /* port */
+ if (is_intnonneg (optarg))
+ server_port = atoi (optarg);
+ else
+ terminate (STATE_UNKNOWN,
+ "Server port an integer (seconds)\nType '%s -h' for additional help\n",
+ PROGNAME);
+ break;
+ case 'v': /* variable */
+ if (strcmp (optarg, "LOAD1") == 0)
+ vars_to_check = CHECK_LOAD1;
+ else if (strcmp (optarg, "LOAD5") == 0)
+ vars_to_check = CHECK_LOAD5;
+ else if (strcmp (optarg, "LOAD15") == 0)
+ vars_to_check = CHECK_LOAD15;
+ else if (strcmp (optarg, "UPTIME") == 0)
+ vars_to_check = CHECK_UPTIME;
+ else if (strstr (optarg, "PROC") == optarg) {
+ vars_to_check = CHECK_PROCS;
+ process_name = strscpy (process_name, optarg + 4);
+ }
+ else if (strstr (optarg, "NET") == optarg) {
+ vars_to_check = CHECK_NETSTAT;
+ netstat_port = atoi (optarg + 3);
+ }
+ else if (strstr (optarg, "DPU") == optarg) {
+ vars_to_check = CHECK_DPU;
+ disk_name = strscpy (disk_name, optarg + 3);
+ }
+ else
+ return ERROR;
+ break;
+ case 'w': /* warning threshold */
+ warning_value = strtoul (optarg, NULL, 10);
+ check_warning_value = TRUE;
+ break;
+ case 'c': /* critical threshold */
+ critical_value = strtoul (optarg, NULL, 10);
+ check_critical_value = TRUE;
+ break;
+ case 't': /* timeout */
+ socket_timeout = atoi (optarg);
+ if (socket_timeout <= 0)
+ return ERROR;
+ }
+
+ }
+ return OK;
+}
+
+
+
+
+
+void
+print_usage (void)
+{
+ printf
+ ("Usage: %s -H host [-p port] [-v variable] [-w warning] [-c critical] [-t timeout]\n",
+ PROGNAME);
+}
+
+
+
+
+
+void
+print_help (void)
+{
+ print_revision (PROGNAME, "$Revision$");
+ printf
+ ("Copyright (c) 2000 Ethan Galstad/Karl DeBisschop\n\n"
+ "This plugin attempts to contact the Over-CR collector daemon running on the\n"
+ "remote UNIX server in order to gather the requested system information. This\n"
+ "plugin requres that Eric Molitors' Over-CR collector daemon be running on the\n"
+ "remote server. Over-CR can be downloaded from http://www.molitor.org/overcr\n"
+ "(This plugin was tested with version 0.99.53 of the Over-CR collector)\n\n");
+ print_usage ();
+ printf
+ ("\nOptions:\n"
+ "-H, --hostname=HOST\n"
+ " Name of the host to check\n"
+ "-p, --port=INTEGER\n"
+ " Optional port number (default: %d)\n"
+ "-v, --variable=STRING\n"
+ " Variable to check. Valid variables include:\n"
+ " LOAD1 = 1 minute average CPU load\n"
+ " LOAD5 = 5 minute average CPU load\n"
+ " LOAD15 = 15 minute average CPU load\n"
+ " DPU<filesys> = percent used disk space on filesystem <filesys>\n"
+ " PROC<process> = number of running processes with name <process>\n"
+ " NET<port> = number of active connections on TCP port <port>\n"
+ " UPTIME = system uptime in seconds\n"
+ " -w, --warning=INTEGER\n"
+ " Threshold which will result in a warning status\n"
+ " -c, --critical=INTEGER\n"
+ " Threshold which will result in a critical status\n"
+ " -t, --timeout=INTEGER\n"
+ " Seconds before connection attempt times out (default: %d)\n"
+ "-h, --help\n"
+ " Print this help screen\n"
+ "-V, --version\n"
+ " Print version information\n\n"
+ "Notes:\n"
+ " - For the available options, the critical threshold value should always be\n"
+ " higher than the warning threshold value, EXCEPT with the uptime variable\n"
+ " (i.e. lower uptimes are worse).\n", PORT, DEFAULT_SOCKET_TIMEOUT);
+}