| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547 |
- /******************************************************************************
- * Nagios check_ide_smart plugin
- *
- * License: GPL
- *
- * ide-smart 1.3 - IDE S.M.A.R.T. checking tool
- * Copyright (C) 1998-1999 Ragnar Hojland Espinosa <ragnar@lightside.dhis.org>
- * 1998 Gadi Oxman <gadio@netvision.net.il>
- *
- * Copyright (c) 2000 Robert Dale <rdale@digital-mission.com>
- * Copyright (c) 2000-2006 nagios-plugins team
- *
- * Last Modified: $Date$
- *
- * Description:
- *
- * This file contains the check_ide_smart plugin
- *
- * This plugin checks a local hard drive with the (Linux specific) SMART interface
- *
- *
- * License Information:
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- *
- * $Id$
- */
/*
 * Identification strings for this plugin.  They are handed to
 * print_revision() and to the COPYRIGHT format in print_help(), and
 * progname is echoed by print_usage().
 */
const char *progname  = "check_ide_smart";
const char *revision  = "$Revision$";
const char *copyright = "2000-2006";
const char *email     = "nagiosplug-devel@lists.sourceforge.net";
-
- #include "common.h"
- #include "utils.h"
- void print_help (void);
- void print_usage (void);
- #include <sys/stat.h>
- #include <sys/ioctl.h>
- #include <fcntl.h>
- #include <linux/hdreg.h>
- #include <linux/types.h>
- #include <errno.h>
-
/* Number of entries in the values[] and thresholds[] attribute tables. */
#define NR_ATTRIBUTES 30

#ifndef TRUE
#define TRUE 1
#endif

/* Drive health classifications used when evaluating the attributes. */
#define PREFAILURE 2
#define ADVISORY 1
#define OPERATIONAL 0
#define UNKNOWN -1

/*
 * The four structures below are packed because the 512 data bytes
 * returned by the drive are copied straight over them with memcpy();
 * any compiler-inserted padding would shift the fields.
 */

/* One threshold table entry (12 bytes). */
typedef struct threshold_s
{
  __u8 id;
  __u8 threshold;
  __u8 reserved[10];
} __attribute__ ((packed)) threshold_t;

/* Complete threshold table as read by smart_read_thresholds(). */
typedef struct thresholds_s
{
  __u16 revision;
  threshold_t thresholds[NR_ATTRIBUTES];
  __u8 reserved[18];
  __u8 vendor[131];
  __u8 checksum;
} __attribute__ ((packed)) thresholds_t;

/* One attribute value entry (12 bytes). */
typedef struct value_s
{
  __u8 id;
  __u16 status;			/* bit 0: pre-failure, bit 1: on-line (see print_value) */
  __u8 value;
  __u8 vendor[8];
} __attribute__ ((packed)) value_t;

/* Complete attribute value table as read by smart_read_values(). */
typedef struct values_s
{
  __u16 revision;
  value_t values[NR_ATTRIBUTES];
  __u8 offline_status;
  __u8 vendor1;
  __u16 offline_timeout;
  __u8 vendor2;
  __u8 offline_capability;
  __u16 smart_capability;
  __u8 reserved[16];
  __u8 vendor[125];
  __u8 checksum;
} __attribute__ ((packed)) values_t;
/*
 * Printable names for the off-line status codes.  The list ends with an
 * entry whose text pointer is null; get_offline_text() relies on that
 * sentinel to stop its search.
 */
struct
{
  __u8 value;
  char *text;
} offline_status_text[] = {
  {0x00, "NeverStarted"},
  {0x02, "Completed"},
  {0x04, "Suspended"},
  {0x05, "Aborted"},
  {0x06, "Failed"},
  {0, 0}
};
/*
 * SMART sub-commands that smart_cmd_simple() can issue, paired with the
 * name printed when the command fails.  Entries are looked up by
 * enum SmartCommand, so the order here must match that enum.
 */
struct
{
  __u8 value;
  char *text;
} smart_command[] = {
  {SMART_ENABLE, "SMART_ENABLE"},
  {SMART_DISABLE, "SMART_DISABLE"},
  {SMART_IMMEDIATE_OFFLINE, "SMART_IMMEDIATE_OFFLINE"},
  {SMART_AUTO_OFFLINE, "SMART_AUTO_OFFLINE"}
};
/*
 * Indices into the smart_command table.  The enumerators must stay in
 * the same order as the table rows.
 */
enum SmartCommand
{
  SMART_CMD_ENABLE,
  SMART_CMD_DISABLE,
  SMART_CMD_IMMEDIATE_OFFLINE,
  SMART_CMD_AUTO_OFFLINE
};
- void print_values (values_t * p, thresholds_t * t);
- int smart_cmd_simple (int fd, enum SmartCommand command, __u8 val0, char show_error);
- int
- main (int argc, char *argv[])
- {
- char *device = NULL;
- int command = -1;
- int o, longindex;
- int retval = 0;
- thresholds_t thresholds;
- values_t values;
- int fd;
- static struct option longopts[] = {
- {"device", required_argument, 0, 'd'},
- {"immediate", no_argument, 0, 'i'},
- {"quiet-check", no_argument, 0, 'q'},
- {"auto-on", no_argument, 0, '1'},
- {"auto-off", no_argument, 0, '0'},
- {"nagios", no_argument, 0, 'n'},
- {"help", no_argument, 0, 'h'},
- {"version", no_argument, 0, 'V'}, {0, 0, 0, 0}
- };
- setlocale (LC_ALL, "");
- bindtextdomain (PACKAGE, LOCALEDIR);
- textdomain (PACKAGE);
- while (1) {
-
- o = getopt_long (argc, argv, "+d:iq10nhV", longopts, &longindex);
- if (o == -1 || o == EOF || o == 1)
- break;
- switch (o) {
- case 'd':
- device = optarg;
- break;
- case 'q':
- command = 3;
- break;
- case 'i':
- command = 2;
- break;
- case '1':
- command = 1;
- break;
- case '0':
- command = 0;
- break;
- case 'n':
- command = 4;
- break;
- case 'h':
- print_help ();
- return STATE_OK;
- case 'V':
- print_revision (progname, revision);
- return STATE_OK;
- default:
- usage2 (_("Unknown argument"), optarg);
- }
- }
- if (optind < argc) {
- device = argv[optind];
- }
- if (!device) {
- print_help ();
- return STATE_OK;
- }
- fd = open (device, O_RDONLY);
- if (fd < 0) {
- printf (_("CRITICAL - Couldn't open device %s: %s\n"), device, strerror (errno));
- return STATE_CRITICAL;
- }
- if (smart_cmd_simple (fd, SMART_CMD_ENABLE, 0, TRUE)) {
- printf (_("CRITICAL - SMART_CMD_ENABLE\n"));
- return STATE_CRITICAL;
- }
- switch (command) {
- case 0:
- retval = smart_cmd_simple (fd, SMART_CMD_AUTO_OFFLINE, 0, TRUE);
- break;
- case 1:
- retval = smart_cmd_simple (fd, SMART_CMD_AUTO_OFFLINE, 0xF8, TRUE);
- break;
- case 2:
- retval = smart_cmd_simple (fd, SMART_CMD_IMMEDIATE_OFFLINE, 0, TRUE);
- break;
- case 3:
- smart_read_values (fd, &values);
- smart_read_thresholds (fd, &thresholds);
- retval = values_not_passed (&values, &thresholds);
- break;
- case 4:
- smart_read_values (fd, &values);
- smart_read_thresholds (fd, &thresholds);
- retval = nagios (&values, &thresholds);
- break;
- default:
- smart_read_values (fd, &values);
- smart_read_thresholds (fd, &thresholds);
- print_values (&values, &thresholds);
- break;
- }
- close (fd);
- return retval;
- }
- char *
- get_offline_text (int status)
- {
- int i;
- for (i = 0; offline_status_text[i].text; i++) {
- if (offline_status_text[i].value == status) {
- return offline_status_text[i].text;
- }
- }
- return "UNKNOW";
- }
- int
- smart_read_values (int fd, values_t * values)
- {
- int e;
- __u8 args[4 + 512];
- args[0] = WIN_SMART;
- args[1] = 0;
- args[2] = SMART_READ_VALUES;
- args[3] = 1;
- if (ioctl (fd, HDIO_DRIVE_CMD, &args)) {
- e = errno;
- printf (_("CRITICAL - SMART_READ_VALUES: %s\n"), strerror (errno));
- return e;
- }
- memcpy (values, args + 4, 512);
- return 0;
- }
- int
- values_not_passed (values_t * p, thresholds_t * t)
- {
- value_t * value = p->values;
- threshold_t * threshold = t->thresholds;
- int failed = 0;
- int passed = 0;
- int i;
- for (i = 0; i < NR_ATTRIBUTES; i++) {
- if (value->id && threshold->id && value->id == threshold->id) {
- if (value->value <= threshold->threshold) {
- ++failed;
- }
- else {
- ++passed;
- }
- }
- ++value;
- ++threshold;
- }
- return (passed ? -failed : 2);
- }
- int
- nagios (values_t * p, thresholds_t * t)
- {
- value_t * value = p->values;
- threshold_t * threshold = t->thresholds;
- int status = OPERATIONAL;
- int prefailure = 0;
- int advisory = 0;
- int failed = 0;
- int passed = 0;
- int total = 0;
- int i;
- for (i = 0; i < NR_ATTRIBUTES; i++) {
- if (value->id && threshold->id && value->id == threshold->id) {
- if (value->value <= threshold->threshold) {
- ++failed;
- if (value->status & 1) {
- status = PREFAILURE;
- ++prefailure;
- }
- else {
- status = ADVISORY;
- ++advisory;
- }
- }
- else {
- ++passed;
- }
- ++total;
- }
- ++value;
- ++threshold;
- }
- switch (status) {
- case PREFAILURE:
- printf (_("CRITICAL - %d Harddrive PreFailure%cDetected! %d/%d tests failed.\n"),
- prefailure,
- prefailure > 1 ? 's' : ' ',
- failed,
- total);
- status=STATE_CRITICAL;
- break;
- case ADVISORY:
- printf (_("WARNING - %d Harddrive Advisor%s Detected. %d/%d tests failed.\n"),
- advisory,
- advisory > 1 ? "ies" : "y",
- failed,
- total);
- status=STATE_WARNING;
- break;
- case OPERATIONAL:
- printf (_("OK - Operational (%d/%d tests passed)\n"), passed, total);
- status=STATE_OK;
- break;
- default:
- printf (_("ERROR - Status '%d' unkown. %d/%d tests passed\n"), status,
- passed, total);
- status = STATE_UNKNOWN;
- break;
- }
- return status;
- }
- void
- print_value (value_t * p, threshold_t * t)
- {
- printf ("Id=%3d, Status=%2d {%s , %s}, Value=%3d, Threshold=%3d, %s\n",
- p->id, p->status, p->status & 1 ? "PreFailure" : "Advisory ",
- p->status & 2 ? "OnLine " : "OffLine", p->value, t->threshold,
- p->value > t->threshold ? "Passed" : "Failed");
- }
- void
- print_values (values_t * p, thresholds_t * t)
- {
- value_t * value = p->values;
- threshold_t * threshold = t->thresholds;
- int i;
- for (i = 0; i < NR_ATTRIBUTES; i++) {
- if (value->id && threshold->id && value->id == threshold->id) {
- print_value (value++, threshold++);
- }
- }
- printf
- (_("OffLineStatus=%d {%s}, AutoOffLine=%s, OffLineTimeout=%d minutes\n"),
- p->offline_status,
- get_offline_text (p->offline_status & 0x7f),
- (p->offline_status & 0x80 ? "Yes" : "No"),
- p->offline_timeout / 60);
- printf
- (_("OffLineCapability=%d {%s %s %s}\n"),
- p->offline_capability,
- p->offline_capability & 1 ? "Immediate" : "",
- p->offline_capability & 2 ? "Auto" : "",
- p->offline_capability & 4 ? "AbortOnCmd" : "SuspendOnCmd");
- printf
- (_("SmartRevision=%d, CheckSum=%d, SmartCapability=%d {%s %s}\n"),
- p->revision,
- p->checksum,
- p->smart_capability,
- p->smart_capability & 1 ? "SaveOnStandBy" : "",
- p->smart_capability & 2 ? "AutoSave" : "");
- }
- void
- print_thresholds (thresholds_t * p)
- {
- threshold_t * threshold = p->thresholds;
- int i;
- printf ("\n");
- printf ("SmartRevision=%d\n", p->revision);
- for (i = 0; i < NR_ATTRIBUTES; i++) {
- if (threshold->id) {
- printf ("Id=%3d, Threshold=%3d\n", threshold->id,
- threshold->threshold); }
- ++threshold;
- }
- printf ("CheckSum=%d\n", p->checksum);
- }
- int
- smart_cmd_simple (int fd, enum SmartCommand command, __u8 val0, char show_error)
- {
- int e = 0;
- __u8 args[4];
- args[0] = WIN_SMART;
- args[1] = val0;
- args[2] = smart_command[command].value;
- args[3] = 0;
- if (ioctl (fd, HDIO_DRIVE_CMD, &args)) {
- e = errno;
- if (show_error) {
- printf (_("CRITICAL - %s: %s\n"), smart_command[command].text, strerror (errno));
- }
- }
- return e;
- }
- int
- smart_read_thresholds (int fd, thresholds_t * thresholds)
- {
- int e;
- __u8 args[4 + 512];
- args[0] = WIN_SMART;
- args[1] = 0;
- args[2] = SMART_READ_THRESHOLDS;
- args[3] = 1;
- if (ioctl (fd, HDIO_DRIVE_CMD, &args)) {
- e = errno;
- printf (_("CRITICAL - SMART_READ_THRESHOLDS: %s\n"), strerror (errno));
- return e;
- }
- memcpy (thresholds, args + 4, 512);
- return 0;
- }
- void
- print_help (void)
- {
- print_revision (progname, revision);
- printf ("Nagios feature - 1999 Robert Dale <rdale@digital-mission.com>\n");
- printf ("(C) 1999 Ragnar Hojland Espinosa <ragnar@lightside.dhis.org>\n");
- printf (COPYRIGHT, copyright, email);
- printf (_("This plugin checks a local hard drive with the (Linux specific) SMART interface [http://smartlinux.sourceforge.net/smart/index.php]."));
-
- printf ("\n\n");
-
- print_usage ();
- printf (_(UT_HELP_VRSN));
-
- printf (" %s\n", "-d, --device=DEVICE");
- printf (" %s\n", _("Select device DEVICE"));
- printf (" %s\n", _("Note: if the device is selected with this option, _no_ other options are accepted"));
- printf (" %s\n", "-i, --immediate");
- printf (" %s\n", _("Perform immediately offline tests"));
- printf (" %s\n", "-q, --quiet-check");
- printf (" %s\n", _("Returns the number of failed tests"));
- printf (" %s\n", "-1, --auto-on");
- printf (" %s\n", _("Turn on automatic offline tests"));
- printf (" %s\n", "-0, --auto-off");
- printf (" %s\n", _("Turn off automatic offline tests"));
- printf (" %s\n", "-n, --nagios");
- printf (" %s\n", _("Output suitable for Nagios\n"));
- printf (_(UT_SUPPORT));
- }
/* TODO: add to the long manual as an example
 *
 * Run with: check_ide_smart --nagios [-d] <DRIVE>
 * Where DRIVE is an IDE drive, i.e. /dev/hda, /dev/hdb, /dev/hdc
 *
 * - Returns 0 on no errors
 * - Returns 1 on advisories
 * - Returns 2 on prefailure
 * - Returns -1 not too often
 */
- void
- print_usage (void)
- {
- printf (_("Usage:");
- printf ("%s [-d <device>] [-i <immediate>] [-q quiet] [-1 <auto-on>]",progname);
- pritnf (" [-O <auto-off>] [-n <nagios>]\n");
- }
|