/***************************************************************************** * * Monitoring check_ide_smart plugin * ide-smart 1.3 - IDE S.M.A.R.T. checking tool * * License: GPL * Copyright (C) 1998-1999 Ragnar Hojland Espinosa * 1998 Gadi Oxman * Copyright (c) 2000 Robert Dale * Copyright (c) 2000-2007 Monitoring Plugins Development Team * * Description: * * This file contains the check_ide_smart plugin * * This plugin checks a local hard drive with the (Linux specific) SMART * interface * * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . * * *****************************************************************************/ const char *progname = "check_ide_smart"; const char *copyright = "1998-2007"; const char *email = "devel@monitoring-plugins.org"; #include "common.h" #include "utils.h" void print_help(void); void print_usage(void); #include #include #include #ifdef __linux__ # include # include # define OPEN_MODE O_RDONLY #endif /* __linux__ */ #ifdef __NetBSD__ # include # include # include # include /* for __u8 and friends */ # include # include # include # include # define SMART_ENABLE WDSM_ENABLE_OPS # define SMART_DISABLE WDSM_DISABLE_OPS # define SMART_IMMEDIATE_OFFLINE WDSM_EXEC_OFFL_IMM # define SMART_AUTO_OFFLINE 0xdb /* undefined in NetBSD headers */ # define OPEN_MODE O_RDWR #endif /* __NetBSD__ */ #include #define NR_ATTRIBUTES 30 #define PREFAILURE 2 #define ADVISORY 1 #define OPERATIONAL 0 #define UNKNOWN -1 typedef struct threshold_s { __u8 id; __u8 threshold; __u8 reserved[10]; } __attribute__((packed)) threshold_t; typedef struct thresholds_s { __u16 revision; threshold_t thresholds[NR_ATTRIBUTES]; __u8 reserved[18]; __u8 vendor[131]; __u8 checksum; } __attribute__((packed)) thresholds_t; typedef struct value_s { __u8 id; __u16 status; __u8 value; __u8 vendor[8]; } __attribute__((packed)) value_t; typedef struct values_s { __u16 revision; value_t values[NR_ATTRIBUTES]; __u8 offline_status; __u8 vendor1; __u16 offline_timeout; __u8 vendor2; __u8 offline_capability; __u16 smart_capability; __u8 reserved[16]; __u8 vendor[125]; __u8 checksum; } __attribute__((packed)) values_t; struct { __u8 value; char *text; } offline_status_text[] = {{0x00, "NeverStarted"}, {0x02, "Completed"}, {0x04, "Suspended"}, {0x05, "Aborted"}, {0x06, "Failed"}, {0, 0}}; struct { __u8 value; char *text; } smart_command[] = {{SMART_ENABLE, "SMART_ENABLE"}, {SMART_DISABLE, "SMART_DISABLE"}, {SMART_IMMEDIATE_OFFLINE, "SMART_IMMEDIATE_OFFLINE"}, {SMART_AUTO_OFFLINE, "SMART_AUTO_OFFLINE"}}; /* Index to smart_command table, keep in order */ enum SmartCommand { SMART_CMD_ENABLE, SMART_CMD_DISABLE, SMART_CMD_IMMEDIATE_OFFLINE, SMART_CMD_AUTO_OFFLINE }; char *get_offline_text(int); int smart_read_values(int, values_t *); int nagios(values_t *, thresholds_t *); void print_value(value_t *, threshold_t *); void print_values(values_t *, thresholds_t *); int smart_cmd_simple(int, enum SmartCommand, __u8, bool); int smart_read_thresholds(int, thresholds_t *); bool verbose = false; int main(int argc, char *argv[]) { char *device = NULL; int o, longindex; int retval = 0; thresholds_t thresholds; values_t values; int fd; static struct option longopts[] = {{"device", required_argument, 0, 'd'}, {"immediate", no_argument, 0, 'i'}, {"quiet-check", no_argument, 0, 'q'}, {"auto-on", no_argument, 0, '1'}, {"auto-off", no_argument, 0, '0'}, {"nagios", no_argument, 0, 'n'}, /* DEPRECATED, but we still accept it */ {"help", no_argument, 0, 'h'}, {"version", no_argument, 0, 'V'}, {0, 0, 0, 0}}; /* Parse extra opts if any */ argv = np_extra_opts(&argc, argv, progname); setlocale(LC_ALL, ""); bindtextdomain(PACKAGE, LOCALEDIR); textdomain(PACKAGE); while (true) { o = getopt_long(argc, argv, "+d:iq10nhVv", longopts, &longindex); if (o == -1 || o == EOF || o == 1) break; switch (o) { case 'd': device = optarg; break; case 'q': fprintf(stderr, "%s\n", _("DEPRECATION WARNING: the -q switch (quiet output) is no longer \"quiet\".")); fprintf(stderr, "%s\n", _("Nagios-compatible output is now always returned.")); break; case 'i': case '1': case '0': printf("%s\n", _("SMART commands are broken and have been disabled (See Notes in --help).")); return STATE_CRITICAL; break; case 'n': fprintf(stderr, "%s\n", _("DEPRECATION WARNING: the -n switch (Nagios-compatible output) is now the")); fprintf(stderr, "%s\n", _("default and will be removed from future releases.")); break; case 'v': /* verbose */ verbose = true; break; case 'h': print_help(); return STATE_UNKNOWN; case 'V': print_revision(progname, NP_VERSION); return STATE_UNKNOWN; default: usage5(); } } if (optind < argc) { device = argv[optind]; } if (!device) { print_help(); return STATE_UNKNOWN; } fd = open(device, OPEN_MODE); if (fd < 0) { printf(_("CRITICAL - Couldn't open device %s: %s\n"), device, strerror(errno)); return STATE_CRITICAL; } if (smart_cmd_simple(fd, SMART_CMD_ENABLE, 0, false)) { printf(_("CRITICAL - SMART_CMD_ENABLE\n")); return STATE_CRITICAL; } smart_read_values(fd, &values); smart_read_thresholds(fd, &thresholds); retval = nagios(&values, &thresholds); if (verbose) print_values(&values, &thresholds); close(fd); return retval; } char *get_offline_text(int status) { int i; for (i = 0; offline_status_text[i].text; i++) { if (offline_status_text[i].value == status) { return offline_status_text[i].text; } } return "UNKNOWN"; } int smart_read_values(int fd, values_t *values) { #ifdef __linux__ int e; __u8 args[4 + 512]; args[0] = WIN_SMART; args[1] = 0; args[2] = SMART_READ_VALUES; args[3] = 1; if (ioctl(fd, HDIO_DRIVE_CMD, &args)) { e = errno; printf(_("CRITICAL - SMART_READ_VALUES: %s\n"), strerror(errno)); return e; } memcpy(values, args + 4, 512); #endif /* __linux__ */ #ifdef __NetBSD__ struct atareq req; unsigned char inbuf[DEV_BSIZE]; memset(&req, 0, sizeof(req)); req.timeout = 1000; memset(&inbuf, 0, sizeof(inbuf)); req.flags = ATACMD_READ; req.features = WDSM_RD_DATA; req.command = WDCC_SMART; req.databuf = (char *)inbuf; req.datalen = sizeof(inbuf); req.cylinder = WDSMART_CYL; if (ioctl(fd, ATAIOCCOMMAND, &req) == 0) { if (req.retsts != ATACMD_OK) errno = ENODEV; } if (errno != 0) { int e = errno; printf(_("CRITICAL - SMART_READ_VALUES: %s\n"), strerror(errno)); return e; } (void)memcpy(values, inbuf, 512); #endif /* __NetBSD__ */ return 0; } int nagios(values_t *p, thresholds_t *t) { value_t *value = p->values; threshold_t *threshold = t->thresholds; int status = OPERATIONAL; int prefailure = 0; int advisory = 0; int failed = 0; int passed = 0; int total = 0; int i; for (i = 0; i < NR_ATTRIBUTES; i++) { if (value->id && threshold->id && value->id == threshold->id) { if (value->value < threshold->threshold) { ++failed; if (value->status & 1) { status = PREFAILURE; ++prefailure; } else { status = ADVISORY; ++advisory; } } else { ++passed; } ++total; } ++value; ++threshold; } switch (status) { case PREFAILURE: printf(_("CRITICAL - %d Harddrive PreFailure%cDetected! %d/%d tests failed.\n"), prefailure, prefailure > 1 ? 's' : ' ', failed, total); status = STATE_CRITICAL; break; case ADVISORY: printf(_("WARNING - %d Harddrive Advisor%s Detected. %d/%d tests failed.\n"), advisory, advisory > 1 ? "ies" : "y", failed, total); status = STATE_WARNING; break; case OPERATIONAL: printf(_("OK - Operational (%d/%d tests passed)\n"), passed, total); status = STATE_OK; break; default: printf(_("ERROR - Status '%d' unknown. %d/%d tests passed\n"), status, passed, total); status = STATE_UNKNOWN; break; } return status; } void print_value(value_t *p, threshold_t *t) { printf("Id=%3d, Status=%2d {%s , %s}, Value=%3d, Threshold=%3d, %s\n", p->id, p->status, p->status & 1 ? "PreFailure" : "Advisory ", p->status & 2 ? "OnLine " : "OffLine", p->value, t->threshold, p->value >= t->threshold ? "Passed" : "Failed"); } void print_values(values_t *p, thresholds_t *t) { value_t *value = p->values; threshold_t *threshold = t->thresholds; int i; for (i = 0; i < NR_ATTRIBUTES; i++) { if (value->id && threshold->id && value->id == threshold->id) { print_value(value++, threshold++); } } printf(_("OffLineStatus=%d {%s}, AutoOffLine=%s, OffLineTimeout=%d minutes\n"), p->offline_status, get_offline_text(p->offline_status & 0x7f), (p->offline_status & 0x80 ? "Yes" : "No"), p->offline_timeout / 60); printf(_("OffLineCapability=%d {%s %s %s}\n"), p->offline_capability, p->offline_capability & 1 ? "Immediate" : "", p->offline_capability & 2 ? "Auto" : "", p->offline_capability & 4 ? "AbortOnCmd" : "SuspendOnCmd"); printf(_("SmartRevision=%d, CheckSum=%d, SmartCapability=%d {%s %s}\n"), p->revision, p->checksum, p->smart_capability, p->smart_capability & 1 ? "SaveOnStandBy" : "", p->smart_capability & 2 ? "AutoSave" : ""); } int smart_cmd_simple(int fd, enum SmartCommand command, __u8 val0, bool show_error) { int e = STATE_UNKNOWN; #ifdef __linux__ __u8 args[4]; args[0] = WIN_SMART; args[1] = val0; args[2] = smart_command[command].value; args[3] = 0; if (ioctl(fd, HDIO_DRIVE_CMD, &args)) { e = STATE_CRITICAL; if (show_error) printf(_("CRITICAL - %s: %s\n"), smart_command[command].text, strerror(errno)); } else { e = STATE_OK; if (show_error) printf(_("OK - Command sent (%s)\n"), smart_command[command].text); } #endif /* __linux__ */ #ifdef __NetBSD__ struct atareq req; memset(&req, 0, sizeof(req)); req.timeout = 1000; req.flags = ATACMD_READREG; req.features = smart_command[command].value; req.command = WDCC_SMART; req.cylinder = WDSMART_CYL; req.sec_count = val0; if (ioctl(fd, ATAIOCCOMMAND, &req) == 0) { if (req.retsts != ATACMD_OK) errno = ENODEV; if (req.cylinder != WDSMART_CYL) errno = ENODEV; } if (errno != 0) { e = STATE_CRITICAL; if (show_error) printf(_("CRITICAL - %s: %s\n"), smart_command[command].text, strerror(errno)); } else { e = STATE_OK; if (show_error) printf(_("OK - Command sent (%s)\n"), smart_command[command].text); } #endif /* __NetBSD__ */ return e; } int smart_read_thresholds(int fd, thresholds_t *thresholds) { #ifdef __linux__ int e; __u8 args[4 + 512]; args[0] = WIN_SMART; args[1] = 0; args[2] = SMART_READ_THRESHOLDS; args[3] = 1; if (ioctl(fd, HDIO_DRIVE_CMD, &args)) { e = errno; printf(_("CRITICAL - SMART_READ_THRESHOLDS: %s\n"), strerror(errno)); return e; } memcpy(thresholds, args + 4, 512); #endif /* __linux__ */ #ifdef __NetBSD__ struct atareq req; unsigned char inbuf[DEV_BSIZE]; memset(&req, 0, sizeof(req)); req.timeout = 1000; memset(&inbuf, 0, sizeof(inbuf)); req.flags = ATACMD_READ; req.features = WDSM_RD_THRESHOLDS; req.command = WDCC_SMART; req.databuf = (char *)inbuf; req.datalen = sizeof(inbuf); req.cylinder = WDSMART_CYL; if (ioctl(fd, ATAIOCCOMMAND, &req) == 0) { if (req.retsts != ATACMD_OK) errno = ENODEV; } if (errno != 0) { int e = errno; printf(_("CRITICAL - SMART_READ_THRESHOLDS: %s\n"), strerror(errno)); return e; } (void)memcpy(thresholds, inbuf, 512); #endif /* __NetBSD__ */ return 0; } void print_help(void) { print_revision(progname, NP_VERSION); printf("(C) 1999 Ragnar Hojland Espinosa \n"); printf("Plugin implementation - 1999 Robert Dale \n"); printf(COPYRIGHT, copyright, email); printf(_("This plugin checks a local hard drive with the (Linux specific) SMART interface " "[http://smartlinux.sourceforge.net/smart/index.php].")); printf("\n\n"); print_usage(); printf(UT_HELP_VRSN); printf(UT_EXTRA_OPTS); printf(" %s\n", "-d, --device=DEVICE"); printf(" %s\n", _("Select device DEVICE")); printf(" %s\n", _("Note: if the device is specified without this option, any further option will")); printf(" %s\n", _("be ignored.")); printf(UT_VERBOSE); printf("\n"); printf("%s\n", _("Notes:")); printf(" %s\n", _("The SMART command modes (-i/--immediate, -0/--auto-off and -1/--auto-on) were")); printf(" %s\n", _("broken in an underhand manner and have been disabled. You can use smartctl")); printf(" %s\n", _("instead:")); printf(" %s\n", _("-0/--auto-off: use \"smartctl --offlineauto=off\"")); printf(" %s\n", _("-1/--auto-on: use \"smartctl --offlineauto=on\"")); printf(" %s\n", _("-i/--immediate: use \"smartctl --test=offline\"")); printf(UT_SUPPORT); } /* todo : add to the long nanual as example * * Run with: check_ide-smart --nagios [-d] * Where DRIVE is an IDE drive, ie. /dev/hda, /dev/hdb, /dev/hdc * * - Returns 0 on no errors * - Returns 1 on advisories * - Returns 2 on prefailure * - Returns -1 not too often */ void print_usage(void) { printf("%s\n", _("Usage:")); printf("%s [-d ] [-v]", progname); }