##########################################################################
# $Id$
##########################################################################
#######################################################
## Copyright (c) 2008 Jaco Botha <jaco_botha@hotmail.com>
## Covered under the included MIT/X-Consortium License:
## http://www.opensource.org/licenses/mit-license.php
## All modifications and contributions by other persons to
## this script are assumed to have been donated to the
## Logwatch project and thus assume the above copyright
## and licensing terms. If you want to make contributions
## under your own copyright or a different license this
## must be explicitly stated in the contribution an the
## Logwatch project reserves the right to not accept such
## contributions. If you have made significant
## contributions to this script and want to claim
## copyright please contact logwatch-devel@lists.sourceforge.net.
#########################################################
use strict;
my ($Device, $Msg, $Test);
my %ParamChanges = ();
my %TempChanges = ();
my %TempLimit = ();
my %TempCritLimit = ();
my %Pendsectors = ();
my %NumPendsectors = ();
my %Offsectors = ();
my %NumOffsectors = ();
my %Warnings = ();
my %UnableToReg = ();
my $ShutdownFailed = 0;
my $StartupFailed = 0;
my %NotInDatabase = ();
my %CantMonitor = ();
my $UnableToMonitor = 0;
my %DriveTest = ();
my %Failed = ();
my %OtherList = ();
my $DLine = 0;
my %UnavailableDev = ();
my %SataDisk = ();
my %CheckFailed = ();
my %Monitoring = ();
my %DeviceInfo = ();
my $Detail = $ENV{'LOGWATCH_DETAIL_LEVEL'} || 0;
my $IgnoreUnmatched = $ENV{'smartd_ignore_unmatched'} || 0;
while (defined(my $ThisLine = <STDIN>)) {
chomp($ThisLine);
if ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), No such device(?: or address)?, open\(\) failed/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), open\(\) failed: No such device(?: or address)?/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), found in smartd database./ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), not found in smartd database./ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), opened/)) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), appears to lack SMART*/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), enabled autosave \(cleared GLTSD bit\)\./ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), enabled SMART Attribute Autosave/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), enabled SMART Automatic Offline Testing/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), Self-Test Log error count increased from \d+ to \d+/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), new Self-Test Log error at hour timestamp \d+/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), same Attribute has different ID numbers:/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Num *Test_Description *Status *Remaining *LifeTime/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^# *[0-9]+ Short offline *Completed:/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^# *[0-9]+ Extended offline *Completed:/ )) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^# *[0-9]+ Offline *Fatal or unknown error/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), not capable of SMART (Health Status |self-)check/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), is in STANDBY mode, skipping checks/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), self-test in progress, [0-9]+% remaining/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), previous self-test completed without error/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), type changed from \'\w+\' to \'\w+\'/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), state (?:read from|written to)/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), CHECK POWER STATUS spins up disk/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), STANDBY mode ignored due to reached limit of skipped checks/ )) {
# ignore
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), is back in ACTIVE or IDLE mode, resuming checks/ )) {
# ignore
} elsif ( $ThisLine =~ /^file \/var\/run\/smartd.pid written containing PID [0-9]+/ ) {
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^ *$/ )) {
# ignore empty lines
} elsif ( ($ThisLine =~ /^smartd version/)
|| ($ThisLine =~ /^smartd [0-9.]+ [0-9-]+ r[0-9]+ \[.*\]/)
|| ($ThisLine =~ /^Home page/)
|| ($ThisLine =~ /Copyright \(C\) [0-9-]+(?: by|,) Bruce Allen/)
|| ($ThisLine =~ /configuration file/i)
|| ($ThisLine =~ /\[trip Temperature is \d+ Celsius\]/)
|| ($ThisLine =~ /^Monitoring/)
|| ($ThisLine =~ /smartd received signal 15: Terminated/)
|| ($ThisLine =~ /smartd is exiting \(exit status 0\)/)
|| ($ThisLine =~ /smartd has fork/)
|| ($ThisLine =~ /smartd (startup|shutdown) succeeded/)
|| ($ThisLine =~ /Unable to register device (.*) \(no Directive -d removable\). Exiting/)
|| ($ThisLine =~ /Device (.*), SATA disks accessed via libata are not currently supported by smartmontools./)
|| ($ThisLine =~ /Device: (.*), IE \(SMART\) not enabled, skip device/)
|| ($ThisLine =~ /^Try '.*' to turn on SMART features/)
|| ($ThisLine =~ /Device: (.*), Bad IEC (SMART) mode page, err=-5, skip device/)
|| ($ThisLine =~ /Drive: DEVICESCAN, implied '-a' Directive on line [\d]+ of file/)
|| ($ThisLine =~ /packet devices \[this device CD\/DVD\] not SMART capable/)
|| ($ThisLine =~ /System clock time adjusted to the past/) )
{
# ignore
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), is SMART capable. Adding to "monitor" list./ )) {
$Monitoring{$Device} = 1;
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), ([^,]+, S\/N:[^,]+,.* FW:.*)/ )) {
$DeviceInfo{$Device} = $Msg;
} elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), (\[[^,]+, lu id: .*)/ )) {
$DeviceInfo{$Device} = $Msg;
# } elsif ( ($Device,$Msg) = ($ThisLine =~ /^Device: ([^,]+), (.*)$/)) {
# $ParamChanges{$Device}{$Msg}++;
} elsif ( ($Device) = ($ThisLine =~ /^Device: ([^,]+), not found in smartd database./ )) {
$NotInDatabase{$Device}++;
} elsif ( my ($Device,$AttribType,$Code,$Name,undef,undef,undef,$RawVal) = ($ThisLine =~ /^Device: ([^,]+), SMART ([A-Za-z]+) Attribute: ([0-9]+) (Temperature_Celsius) changed from ([0-9]+) (\[Raw [0-9]+(?: \([0-9]+\s[0-9]+\s[0-9]+\s[0-9]+(?:\s[0-9])?\))?\]) to ([0-9]+) \[Raw ([0-9]+)(?: \([0-9]+\s[0-9]+\s[0-9]+\s[0-9]+(?:\s[0-9])?\))?\]/)) {
push @{$TempChanges{$Device}}, $RawVal;
# smartd reports temperature changes this way only for SCSI disks
} elsif ( my ($Device,$AttribType,$Code,$Name,undef,undef,$NewVal) = ($ThisLine =~ /^Device: ([^,]+), SMART ([A-Za-z]+) Attribute: ([0-9]+) ([A-Za-z_]+) changed from ([0-9]+) (\[Raw [0-9]+\] )?to ([0-9]+)/)) {
push (@{$ParamChanges{$Device}{"$AttribType: $Name ($Code)"}}, $NewVal);
} elsif ( my ($Device,$Name,undef,$NewVal) = ($ThisLine =~ /^Device: ([^,]+), (.*) increased from ([0-9]+) to ([0-9]+)/) ) {
push (@{$ParamChanges{$Device}{"information: $Name"}}, $NewVal);
} elsif ( my ($Device,$NewVal) = ($ThisLine =~ /^Device: ([^,]+), initial Temperature is (\d+) Celsius/)) {
push @{$TempChanges{$Device}},$NewVal;
} elsif ( my ($Device,$Limit) = ($ThisLine =~ /^Device: ([^,]+), Temperature \d+ Celsius reached limit of (\d+) Celsius/)) {
# Device: /dev/sda, Temperature 37 Celsius reached limit of 10 Celsius (Min/Max 37/37)
$TempLimit{"$Device,$Limit"}++;
} elsif ( my ($Device,$Limit) = ($ThisLine =~ /^Device: ([^,]+), Temperature \d+ Celsius reached critical limit of (\d+) Celsius/)) {
# Device: /dev/sda, Temperature 38 Celsius reached critical limit of 15 Celsius (Min/Max 38!/39)
$TempCritLimit{"$Device,$Limit"}++;
} elsif ( my ($Device,$NewVal) = ($ThisLine =~ /^Device: ([^,]+), Temperature changed [-+]?\d+ Celsius to (\d+) Celsius/)) {
push @{$TempChanges{$Device}},$NewVal;
} elsif ( my ($Device, $Num) = ($ThisLine =~ /^Device: ([^,]+), (\d+) Currently unreadable \(pending\) sectors/) ) {
$Pendsectors{$Device}++;
$NumPendsectors{$Device} = $Num;
} elsif ( my ($Device, $Num) = ($ThisLine =~ /^Device: ([^,]+), (\d+) Offline uncorrectable sectors/) ) {
$Offsectors{$Device}++;
$NumOffsectors{$Device} = $Num;
} elsif ( my ($Device,$TestType) = ($ThisLine =~ /^Device: ([^,]+), starting scheduled ((?:Short|Long|Conveyance|Selective) Self-|Offline Immediate )Test/) ) {
$DriveTest{$Device}{$TestType}++;
} elsif ( my ($Device,$AttribType,$Code,$Name) = ($ThisLine =~ /^Device: ([^,]+), Failed SMART ([A-Za-z]+) Attribute: ([0-9]+) ([A-Za-z_]+)/)) {
$Failed{$Device}{"$AttribType attribute: $Name ($Code)"}++;
} elsif ( my ($Device, $Text) = ($ThisLine =~ /^Device: ([^,]+), failed (.*)$/) ) {
$Failed{$Device}{"$Text"}++;
} elsif ( ( $ThisLine =~ /warning/i ) ) {
$Warnings{$ThisLine}++;
} elsif ( my ($Device, $Text) = ( $ThisLine =~ /^Device: ([^,]+), (can't monitor.*)$/i ) ) {
$CantMonitor{$Device}{$Text}++;
} elsif ( ($ThisLine =~ /smartd startup failed/ ) ) {
$StartupFailed++;
} elsif ( ($ThisLine =~ /smartd shutdown failed/ ) ) {
$ShutdownFailed++;
} elsif ( my ($Device,$DLine) = ($ThisLine =~ /Unable to register SCSI device (.*) at line ([0-9]*) of file/) ) {
$UnableToReg{"$Device,$DLine"}++
} elsif ( ($Device) = ($ThisLine =~ /Device ([^ ]+) not available/)) {
$UnavailableDev{$Device}++;
} elsif ( my ($Device) = ($ThisLine =~ /Device (.*): SATA disks accessed via libata are supported by Linux kernel versions 2.6.15-rc1 and above/) ) {
$SataDisk{"$Device"}++;
} elsif ($ThisLine =~ /Unable to monitor any SMART enabled devices\. Try debug \(-d\) option\. Exiting/) {
$UnableToMonitor++;
} elsif ( my ($Device) = ($ThisLine =~ /Device: ([^,]+), FAILED SMART self-check/) ) {
$CheckFailed{$Device}++;
} else {
# Report any unmatched entries...
$OtherList{$ThisLine}++;
}
}
if (keys %CheckFailed) {
print "\nFAILED SMART self-check !!!";
print "\n---------------------------";
foreach my $Device (sort keys %CheckFailed) {
printf "\n %s: BACK UP DATA NOW!", $Device;
}
print "\n====================================\n";
}
if ($UnableToMonitor > 0) {
print "\nUnable to monitor any SMART enabled devices.";
print "\n Try debug (-d) option: $UnableToMonitor Time(s)\n";
}
if (keys %NotInDatabase) {
print "\n";
foreach my $Device (sort keys %NotInDatabase) {
print "$Device not in smartd database.\n";
}
}
if (keys %CantMonitor and $Detail) {
foreach my $Device (sort keys %CantMonitor) {
print "\n$Device :\n";
foreach my $Line (sort keys %{$CantMonitor{$Device}}) {
print " $Line - " . $CantMonitor{$Device}{$Line} . " Time(s)\n";
}
}
}
if (keys %ParamChanges) {
foreach my $Device (sort keys %ParamChanges) {
print "\n$Device :\n";
foreach my $Msg (sort keys %{$ParamChanges{$Device}}) {
print " $Msg changed to ";
my $count=0;
foreach (@{$ParamChanges{$Device}{$Msg}}) {
# print 12 values to each line
if ($count % 12 == 0) {
print "\n ";
}
print "$_, ";
$count++;
}
print "\n";
}
}
}
if (keys %TempChanges) {
print "Temperature Changes\n==================\n";
my (@min,@max);
foreach my $Device (sort keys %TempChanges) {
if($Detail < 10) {
my @sorttemp = sort @{$TempChanges{$Device}};
push @min, $sorttemp[0];
push @max, $sorttemp[$#sorttemp];
} elsif($Detail < 20) {
my @sorttemp = sort @{$TempChanges{$Device}};
print "$Device : $sorttemp[0] - $sorttemp[$#sorttemp]\n";
} else {
print "$Device : ";
print join ", ",@{$TempChanges{$Device}};
print "\n";
}
}
if($Detail < 10) {
my @sorttemp = sort @min;
my $mint = $sorttemp[0];
my @sorttemp = sort @max;
my $maxt = $sorttemp[$#sorttemp];
print "All devices: $mint - $maxt\n";
}
}
if (keys %TempCritLimit) {
printf "\nReached critical temperature limit:\n";
foreach (keys %TempCritLimit) {
my ($Device,$Limit)=split ",";
print "\t" . $Device . ": reached limit of " . $Limit . " Celsius: ". $TempCritLimit{"$Device,$Limit"} . " Time(s)\n";
}
}
if (keys %TempLimit) {
printf "\nReached temperature limit:\n";
foreach (keys %TempLimit) {
my ($Device,$Limit)=split ",";
print "\t" . $Device . ": reached limit of " . $Limit . " Celsius: ". $TempLimit{"$Device,$Limit"} . " Time(s)\n";
}
}
if (keys %Pendsectors){
print "\nCurrently unreadable (pending) sectors detected:\n";
foreach my $Device (sort keys %Pendsectors) {
print "\t" . $Device . " - " . $Pendsectors{$Device} . " Time(s)\n";
print "\t" . $NumPendsectors{$Device} . " unreadable sectors detected\n";
}
}
if (keys %Offsectors){
print "\nOffline uncorrectable sectors detected:\n";
foreach my $Device (sort keys %Offsectors) {
print "\t" . $Device . " - " . $Offsectors{$Device} . " Time(s)\n";
print "\t" . $NumOffsectors{$Device} . " offline uncorrectable sectors detected\n";
}
}
if (keys %Failed) {
foreach my $Device (sort keys %Failed) {
print "\n$Device :\n";
foreach my $Msg (sort keys %{$Failed{$Device}}) {
print " Failed $Msg " . $Failed{$Device}{$Msg} . " Time(s)\n";
}
}
}
if (keys %DriveTest) {
foreach my $Device (sort keys %DriveTest) {
print "\n$Device :\n";
foreach my $Type (sort keys %{$DriveTest{$Device}}) {
print " started scheduled ${Type}Test " . $DriveTest{$Device}{$Type} . " Time(s)\n";
}
}
}
if ( (keys %Warnings) ) {
print "\nWarnings:\n";
foreach my $Line (sort {$Warnings{$b} <=> $Warnings{$a}} keys %Warnings) {
print "\t" . $Line . " - ". $Warnings{$Line} . " Time(s)\n";
}
}
if ($StartupFailed) {
print "\n Smartd startup failed: " . $StartupFailed . " Time(s)\n";
}
if ($ShutdownFailed) {
print "\n Smartd shutdown failed: " . $ShutdownFailed . " Time(s)\n";
}
if ( (keys %UnableToReg) ) {
print "\n Wrong configuration for devices:\n";
foreach (sort keys %UnableToReg) {
($Device,$DLine) = split ",";
print " " . $Device . (" (line ") . $DLine . ") : ". $UnableToReg{"$Device,$DLine"} . " Time(s)\n";
}
}
if (%UnavailableDev) {
print "\nUnavailable device:\n";
foreach my $Device (sort keys %UnavailableDev) {
print " Device " . $Device . " : " . $UnavailableDev{$Device} . " Time(s)\n";
}
}
if (%SataDisk) {
print "\nSATA disk(s) supported by Linux kernel >= 2.6.15-rc1:\n";
foreach my $Device (sort keys %SataDisk) {
print " " .$Device .": Try adding '-d ata' or '-d sat' to the smartd.conf config file line\n";
}
print "\n";
}
if (keys %Monitoring and $Detail > 7) {
print "\nMonitoring:\n";
foreach my $Device (sort keys %Monitoring) {
print "\t$Device";
if (defined($DeviceInfo{$Device})) {
print ": $DeviceInfo{$Device}\n";
} else {
print "\n";
}
}
}
if ((%OtherList) and (not $IgnoreUnmatched)){
print "\n**Unmatched Entries**\n";
foreach my $line (sort keys %OtherList) {
print $line." : " .$OtherList{$line}." time(s)\n";
}
}
exit(0);
# vi: shiftwidth=3 tabstop=3 syntax=perl et
# Local Variables:
# mode: perl
# perl-indent-level: 3
# indent-tabs-mode: nil
# End: