Blame SOURCES/0020-move-MCE-handling-in-event-to-abrt-action-check-oops.patch

06486d
From d3ac6c888953d0bcd304d30dfa0f1c731987f358 Mon Sep 17 00:00:00 2001
06486d
From: Denys Vlasenko <dvlasenk@redhat.com>
06486d
Date: Mon, 6 Jan 2014 16:46:48 +0100
06486d
Subject: [ABRT PATCH 20/27] move MCE handling in event to
06486d
 abrt-action-check-oops-for-hw-error
06486d
06486d
Having a separate tool should help with internationalization
06486d
06486d
Signed-off-by: Denys Vlasenko <dvlasenk@redhat.com>
06486d
06486d
Related to rhbz#1032077
06486d
06486d
Signed-off-by: Jakub Filak <jfilak@redhat.com>
06486d
---
06486d
 configure.ac                                       |   1 +
06486d
 doc/Makefile.am                                    |   1 +
06486d
 po/POTFILES.in                                     |   1 +
06486d
 src/plugins/Makefile.am                            |   3 +
06486d
 src/plugins/abrt-action-check-oops-for-hw-error.in | 118 +++++++++++++++++++++
06486d
 src/plugins/koops_event.conf                       |  57 +---------
06486d
 8 files changed, 129 insertions(+), 55 deletions(-)
06486d
 create mode 100644 src/plugins/abrt-action-check-oops-for-hw-error.in
06486d
06486d
diff --git a/configure.ac b/configure.ac
06486d
index 3bd13bc..346faa8 100644
06486d
--- a/configure.ac
06486d
+++ b/configure.ac
06486d
@@ -279,6 +279,7 @@ AC_CONFIG_FILES([
06486d
 	src/dbus/Makefile
06486d
 	src/plugins/abrt-action-install-debuginfo
06486d
 	src/plugins/abrt-action-analyze-vmcore
06486d
+	src/plugins/abrt-action-check-oops-for-hw-error
06486d
 	src/python-problem/Makefile
06486d
 	src/python-problem/doc/Makefile
06486d
 	src/python-problem/tests/Makefile
06486d
diff --git a/doc/Makefile.am b/doc/Makefile.am
06486d
index f1abef8..e76abde 100644
06486d
--- a/doc/Makefile.am
06486d
+++ b/doc/Makefile.am
06486d
@@ -32,6 +32,7 @@ MAN1_TXT += abrt-action-save-package-data.txt
06486d
 MAN1_TXT += abrt-action-save-kernel-data.txt
06486d
 MAN1_TXT += abrt-install-ccpp-hook.txt
06486d
 MAN1_TXT += abrt-action-analyze-vmcore.txt
06486d
+MAN1_TXT += abrt-action-check-oops-for-hw-error.txt
06486d
 MAN1_TXT += abrt-action-analyze-ccpp-local.txt
06486d
 MAN1_TXT += abrt-watch-log.txt
06486d
 MAN1_TXT += abrt-upload-watch.txt
06486d
diff --git a/po/POTFILES.in b/po/POTFILES.in
06486d
index 5f883c0..6d90162 100644
06486d
--- a/po/POTFILES.in
06486d
+++ b/po/POTFILES.in
06486d
@@ -25,6 +25,7 @@ src/plugins/abrt-action-analyze-oops.c
06486d
 src/plugins/abrt-action-analyze-xorg.c
06486d
 src/plugins/abrt-action-analyze-python.c
06486d
 src/plugins/abrt-action-analyze-vmcore.in
06486d
+src/plugins/abrt-action-check-oops-for-hw-error.in
06486d
 src/plugins/abrt-action-generate-backtrace.c
06486d
 src/plugins/abrt-action-generate-core-backtrace.c
06486d
 src/plugins/abrt-action-install-debuginfo.in
06486d
diff --git a/src/plugins/Makefile.am b/src/plugins/Makefile.am
06486d
index 60246f2..dd32c7d 100644
06486d
--- a/src/plugins/Makefile.am
06486d
+++ b/src/plugins/Makefile.am
06486d
@@ -5,6 +5,7 @@ bin_SCRIPTS = \
06486d
     abrt-action-analyze-core \
06486d
     abrt-action-analyze-vulnerability \
06486d
     abrt-action-analyze-vmcore \
06486d
+    abrt-action-check-oops-for-hw-error \
06486d
     abrt-action-list-dsos \
06486d
     abrt-action-perform-ccpp-analysis \
06486d
     abrt-action-save-kernel-data \
06486d
@@ -74,6 +75,7 @@ PYTHON_FILES = \
06486d
     abrt-action-analyze-core \
06486d
     abrt-action-analyze-vulnerability \
06486d
     abrt-action-analyze-vmcore.in \
06486d
+    abrt-action-check-oops-for-hw-error.in \
06486d
     abrt-action-perform-ccpp-analysis.in \
06486d
     abrt-action-notify
06486d
 
06486d
@@ -88,6 +90,7 @@ EXTRA_DIST = \
06486d
     analyze_RetraceServer.xml.in \
06486d
     analyze_VMcore.xml.in \
06486d
     abrt-action-analyze-vmcore \
06486d
+    abrt-action-check-oops-for-hw-error \
06486d
     abrt-action-save-kernel-data \
06486d
     abrt-action-ureport \
06486d
     abrt-gdb-exploitable \
06486d
diff --git a/src/plugins/abrt-action-check-oops-for-hw-error.in b/src/plugins/abrt-action-check-oops-for-hw-error.in
06486d
new file mode 100644
06486d
index 0000000..83c0f22
06486d
--- /dev/null
06486d
+++ b/src/plugins/abrt-action-check-oops-for-hw-error.in
06486d
@@ -0,0 +1,118 @@
06486d
+#!/usr/bin/python -u
06486d
+
06486d
+import sys
06486d
+import os
06486d
+import locale
06486d
+import gettext
06486d
+
06486d
+GETTEXT_PROGNAME = "abrt"
06486d
+
06486d
+_ = gettext.lgettext
06486d
+
06486d
+def file_has_string(filename, string):
06486d
+    try:
06486d
+        f = open(filename, "r")
06486d
+    except IOError as e:
06486d
+        #print e
06486d
+        return False
06486d
+    for line in f:
06486d
+        if string in line:
06486d
+            f.close()
06486d
+            return True
06486d
+    f.close()
06486d
+    return False
06486d
+
06486d
+
06486d
+def tail_with_search(filename, string, maxlen):
06486d
+    try:
06486d
+        f = open(filename, "r")
06486d
+    except IOError as e:
06486d
+        #print e
06486d
+        return []
06486d
+    l = []
06486d
+    for line in f:
06486d
+        if string in line:
06486d
+            l.append(line)
06486d
+            if len(l) > maxlen:
06486d
+                del l[0]
06486d
+    f.close()
06486d
+    return l
06486d
+
06486d
+
06486d
+if __name__ == "__main__":
06486d
+    try:
06486d
+        locale.setlocale(locale.LC_ALL, "")
06486d
+    except locale.Error:
06486d
+        os.environ['LC_ALL'] = 'C'
06486d
+        locale.setlocale(locale.LC_ALL, "")
06486d
+
06486d
+    # Defeat "AttributeError: 'module' object has no attribute 'nl_langinfo'"
06486d
+    try:
06486d
+        gettext.bind_textdomain_codeset(GETTEXT_PROGNAME,
06486d
+                                        locale.nl_langinfo(locale.CODESET))
06486d
+    except AttributeError:
06486d
+        pass
06486d
+
06486d
+    gettext.bindtextdomain(GETTEXT_PROGNAME, '/usr/share/locale')
06486d
+    gettext.textdomain(GETTEXT_PROGNAME)
06486d
+
06486d
+    #
06486d
+    # So far we only look for Machine Check Exceptions here.
06486d
+    #
06486d
+
06486d
+    # See if MCEs were seen
06486d
+    if not file_has_string("dmesg", "Machine check events logged"):
06486d
+        sys.exit(0)
06486d
+    #
06486d
+    # There was an MCE. IOW: it's not a bug, it's a HW error.
06486d
+    f = open("not-reportable", "w")
06486d
+    f.write("The kernel log indicates that hardware errors were detected.\n");
06486d
+    f.write("This is most likely not a software problem.\n");
06486d
+    f.close()
06486d
+
06486d
+    #
06486d
+    # Did mcelog log it to /var/log/mcelog
06486d
+    # (RHEL6 by default does this)?
06486d
+    if os.path.exists("/var/log/mcelog"):
06486d
+        f = open("comment", "w")
06486d
+        f.write("The kernel log indicates that hardware errors were detected.\n")
06486d
+        f.write("/var/log/mcelog file may have more information.\n")
06486d
+        f.write("The last 20 lines of /var/log/mcelog are:\n")
06486d
+        f.write("=========================================\n")
06486d
+        #tail -n20 /var/log/mcelog 2>&1
06486d
+        l = tail_with_search("/var/log/mcelog", "", 20)
06486d
+        for line in l:
06486d
+            f.write(line)
06486d
+        f.close()
06486d
+        sys.exit(0)
06486d
+    #
06486d
+    # On RHEL7, mcelog is run so that its output ends up in syslog.
06486d
+    # Do we see that?
06486d
+    if file_has_string("/var/log/messages", "mcelog: Hardware event"):
06486d
+        f = open("comment", "w")
06486d
+        f.write("The kernel log indicates that hardware errors were detected.\n")
06486d
+        f.write("System log may have more information.\n")
06486d
+        f.write("The last 20 mcelog lines of system log are:\n")
06486d
+        f.write("==========================================\n")
06486d
+        #grep -Fi 'mcelog:' /var/log/messages | tail -n20 2>&1
06486d
+        l = tail_with_search("/var/log/messages", "mcelog:", 20)
06486d
+        for line in l:
06486d
+            f.write(line)
06486d
+        f.close()
06486d
+        sys.exit(0)
06486d
+    #
06486d
+    # Apparently, there is no running mcelog daemon!
06486d
+    # Let the user know that one is needed.
06486d
+    f = open("comment", "w")
06486d
+    f.write("The kernel log indicates that hardware errors were detected.\n")
06486d
+    f.write("The data was saved by kernel for processing by the mcelog tool.\n")
06486d
+    f.write("However, neither /var/log/mcelog nor system log contain mcelog messages.\n")
06486d
+    f.write("Most likely reason is that mcelog is not installed or not configured\n")
06486d
+    f.write("to be started during boot.\n")
06486d
+    f.write("Without this tool running, the binary data saved by kernel\n")
06486d
+    f.write("is of limited usefulness.\n")
06486d
+    f.write("(You can save this data anyway by running 'cat </dev/mcelog >FILE').\n")
06486d
+    f.write("The recommended course of action is to install mcelog.\n")
06486d
+    f.write("If another hardware error would occur, a user-readable description\n")
06486d
+    f.write("of it will be saved in system log or /var/log/mcelog.\n")
06486d
+    f.close()
06486d
diff --git a/src/plugins/koops_event.conf b/src/plugins/koops_event.conf
06486d
index 7dfbe36..3740f65 100644
06486d
--- a/src/plugins/koops_event.conf
06486d
+++ b/src/plugins/koops_event.conf
06486d
@@ -3,61 +3,8 @@ EVENT=post-create analyzer=Kerneloops
06486d
         # >> instead of > is due to bugzilla.redhat.com/show_bug.cgi?id=854266
06486d
         abrt-action-analyze-oops &&
06486d
         dmesg >>dmesg &&
06486d
-        abrt-action-save-kernel-data
06486d
-        abrt-action-save-kernel-data || exit $?
06486d
-        #
06486d
-        # If it exists, we can save a copy of MCE log here:
06486d
-        #test -f /var/log/mcelog && cp /var/log/mcelog .
06486d
-        # but in current config, sosreport already does that.
06486d
-        #
06486d
-        # See if MCEs were seen but mcelog isn't installed or running
06486d
-        grep -qFi 'Machine check events logged' dmesg || exit 0
06486d
-        #
06486d
-        # There was an MCE. IOW: it's not a bug, it's a HW error.
06486d
-        # Did mcelog logged it to /var/log/mcelog
06486d
-        # (RHEL6 by default does this)?
06486d
-        test -f /var/log/mcelog &&
06486d
-        {
06486d
-                # (Ab)use user comment field to inform user about it.
06486d
-                echo "The kernel log indicates that hardware errors were detected."
06486d
-                echo "/var/log/mcelog file may have more information."
06486d
-                echo "The last 20 lines of /var/log/mcelog are:"
06486d
-                echo "========================================="
06486d
-                # Redirecting sterr in case selinux makes it unreadable
06486d
-                # (annoying anyway, but at least user knows what's going on):
06486d
-                tail -n20 /var/log/mcelog 2>&1
06486d
-                exit 0
06486d
-        } >comment
06486d
-        #
06486d
-        # On RHEL7, mcelog is run so that its output ends up in syslog.
06486d
-        # Do we see that?
06486d
-        grep -qFi 'mcelog: Hardware event' /var/log/messages &&
06486d
-        {
06486d
-                echo "The kernel log indicates that hardware errors were detected."
06486d
-                echo "System log may have more information."
06486d
-                echo "The last 20 mcelog lines of system log are:"
06486d
-                echo "========================================="
06486d
-                # Redirecting sterr in case selinux makes it unreadable
06486d
-                # (annoying anyway, but at least user knows what's going on):
06486d
-                grep -Fi 'mcelog:' /var/log/messages | tail -n20 2>&1
06486d
-                exit 0
06486d
-        } >comment
06486d
-        #
06486d
-        # Apparently, there is no running mcelog daemon!
06486d
-        # Let user know that he needs one.
06486d
-        {
06486d
-        echo "The kernel log indicates that hardware errors were detected."
06486d
-        echo "The data was saved by kernel for processing by the mcelog tool."
06486d
-        echo "However, neither /var/log/mcelog nor system log contain mcelog messages."
06486d
-        echo "Most likely reason is that mcelog is not installed or not configured"
06486d
-        echo "to be started during boot."
06486d
-        echo "Without this tool running, the binary data saved by kernel"
06486d
-        echo "is of limited usefulness."
06486d
-        echo "(You can save this data anyway by running 'cat </dev/mcelog >FILE')."
06486d
-        echo "The recommended course of action is to install mcelog."
06486d
-        echo "If another hardware error would occur, a user-readable description"
06486d
-        echo "of it will be saved in system log or /var/log/mcelog."
06486d
-        } >comment
06486d
+        abrt-action-save-kernel-data &&
06486d
+        abrt-action-check-oops-for-hw-error
06486d
 
06486d
 # If you want behavior similar to one provided by kerneloops daemon
06486d
 # distributed by kerneloops.org - that is, if you want
06486d
-- 
06486d
1.8.3.1
06486d