mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-28 11:18:45 +07:00
0dc9c639e6
The NFIT MCE handler callback (for handling media errors on NVDIMMs)
takes a mutex to add the location of a memory error to a list. But since
the notifier call chain for machine checks (x86_mce_decoder_chain) is
atomic, we get a lockdep splat like:
BUG: sleeping function called from invalid context at kernel/locking/mutex.c:620
in_atomic(): 1, irqs_disabled(): 0, pid: 4, name: kworker/0:0
[..]
Call Trace:
dump_stack
___might_sleep
__might_sleep
mutex_lock_nested
? __lock_acquire
nfit_handle_mce
notifier_call_chain
atomic_notifier_call_chain
? atomic_notifier_call_chain
mce_gen_pool_process
Convert the notifier to a blocking one which gets to run only in process
context.
Boris: remove the notifier call in atomic context in print_mce(). For
now, let's print the MCE on the atomic path so that we can make sure
they go out and get logged at least.
Fixes: 6839a6d96f ("nfit: do an ARS scrub on hitting a latent media error")
Reported-by: Ross Zwisler <ross.zwisler@linux.intel.com>
Signed-off-by: Vishal Verma <vishal.l.verma@intel.com>
Acked-by: Tony Luck <tony.luck@intel.com>
Cc: Dan Williams <dan.j.williams@intel.com>
Cc: linux-edac <linux-edac@vger.kernel.org>
Cc: x86-ml <x86@kernel.org>
Cc: <stable@vger.kernel.org>
Link: http://lkml.kernel.org/r/20170411224457.24777-1-vishal.l.verma@intel.com
Signed-off-by: Borislav Petkov <bp@suse.de>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
146 lines
3.3 KiB
C
146 lines
3.3 KiB
C
/*
|
|
* MCE event pool management in MCE context
|
|
*
|
|
* Copyright (C) 2015 Intel Corp.
|
|
* Author: Chen, Gong <gong.chen@linux.intel.com>
|
|
*
|
|
* This file is licensed under GPLv2.
|
|
*/
|
|
#include <linux/smp.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/genalloc.h>
|
|
#include <linux/llist.h>
|
|
#include "mce-internal.h"
|
|
|
|
/*
|
|
* printk() is not safe in MCE context. This is a lock-less memory allocator
|
|
* used to save error information organized in a lock-less list.
|
|
*
|
|
* This memory pool is only to be used to save MCE records in MCE context.
|
|
* MCE events are rare, so a fixed size memory pool should be enough. Use
|
|
* 2 pages to save MCE events for now (~80 MCE records at most).
|
|
*/
|
|
#define MCE_POOLSZ (2 * PAGE_SIZE)
|
|
|
|
static struct gen_pool *mce_evt_pool;
|
|
static LLIST_HEAD(mce_event_llist);
|
|
static char gen_pool_buf[MCE_POOLSZ];
|
|
|
|
/*
|
|
* Compare the record "t" with each of the records on list "l" to see if
|
|
* an equivalent one is present in the list.
|
|
*/
|
|
static bool is_duplicate_mce_record(struct mce_evt_llist *t, struct mce_evt_llist *l)
|
|
{
|
|
struct mce_evt_llist *node;
|
|
struct mce *m1, *m2;
|
|
|
|
m1 = &t->mce;
|
|
|
|
llist_for_each_entry(node, &l->llnode, llnode) {
|
|
m2 = &node->mce;
|
|
|
|
if (!mce_cmp(m1, m2))
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* The system has panicked - we'd like to peruse the list of MCE records
|
|
* that have been queued, but not seen by anyone yet. The list is in
|
|
* reverse time order, so we need to reverse it. While doing that we can
|
|
* also drop duplicate records (these were logged because some banks are
|
|
* shared between cores or by all threads on a socket).
|
|
*/
|
|
struct llist_node *mce_gen_pool_prepare_records(void)
|
|
{
|
|
struct llist_node *head;
|
|
LLIST_HEAD(new_head);
|
|
struct mce_evt_llist *node, *t;
|
|
|
|
head = llist_del_all(&mce_event_llist);
|
|
if (!head)
|
|
return NULL;
|
|
|
|
/* squeeze out duplicates while reversing order */
|
|
llist_for_each_entry_safe(node, t, head, llnode) {
|
|
if (!is_duplicate_mce_record(node, t))
|
|
llist_add(&node->llnode, &new_head);
|
|
}
|
|
|
|
return new_head.first;
|
|
}
|
|
|
|
void mce_gen_pool_process(struct work_struct *__unused)
|
|
{
|
|
struct llist_node *head;
|
|
struct mce_evt_llist *node, *tmp;
|
|
struct mce *mce;
|
|
|
|
head = llist_del_all(&mce_event_llist);
|
|
if (!head)
|
|
return;
|
|
|
|
head = llist_reverse_order(head);
|
|
llist_for_each_entry_safe(node, tmp, head, llnode) {
|
|
mce = &node->mce;
|
|
blocking_notifier_call_chain(&x86_mce_decoder_chain, 0, mce);
|
|
gen_pool_free(mce_evt_pool, (unsigned long)node, sizeof(*node));
|
|
}
|
|
}
|
|
|
|
bool mce_gen_pool_empty(void)
|
|
{
|
|
return llist_empty(&mce_event_llist);
|
|
}
|
|
|
|
int mce_gen_pool_add(struct mce *mce)
|
|
{
|
|
struct mce_evt_llist *node;
|
|
|
|
if (!mce_evt_pool)
|
|
return -EINVAL;
|
|
|
|
node = (void *)gen_pool_alloc(mce_evt_pool, sizeof(*node));
|
|
if (!node) {
|
|
pr_warn_ratelimited("MCE records pool full!\n");
|
|
return -ENOMEM;
|
|
}
|
|
|
|
memcpy(&node->mce, mce, sizeof(*mce));
|
|
llist_add(&node->llnode, &mce_event_llist);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int mce_gen_pool_create(void)
|
|
{
|
|
struct gen_pool *tmpp;
|
|
int ret = -ENOMEM;
|
|
|
|
tmpp = gen_pool_create(ilog2(sizeof(struct mce_evt_llist)), -1);
|
|
if (!tmpp)
|
|
goto out;
|
|
|
|
ret = gen_pool_add(tmpp, (unsigned long)gen_pool_buf, MCE_POOLSZ, -1);
|
|
if (ret) {
|
|
gen_pool_destroy(tmpp);
|
|
goto out;
|
|
}
|
|
|
|
mce_evt_pool = tmpp;
|
|
|
|
out:
|
|
return ret;
|
|
}
|
|
|
|
int mce_gen_pool_init(void)
|
|
{
|
|
/* Just init mce_gen_pool once. */
|
|
if (mce_evt_pool)
|
|
return 0;
|
|
|
|
return mce_gen_pool_create();
|
|
}
|