Commit 91d00547 authored by Naoya Horiguchi's avatar Naoya Horiguchi Committed by Linus Torvalds

mm/hwpoison: mf_mutex for soft offline and unpoison

Patch series "mm/hwpoison: fix unpoison_memory()", v4.

The main purpose of this series is to sync unpoison code to recent
changes around how hwpoison code takes page refcount.  Unpoison should
work or simply fail (without crash) if impossible.

The recent works of keeping hwpoison pages in shmem pagecache introduce
a new state of hwpoisoned pages, but unpoison for such pages is not
supported yet with this series.

It seems that soft-offline and unpoison can be used as general purpose
page offline/online mechanism (not in the context of memory error).  I
think that we need some additional works to realize it because currently
soft-offline and unpoison are assumed not to happen so frequently (print
out too many messages for aggressive usecases).  But anyway this could
be another interesting next topic.

v1: https://lore.kernel.org/linux-mm/20210614021212.223326-1-nao.horiguchi@gmail.com/
v2: https://lore.kernel.org/linux-mm/20211025230503.2650970-1-naoya.horiguchi@linux.dev/
v3: https://lore.kernel.org/linux-mm/20211105055058.3152564-1-naoya.horiguchi@linux.dev/

This patch (of 3):

Originally mf_mutex is introduced to serialize multiple MCE events, but
it is not that useful to allow unpoison to run in parallel with
memory_failure() and soft offline.  So apply mf_mutex to soft offline
and unpoison.  The memory failure handler and soft offline handler get
simpler with this.

Link: https://lkml.kernel.org/r/20211115084006.3728254-1-naoya.horiguchi@linux.dev
Link: https://lkml.kernel.org/r/20211115084006.3728254-2-naoya.horiguchi@linux.devSigned-off-by: default avatarNaoya Horiguchi <naoya.horiguchi@nec.com>
Reviewed-by: default avatarYang Shi <shy828301@gmail.com>
Cc: "Aneesh Kumar K.V" <aneesh.kumar@linux.vnet.ibm.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Ding Hui <dinghui@sangfor.com.cn>
Cc: Miaohe Lin <linmiaohe@huawei.com>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Oscar Salvador <osalvador@suse.de>
Cc: Peter Xu <peterx@redhat.com>
Cc: Tony Luck <tony.luck@intel.com>
Signed-off-by: default avatarAndrew Morton <akpm@linux-foundation.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@linux-foundation.org>
parent e1c63e11
...@@ -1502,14 +1502,6 @@ static int memory_failure_hugetlb(unsigned long pfn, int flags) ...@@ -1502,14 +1502,6 @@ static int memory_failure_hugetlb(unsigned long pfn, int flags)
lock_page(head); lock_page(head);
page_flags = head->flags; page_flags = head->flags;
if (!PageHWPoison(head)) {
pr_err("Memory failure: %#lx: just unpoisoned\n", pfn);
num_poisoned_pages_dec();
unlock_page(head);
put_page(head);
return 0;
}
/* /*
* TODO: hwpoison for pud-sized hugetlb doesn't work right now, so * TODO: hwpoison for pud-sized hugetlb doesn't work right now, so
* simply disable it. In order to make it work properly, we need * simply disable it. In order to make it work properly, we need
...@@ -1623,6 +1615,8 @@ static int memory_failure_dev_pagemap(unsigned long pfn, int flags, ...@@ -1623,6 +1615,8 @@ static int memory_failure_dev_pagemap(unsigned long pfn, int flags,
return rc; return rc;
} }
static DEFINE_MUTEX(mf_mutex);
/** /**
* memory_failure - Handle memory failure of a page. * memory_failure - Handle memory failure of a page.
* @pfn: Page Number of the corrupted page * @pfn: Page Number of the corrupted page
...@@ -1649,7 +1643,6 @@ int memory_failure(unsigned long pfn, int flags) ...@@ -1649,7 +1643,6 @@ int memory_failure(unsigned long pfn, int flags)
int res = 0; int res = 0;
unsigned long page_flags; unsigned long page_flags;
bool retry = true; bool retry = true;
static DEFINE_MUTEX(mf_mutex);
if (!sysctl_memory_failure_recovery) if (!sysctl_memory_failure_recovery)
panic("Memory failure on page %lx", pfn); panic("Memory failure on page %lx", pfn);
...@@ -1783,16 +1776,6 @@ int memory_failure(unsigned long pfn, int flags) ...@@ -1783,16 +1776,6 @@ int memory_failure(unsigned long pfn, int flags)
*/ */
page_flags = p->flags; page_flags = p->flags;
/*
* unpoison always clear PG_hwpoison inside page lock
*/
if (!PageHWPoison(p)) {
pr_err("Memory failure: %#lx: just unpoisoned\n", pfn);
num_poisoned_pages_dec();
unlock_page(p);
put_page(p);
goto unlock_mutex;
}
if (hwpoison_filter(p)) { if (hwpoison_filter(p)) {
if (TestClearPageHWPoison(p)) if (TestClearPageHWPoison(p))
num_poisoned_pages_dec(); num_poisoned_pages_dec();
...@@ -1973,6 +1956,7 @@ int unpoison_memory(unsigned long pfn) ...@@ -1973,6 +1956,7 @@ int unpoison_memory(unsigned long pfn)
struct page *page; struct page *page;
struct page *p; struct page *p;
int freeit = 0; int freeit = 0;
int ret = 0;
unsigned long flags = 0; unsigned long flags = 0;
static DEFINE_RATELIMIT_STATE(unpoison_rs, DEFAULT_RATELIMIT_INTERVAL, static DEFINE_RATELIMIT_STATE(unpoison_rs, DEFAULT_RATELIMIT_INTERVAL,
DEFAULT_RATELIMIT_BURST); DEFAULT_RATELIMIT_BURST);
...@@ -1983,39 +1967,30 @@ int unpoison_memory(unsigned long pfn) ...@@ -1983,39 +1967,30 @@ int unpoison_memory(unsigned long pfn)
p = pfn_to_page(pfn); p = pfn_to_page(pfn);
page = compound_head(p); page = compound_head(p);
mutex_lock(&mf_mutex);
if (!PageHWPoison(p)) { if (!PageHWPoison(p)) {
unpoison_pr_info("Unpoison: Page was already unpoisoned %#lx\n", unpoison_pr_info("Unpoison: Page was already unpoisoned %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
return 0; goto unlock_mutex;
} }
if (page_count(page) > 1) { if (page_count(page) > 1) {
unpoison_pr_info("Unpoison: Someone grabs the hwpoison page %#lx\n", unpoison_pr_info("Unpoison: Someone grabs the hwpoison page %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
return 0; goto unlock_mutex;
} }
if (page_mapped(page)) { if (page_mapped(page)) {
unpoison_pr_info("Unpoison: Someone maps the hwpoison page %#lx\n", unpoison_pr_info("Unpoison: Someone maps the hwpoison page %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
return 0; goto unlock_mutex;
} }
if (page_mapping(page)) { if (page_mapping(page)) {
unpoison_pr_info("Unpoison: the hwpoison page has non-NULL mapping %#lx\n", unpoison_pr_info("Unpoison: the hwpoison page has non-NULL mapping %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
return 0; goto unlock_mutex;
}
/*
* unpoison_memory() can encounter thp only when the thp is being
* worked by memory_failure() and the page lock is not held yet.
* In such case, we yield to memory_failure() and make unpoison fail.
*/
if (!PageHuge(page) && PageTransHuge(page)) {
unpoison_pr_info("Unpoison: Memory failure is now running on %#lx\n",
pfn, &unpoison_rs);
return 0;
} }
if (!get_hwpoison_page(p, flags)) { if (!get_hwpoison_page(p, flags)) {
...@@ -2023,29 +1998,23 @@ int unpoison_memory(unsigned long pfn) ...@@ -2023,29 +1998,23 @@ int unpoison_memory(unsigned long pfn)
num_poisoned_pages_dec(); num_poisoned_pages_dec();
unpoison_pr_info("Unpoison: Software-unpoisoned free page %#lx\n", unpoison_pr_info("Unpoison: Software-unpoisoned free page %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
return 0; goto unlock_mutex;
} }
lock_page(page);
/*
* This test is racy because PG_hwpoison is set outside of page lock.
* That's acceptable because that won't trigger kernel panic. Instead,
* the PG_hwpoison page will be caught and isolated on the entrance to
* the free buddy page pool.
*/
if (TestClearPageHWPoison(page)) { if (TestClearPageHWPoison(page)) {
unpoison_pr_info("Unpoison: Software-unpoisoned page %#lx\n", unpoison_pr_info("Unpoison: Software-unpoisoned page %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
num_poisoned_pages_dec(); num_poisoned_pages_dec();
freeit = 1; freeit = 1;
} }
unlock_page(page);
put_page(page); put_page(page);
if (freeit && !(pfn == my_zero_pfn(0) && page_count(p) == 1)) if (freeit && !(pfn == my_zero_pfn(0) && page_count(p) == 1))
put_page(page); put_page(page);
return 0; unlock_mutex:
mutex_unlock(&mf_mutex);
return ret;
} }
EXPORT_SYMBOL(unpoison_memory); EXPORT_SYMBOL(unpoison_memory);
...@@ -2226,9 +2195,12 @@ int soft_offline_page(unsigned long pfn, int flags) ...@@ -2226,9 +2195,12 @@ int soft_offline_page(unsigned long pfn, int flags)
return -EIO; return -EIO;
} }
mutex_lock(&mf_mutex);
if (PageHWPoison(page)) { if (PageHWPoison(page)) {
pr_info("%s: %#lx page already poisoned\n", __func__, pfn); pr_info("%s: %#lx page already poisoned\n", __func__, pfn);
put_ref_page(ref_page); put_ref_page(ref_page);
mutex_unlock(&mf_mutex);
return 0; return 0;
} }
...@@ -2247,5 +2219,7 @@ int soft_offline_page(unsigned long pfn, int flags) ...@@ -2247,5 +2219,7 @@ int soft_offline_page(unsigned long pfn, int flags)
} }
} }
mutex_unlock(&mf_mutex);
return ret; return ret;
} }
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment