Commit ac5fcde0, authored by Naoya Horiguchi, committed by Andrew Morton

mm, hwpoison: make unpoison aware of raw error info in hwpoisoned hugepage

The raw error info list needs to be removed when a hwpoisoned hugetlb page
is unpoisoned, and the unpoison handler needs to know how many errors there
are in the target hugepage.  So add both.

Hugepages with HPageVmemmapOptimized(hpage) or HPageRawHwpUnreliable(hpage)
set sometimes can't be unpoisoned, so skip them.

Link: https://lkml.kernel.org/r/20220714042420.1847125-5-naoya.horiguchi@linux.dev
Signed-off-by: Naoya Horiguchi <naoya.horiguchi@nec.com>
Reported-by: kernel test robot <lkp@intel.com>
Reviewed-by: Miaohe Lin <linmiaohe@huawei.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Liu Shixin <liushixin2@huawei.com>
Cc: Mike Kravetz <mike.kravetz@oracle.com>
Cc: Muchun Song <songmuchun@bytedance.com>
Cc: Oscar Salvador <osalvador@suse.de>
Cc: Yang Shi <shy828301@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
parent 161df60e
...@@ -490,6 +490,11 @@ static inline void num_poisoned_pages_dec(void) ...@@ -490,6 +490,11 @@ static inline void num_poisoned_pages_dec(void)
atomic_long_dec(&num_poisoned_pages); atomic_long_dec(&num_poisoned_pages);
} }
/*
* Subtract @i from the num_poisoned_pages counter in one atomic operation,
* for callers that need to drop the counter by more than one at a time.
*/
static inline void num_poisoned_pages_sub(long i)
{
atomic_long_sub(i, &num_poisoned_pages);
}
#else #else
static inline swp_entry_t make_hwpoison_entry(struct page *page) static inline swp_entry_t make_hwpoison_entry(struct page *page)
...@@ -505,6 +510,10 @@ static inline int is_hwpoison_entry(swp_entry_t swp) ...@@ -505,6 +510,10 @@ static inline int is_hwpoison_entry(swp_entry_t swp)
static inline void num_poisoned_pages_inc(void) static inline void num_poisoned_pages_inc(void)
{ {
} }
/*
* Empty variant of num_poisoned_pages_sub(): accepts @i and does nothing.
* NOTE(review): it sits next to the other empty helpers just before #endif,
* presumably for builds where poisoned-page accounting is compiled out;
* confirm against the enclosing #if, which is not visible here.
*/
static inline void num_poisoned_pages_sub(long i)
{
}
#endif #endif
static inline int non_swap_entry(swp_entry_t entry) static inline int non_swap_entry(swp_entry_t entry)
......
...@@ -1678,19 +1678,23 @@ static inline struct llist_head *raw_hwp_list_head(struct page *hpage) ...@@ -1678,19 +1678,23 @@ static inline struct llist_head *raw_hwp_list_head(struct page *hpage)
return (struct llist_head *)&page_private(hpage + SUBPAGE_INDEX_HWPOISON); return (struct llist_head *)&page_private(hpage + SUBPAGE_INDEX_HWPOISON);
} }
static void __free_raw_hwp_pages(struct page *hpage) static unsigned long __free_raw_hwp_pages(struct page *hpage, bool move_flag)
{ {
struct llist_head *head; struct llist_head *head;
struct llist_node *t, *tnode; struct llist_node *t, *tnode;
unsigned long count = 0;
head = raw_hwp_list_head(hpage); head = raw_hwp_list_head(hpage);
llist_for_each_safe(tnode, t, head->first) { llist_for_each_safe(tnode, t, head->first) {
struct raw_hwp_page *p = container_of(tnode, struct raw_hwp_page, node); struct raw_hwp_page *p = container_of(tnode, struct raw_hwp_page, node);
if (move_flag)
SetPageHWPoison(p->page); SetPageHWPoison(p->page);
kfree(p); kfree(p);
count++;
} }
llist_del_all(head); llist_del_all(head);
return count;
} }
static int hugetlb_set_page_hwpoison(struct page *hpage, struct page *page) static int hugetlb_set_page_hwpoison(struct page *hpage, struct page *page)
...@@ -1733,17 +1737,36 @@ static int hugetlb_set_page_hwpoison(struct page *hpage, struct page *page) ...@@ -1733,17 +1737,36 @@ static int hugetlb_set_page_hwpoison(struct page *hpage, struct page *page)
* Once HPageRawHwpUnreliable is set, raw_hwp_page is not * Once HPageRawHwpUnreliable is set, raw_hwp_page is not
* used any more, so free it. * used any more, so free it.
*/ */
__free_raw_hwp_pages(hpage); __free_raw_hwp_pages(hpage, false);
} }
return ret; return ret;
} }
/*
* Guarded wrapper around __free_raw_hwp_pages().
*
* @hpage:     hugepage whose raw error info list is to be released.
* @move_flag: passed through to __free_raw_hwp_pages(); the
*             HPageVmemmapOptimized check below applies only when it is true.
*
* Returns the value of __free_raw_hwp_pages(), or 0 when one of the checks
* below refuses the hugepage.  unpoison_memory() treats a return of 0 for a
* hugepage as "cannot unpoison" and fails with -EBUSY.
*/
static unsigned long free_raw_hwp_pages(struct page *hpage, bool move_flag)
{
/*
* HPageVmemmapOptimized hugepages can't be freed because struct
* pages for tail pages are required but they don't exist.
*/
if (move_flag && HPageVmemmapOptimized(hpage))
return 0;
/*
* HPageRawHwpUnreliable hugepages shouldn't be unpoisoned by
* definition.
*/
if (HPageRawHwpUnreliable(hpage))
return 0;
/* Both checks passed: release the list and report the result. */
return __free_raw_hwp_pages(hpage, move_flag);
}
void hugetlb_clear_page_hwpoison(struct page *hpage) void hugetlb_clear_page_hwpoison(struct page *hpage)
{ {
if (HPageRawHwpUnreliable(hpage)) if (HPageRawHwpUnreliable(hpage))
return; return;
ClearPageHWPoison(hpage); ClearPageHWPoison(hpage);
__free_raw_hwp_pages(hpage); free_raw_hwp_pages(hpage, true);
} }
/* /*
...@@ -1887,6 +1910,10 @@ static inline int try_memory_failure_hugetlb(unsigned long pfn, int flags, int * ...@@ -1887,6 +1910,10 @@ static inline int try_memory_failure_hugetlb(unsigned long pfn, int flags, int *
return 0; return 0;
} }
/*
* Fallback free_raw_hwp_pages(): ignores its arguments and always returns 0.
* NOTE(review): it is placed directly before "#endif /* CONFIG_HUGETLB_PAGE" +
* so it is presumably the variant used when CONFIG_HUGETLB_PAGE is not set;
* confirm against the matching #else, which is not visible here.
*/
static inline unsigned long free_raw_hwp_pages(struct page *hpage, bool flag)
{
return 0;
}
#endif /* CONFIG_HUGETLB_PAGE */ #endif /* CONFIG_HUGETLB_PAGE */
static int memory_failure_dev_pagemap(unsigned long pfn, int flags, static int memory_failure_dev_pagemap(unsigned long pfn, int flags,
...@@ -2292,6 +2319,7 @@ int unpoison_memory(unsigned long pfn) ...@@ -2292,6 +2319,7 @@ int unpoison_memory(unsigned long pfn)
struct page *p; struct page *p;
int ret = -EBUSY; int ret = -EBUSY;
int freeit = 0; int freeit = 0;
unsigned long count = 1;
static DEFINE_RATELIMIT_STATE(unpoison_rs, DEFAULT_RATELIMIT_INTERVAL, static DEFINE_RATELIMIT_STATE(unpoison_rs, DEFAULT_RATELIMIT_INTERVAL,
DEFAULT_RATELIMIT_BURST); DEFAULT_RATELIMIT_BURST);
...@@ -2339,6 +2367,13 @@ int unpoison_memory(unsigned long pfn) ...@@ -2339,6 +2367,13 @@ int unpoison_memory(unsigned long pfn)
ret = get_hwpoison_page(p, MF_UNPOISON); ret = get_hwpoison_page(p, MF_UNPOISON);
if (!ret) { if (!ret) {
if (PageHuge(p)) {
count = free_raw_hwp_pages(page, false);
if (count == 0) {
ret = -EBUSY;
goto unlock_mutex;
}
}
ret = TestClearPageHWPoison(page) ? 0 : -EBUSY; ret = TestClearPageHWPoison(page) ? 0 : -EBUSY;
} else if (ret < 0) { } else if (ret < 0) {
if (ret == -EHWPOISON) { if (ret == -EHWPOISON) {
...@@ -2347,6 +2382,13 @@ int unpoison_memory(unsigned long pfn) ...@@ -2347,6 +2382,13 @@ int unpoison_memory(unsigned long pfn)
unpoison_pr_info("Unpoison: failed to grab page %#lx\n", unpoison_pr_info("Unpoison: failed to grab page %#lx\n",
pfn, &unpoison_rs); pfn, &unpoison_rs);
} else { } else {
if (PageHuge(p)) {
count = free_raw_hwp_pages(page, false);
if (count == 0) {
ret = -EBUSY;
goto unlock_mutex;
}
}
freeit = !!TestClearPageHWPoison(p); freeit = !!TestClearPageHWPoison(p);
put_page(page); put_page(page);
...@@ -2359,7 +2401,7 @@ int unpoison_memory(unsigned long pfn) ...@@ -2359,7 +2401,7 @@ int unpoison_memory(unsigned long pfn)
unlock_mutex: unlock_mutex:
mutex_unlock(&mf_mutex); mutex_unlock(&mf_mutex);
if (!ret || freeit) { if (!ret || freeit) {
num_poisoned_pages_dec(); num_poisoned_pages_sub(count);
unpoison_pr_info("Unpoison: Software-unpoisoned page %#lx\n", unpoison_pr_info("Unpoison: Software-unpoisoned page %#lx\n",
page_to_pfn(p), &unpoison_rs); page_to_pfn(p), &unpoison_rs);
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment