Commit 1b5c65b6, authored by Barry Song, committed by Andrew Morton

mm/page_owner: record and dump free_pid and free_tgid

While investigating some complex memory allocation and free bugs,
especially in multi-process and multi-thread cases, from time to time
I feel the free stack isn't sufficient, as a page can be freed by processes
or threads other than the one that allocated it.  And the other processes
and threads which free the page often have exactly the same free stack as
the one that allocated the page.  We can't know who freed the page from
the free stack alone, though the current page_owner does tell us the pid
and tgid of the one that allocated the page.  This often makes bug
investigation hard.

So this patch adds the free pid and tgid to page_owner, so that we can
easily figure out whether the freeing crosses processes or threads.

Link: https://lkml.kernel.org/r/20231114034202.73098-1-v-songbaohua@oppo.com
Signed-off-by: Barry Song <v-songbaohua@oppo.com>
Cc: Audra Mitchell <audra@redhat.com>
Cc: Hyeonggon Yoo <42.hyeyoo@gmail.com>
Cc: Joonsoo Kim <iamjoonsoo.kim@lge.com>
Cc: Kassey Li <quic_yingangl@quicinc.com>
Cc: Kemeng Shi <shikemeng@huaweicloud.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
parent 20954c12
...@@ -32,6 +32,8 @@ struct page_owner { ...@@ -32,6 +32,8 @@ struct page_owner {
char comm[TASK_COMM_LEN]; char comm[TASK_COMM_LEN];
pid_t pid; pid_t pid;
pid_t tgid; pid_t tgid;
pid_t free_pid;
pid_t free_tgid;
}; };
static bool page_owner_enabled __initdata; static bool page_owner_enabled __initdata;
...@@ -152,6 +154,8 @@ void __reset_page_owner(struct page *page, unsigned short order) ...@@ -152,6 +154,8 @@ void __reset_page_owner(struct page *page, unsigned short order)
page_owner = get_page_owner(page_ext); page_owner = get_page_owner(page_ext);
page_owner->free_handle = handle; page_owner->free_handle = handle;
page_owner->free_ts_nsec = free_ts_nsec; page_owner->free_ts_nsec = free_ts_nsec;
page_owner->free_pid = current->pid;
page_owner->free_tgid = current->tgid;
page_ext = page_ext_next(page_ext); page_ext = page_ext_next(page_ext);
} }
page_ext_put(page_ext); page_ext_put(page_ext);
...@@ -253,6 +257,8 @@ void __folio_copy_owner(struct folio *newfolio, struct folio *old) ...@@ -253,6 +257,8 @@ void __folio_copy_owner(struct folio *newfolio, struct folio *old)
new_page_owner->handle = old_page_owner->handle; new_page_owner->handle = old_page_owner->handle;
new_page_owner->pid = old_page_owner->pid; new_page_owner->pid = old_page_owner->pid;
new_page_owner->tgid = old_page_owner->tgid; new_page_owner->tgid = old_page_owner->tgid;
new_page_owner->free_pid = old_page_owner->free_pid;
new_page_owner->free_tgid = old_page_owner->free_tgid;
new_page_owner->ts_nsec = old_page_owner->ts_nsec; new_page_owner->ts_nsec = old_page_owner->ts_nsec;
new_page_owner->free_ts_nsec = old_page_owner->ts_nsec; new_page_owner->free_ts_nsec = old_page_owner->ts_nsec;
strcpy(new_page_owner->comm, old_page_owner->comm); strcpy(new_page_owner->comm, old_page_owner->comm);
...@@ -495,7 +501,8 @@ void __dump_page_owner(const struct page *page) ...@@ -495,7 +501,8 @@ void __dump_page_owner(const struct page *page)
if (!handle) { if (!handle) {
pr_alert("page_owner free stack trace missing\n"); pr_alert("page_owner free stack trace missing\n");
} else { } else {
pr_alert("page last free stack trace:\n"); pr_alert("page last free pid %d tgid %d stack trace:\n",
page_owner->free_pid, page_owner->free_tgid);
stack_depot_print(handle); stack_depot_print(handle);
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment