Commit e4dcad20 authored by Joel Fernandes (Google)'s avatar Joel Fernandes (Google) Committed by Linus Torvalds

rss_stat: add support to detect RSS updates of external mm

When a process updates the RSS of a different process, the rss_stat
tracepoint appears in the context of the process doing the update.  This
can confuse userspace that the RSS of process doing the update is
updated, while in reality a different process's RSS was updated.

This issue happens in reclaim paths such as with direct reclaim or
background reclaim.

This patch adds more information to the tracepoint about whether the mm
being updated belongs to the current process's context (curr field).  We
also include a hash of the mm pointer so that the process who the mm
belongs to can be uniquely identified (mm_id field).

Also vsprintf.c is refactored a bit to allow reuse of hashing code.

[akpm@linux-foundation.org: remove unused local `str']
[joelaf@google.com: inline call to ptr_to_hashval]
  Link: http://lore.kernel.org/r/20191113153816.14b95acd@gandalf.local.home
  Link: http://lkml.kernel.org/r/20191114164622.GC233237@google.com
Link: http://lkml.kernel.org/r/20191106024452.81923-1-joel@joelfernandes.orgSigned-off-by: default avatarJoel Fernandes (Google) <joel@joelfernandes.org>
Reported-by: default avatarIoannis Ilkos <ilkos@google.com>
Acked-by: Petr Mladek <pmladek@suse.com>	[lib/vsprintf.c]
Cc: Tim Murray <timmurray@google.com>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Carmen Jackson <carmenjackson@google.com>
Cc: Mayank Gupta <mayankgupta@google.com>
Cc: Daniel Colascione <dancol@google.com>
Cc: Steven Rostedt (VMware) <rostedt@goodmis.org>
Cc: Minchan Kim <minchan@kernel.org>
Cc: "Aneesh Kumar K.V" <aneesh.kumar@linux.ibm.com>
Cc: Dan Williams <dan.j.williams@intel.com>
Cc: Jerome Glisse <jglisse@redhat.com>
Cc: Matthew Wilcox <willy@infradead.org>
Cc: Ralph Campbell <rcampbell@nvidia.com>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: default avatarAndrew Morton <akpm@linux-foundation.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@linux-foundation.org>
parent b3d1411b
...@@ -1643,27 +1643,27 @@ static inline unsigned long get_mm_counter(struct mm_struct *mm, int member) ...@@ -1643,27 +1643,27 @@ static inline unsigned long get_mm_counter(struct mm_struct *mm, int member)
return (unsigned long)val; return (unsigned long)val;
} }
void mm_trace_rss_stat(int member, long count); void mm_trace_rss_stat(struct mm_struct *mm, int member, long count);
static inline void add_mm_counter(struct mm_struct *mm, int member, long value) static inline void add_mm_counter(struct mm_struct *mm, int member, long value)
{ {
long count = atomic_long_add_return(value, &mm->rss_stat.count[member]); long count = atomic_long_add_return(value, &mm->rss_stat.count[member]);
mm_trace_rss_stat(member, count); mm_trace_rss_stat(mm, member, count);
} }
static inline void inc_mm_counter(struct mm_struct *mm, int member) static inline void inc_mm_counter(struct mm_struct *mm, int member)
{ {
long count = atomic_long_inc_return(&mm->rss_stat.count[member]); long count = atomic_long_inc_return(&mm->rss_stat.count[member]);
mm_trace_rss_stat(member, count); mm_trace_rss_stat(mm, member, count);
} }
static inline void dec_mm_counter(struct mm_struct *mm, int member) static inline void dec_mm_counter(struct mm_struct *mm, int member)
{ {
long count = atomic_long_dec_return(&mm->rss_stat.count[member]); long count = atomic_long_dec_return(&mm->rss_stat.count[member]);
mm_trace_rss_stat(member, count); mm_trace_rss_stat(mm, member, count);
} }
/* Optimized variant when page is already known not to be PageAnon */ /* Optimized variant when page is already known not to be PageAnon */
......
...@@ -216,6 +216,8 @@ int bprintf(u32 *bin_buf, size_t size, const char *fmt, ...) __printf(3, 4); ...@@ -216,6 +216,8 @@ int bprintf(u32 *bin_buf, size_t size, const char *fmt, ...) __printf(3, 4);
extern ssize_t memory_read_from_buffer(void *to, size_t count, loff_t *ppos, extern ssize_t memory_read_from_buffer(void *to, size_t count, loff_t *ppos,
const void *from, size_t available); const void *from, size_t available);
int ptr_to_hashval(const void *ptr, unsigned long *hashval_out);
/** /**
* strstarts - does @str start with @prefix? * strstarts - does @str start with @prefix?
* @str: string to examine * @str: string to examine
......
...@@ -316,24 +316,50 @@ TRACE_EVENT(mm_page_alloc_extfrag, ...@@ -316,24 +316,50 @@ TRACE_EVENT(mm_page_alloc_extfrag,
__entry->change_ownership) __entry->change_ownership)
); );
/*
* Required for uniquely and securely identifying mm in rss_stat tracepoint.
*/
#ifndef __PTR_TO_HASHVAL
static unsigned int __maybe_unused mm_ptr_to_hash(const void *ptr)
{
int ret;
unsigned long hashval;
ret = ptr_to_hashval(ptr, &hashval);
if (ret)
return 0;
/* The hashed value is only 32-bit */
return (unsigned int)hashval;
}
#define __PTR_TO_HASHVAL
#endif
TRACE_EVENT(rss_stat, TRACE_EVENT(rss_stat,
TP_PROTO(int member, TP_PROTO(struct mm_struct *mm,
int member,
long count), long count),
TP_ARGS(member, count), TP_ARGS(mm, member, count),
TP_STRUCT__entry( TP_STRUCT__entry(
__field(unsigned int, mm_id)
__field(unsigned int, curr)
__field(int, member) __field(int, member)
__field(long, size) __field(long, size)
), ),
TP_fast_assign( TP_fast_assign(
__entry->mm_id = mm_ptr_to_hash(mm);
__entry->curr = !!(current->mm == mm);
__entry->member = member; __entry->member = member;
__entry->size = (count << PAGE_SHIFT); __entry->size = (count << PAGE_SHIFT);
), ),
TP_printk("member=%d size=%ldB", TP_printk("mm_id=%u curr=%d member=%d size=%ldB",
__entry->mm_id,
__entry->curr,
__entry->member, __entry->member,
__entry->size) __entry->size)
); );
......
...@@ -761,11 +761,38 @@ static int __init initialize_ptr_random(void) ...@@ -761,11 +761,38 @@ static int __init initialize_ptr_random(void)
early_initcall(initialize_ptr_random); early_initcall(initialize_ptr_random);
/* Maps a pointer to a 32 bit unique identifier. */ /* Maps a pointer to a 32 bit unique identifier. */
static inline int __ptr_to_hashval(const void *ptr, unsigned long *hashval_out)
{
unsigned long hashval;
if (static_branch_unlikely(&not_filled_random_ptr_key))
return -EAGAIN;
#ifdef CONFIG_64BIT
hashval = (unsigned long)siphash_1u64((u64)ptr, &ptr_key);
/*
* Mask off the first 32 bits, this makes explicit that we have
* modified the address (and 32 bits is plenty for a unique ID).
*/
hashval = hashval & 0xffffffff;
#else
hashval = (unsigned long)siphash_1u32((u32)ptr, &ptr_key);
#endif
*hashval_out = hashval;
return 0;
}
int ptr_to_hashval(const void *ptr, unsigned long *hashval_out)
{
return __ptr_to_hashval(ptr, hashval_out);
}
static char *ptr_to_id(char *buf, char *end, const void *ptr, static char *ptr_to_id(char *buf, char *end, const void *ptr,
struct printf_spec spec) struct printf_spec spec)
{ {
const char *str = sizeof(ptr) == 8 ? "(____ptrval____)" : "(ptrval)"; const char *str = sizeof(ptr) == 8 ? "(____ptrval____)" : "(ptrval)";
unsigned long hashval; unsigned long hashval;
int ret;
/* When debugging early boot use non-cryptographically secure hash. */ /* When debugging early boot use non-cryptographically secure hash. */
if (unlikely(debug_boot_weak_hash)) { if (unlikely(debug_boot_weak_hash)) {
...@@ -773,22 +800,13 @@ static char *ptr_to_id(char *buf, char *end, const void *ptr, ...@@ -773,22 +800,13 @@ static char *ptr_to_id(char *buf, char *end, const void *ptr,
return pointer_string(buf, end, (const void *)hashval, spec); return pointer_string(buf, end, (const void *)hashval, spec);
} }
if (static_branch_unlikely(&not_filled_random_ptr_key)) { ret = __ptr_to_hashval(ptr, &hashval);
if (ret) {
spec.field_width = 2 * sizeof(ptr); spec.field_width = 2 * sizeof(ptr);
/* string length must be less than default_width */ /* string length must be less than default_width */
return error_string(buf, end, str, spec); return error_string(buf, end, str, spec);
} }
#ifdef CONFIG_64BIT
hashval = (unsigned long)siphash_1u64((u64)ptr, &ptr_key);
/*
* Mask off the first 32 bits, this makes explicit that we have
* modified the address (and 32 bits is plenty for a unique ID).
*/
hashval = hashval & 0xffffffff;
#else
hashval = (unsigned long)siphash_1u32((u32)ptr, &ptr_key);
#endif
return pointer_string(buf, end, (const void *)hashval, spec); return pointer_string(buf, end, (const void *)hashval, spec);
} }
......
...@@ -154,9 +154,9 @@ static int __init init_zero_pfn(void) ...@@ -154,9 +154,9 @@ static int __init init_zero_pfn(void)
} }
core_initcall(init_zero_pfn); core_initcall(init_zero_pfn);
void mm_trace_rss_stat(int member, long count) void mm_trace_rss_stat(struct mm_struct *mm, int member, long count)
{ {
trace_rss_stat(member, count); trace_rss_stat(mm, member, count);
} }
#if defined(SPLIT_RSS_COUNTING) #if defined(SPLIT_RSS_COUNTING)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment