-
Notifications
You must be signed in to change notification settings - Fork 52.3k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
mm: mmap_lock: add tracepoints around lock acquisition
The goal of these tracepoints is to be able to debug lock contention issues. This lock is acquired on most (all?) mmap / munmap / page fault operations, so a multi-threaded process which does a lot of these can experience significant contention. We trace just before we start acquisition, when the acquisition returns (whether it succeeded or not), and when the lock is released (or downgraded). The events are broken out by lock type (read / write). The events are also broken out by memcg path. For container-based workloads, users often think of several processes in a memcg as a single logical "task", so collecting statistics at this level is useful. The end goal is to get latency information. This isn't directly included in the trace events. Instead, users are expected to compute the time between "start locking" and "acquire returned", using e.g. synthetic events or BPF. The benefit we get from this is simpler code. Because we use tracepoint_enabled() to decide whether or not to trace, this patch has effectively no overhead unless tracepoints are enabled at runtime. If tracepoints are enabled, there is a performance impact, but how much depends on exactly what e.g. the BPF program does. [axelrasmussen@google.com: fix use-after-free race and css ref leak in tracepoints] Link: https://lkml.kernel.org/r/20201130233504.3725241-1-axelrasmussen@google.com [axelrasmussen@google.com: v3] Link: https://lkml.kernel.org/r/20201207213358.573750-1-axelrasmussen@google.com [rostedt@goodmis.org: in-depth examples of tracepoint_enabled() usage, and per-cpu-per-context buffer design] Link: https://lkml.kernel.org/r/20201105211739.568279-2-axelrasmussen@google.com Signed-off-by: Axel Rasmussen <axelrasmussen@google.com> Acked-by: Vlastimil Babka <vbabka@suse.cz> Cc: Steven Rostedt <rostedt@goodmis.org> Cc: Ingo Molnar <mingo@redhat.com> Cc: Michel Lespinasse <walken@google.com> Cc: Daniel Jordan <daniel.m.jordan@oracle.com> Cc: Jann Horn <jannh@google.com> Cc: Chinwen Chang <chinwen.chang@mediatek.com> Cc: Davidlohr Bueso <dbueso@suse.de> Cc: David Rientjes <rientjes@google.com> Cc: Laurent Dufour <ldufour@linux.ibm.com> Cc: Yafang Shao <laoar.shao@gmail.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
- Loading branch information
Showing
4 changed files
with
427 additions
and
6 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,107 @@ | ||
/* SPDX-License-Identifier: GPL-2.0 */ | ||
#undef TRACE_SYSTEM | ||
#define TRACE_SYSTEM mmap_lock | ||
|
||
#if !defined(_TRACE_MMAP_LOCK_H) || defined(TRACE_HEADER_MULTI_READ) | ||
#define _TRACE_MMAP_LOCK_H | ||
|
||
#include <linux/tracepoint.h> | ||
#include <linux/types.h> | ||
|
||
struct mm_struct; | ||
|
||
extern int trace_mmap_lock_reg(void); | ||
extern void trace_mmap_lock_unreg(void); | ||
|
||
TRACE_EVENT_FN(mmap_lock_start_locking, | ||
|
||
TP_PROTO(struct mm_struct *mm, const char *memcg_path, bool write), | ||
|
||
TP_ARGS(mm, memcg_path, write), | ||
|
||
TP_STRUCT__entry( | ||
__field(struct mm_struct *, mm) | ||
__string(memcg_path, memcg_path) | ||
__field(bool, write) | ||
), | ||
|
||
TP_fast_assign( | ||
__entry->mm = mm; | ||
__assign_str(memcg_path, memcg_path); | ||
__entry->write = write; | ||
), | ||
|
||
TP_printk( | ||
"mm=%p memcg_path=%s write=%s\n", | ||
__entry->mm, | ||
__get_str(memcg_path), | ||
__entry->write ? "true" : "false" | ||
), | ||
|
||
trace_mmap_lock_reg, trace_mmap_lock_unreg | ||
); | ||
|
||
TRACE_EVENT_FN(mmap_lock_acquire_returned, | ||
|
||
TP_PROTO(struct mm_struct *mm, const char *memcg_path, bool write, | ||
bool success), | ||
|
||
TP_ARGS(mm, memcg_path, write, success), | ||
|
||
TP_STRUCT__entry( | ||
__field(struct mm_struct *, mm) | ||
__string(memcg_path, memcg_path) | ||
__field(bool, write) | ||
__field(bool, success) | ||
), | ||
|
||
TP_fast_assign( | ||
__entry->mm = mm; | ||
__assign_str(memcg_path, memcg_path); | ||
__entry->write = write; | ||
__entry->success = success; | ||
), | ||
|
||
TP_printk( | ||
"mm=%p memcg_path=%s write=%s success=%s\n", | ||
__entry->mm, | ||
__get_str(memcg_path), | ||
__entry->write ? "true" : "false", | ||
__entry->success ? "true" : "false" | ||
), | ||
|
||
trace_mmap_lock_reg, trace_mmap_lock_unreg | ||
); | ||
|
||
TRACE_EVENT_FN(mmap_lock_released, | ||
|
||
TP_PROTO(struct mm_struct *mm, const char *memcg_path, bool write), | ||
|
||
TP_ARGS(mm, memcg_path, write), | ||
|
||
TP_STRUCT__entry( | ||
__field(struct mm_struct *, mm) | ||
__string(memcg_path, memcg_path) | ||
__field(bool, write) | ||
), | ||
|
||
TP_fast_assign( | ||
__entry->mm = mm; | ||
__assign_str(memcg_path, memcg_path); | ||
__entry->write = write; | ||
), | ||
|
||
TP_printk( | ||
"mm=%p memcg_path=%s write=%s\n", | ||
__entry->mm, | ||
__get_str(memcg_path), | ||
__entry->write ? "true" : "false" | ||
), | ||
|
||
trace_mmap_lock_reg, trace_mmap_lock_unreg | ||
); | ||
|
||
#endif /* _TRACE_MMAP_LOCK_H */ | ||
|
||
/* This part must be outside protection */ | ||
#include <trace/define_trace.h> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.