blob: e74ee1cd4b9c4746f129d42afd84fa208fa0d331 [file] [log] [blame]
/* Copyright (c) 2016 Facebook
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 */
7#include <uapi/linux/bpf.h>
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -08008#include <uapi/linux/ptrace.h>
9#include <uapi/linux/perf_event.h>
10#include <linux/version.h>
11#include <linux/sched.h>
Yonghong Song03421a92020-05-13 11:02:23 -070012#include <bpf/bpf_helpers.h>
13#include <bpf/bpf_tracing.h>
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080014
/*
 * _(P): copy the lvalue P into a temporary of the same type using
 * bpf_probe_read_kernel() and yield that temporary as the value of the
 * expression. The helper's return code is not checked.
 */
#define _(P)								\
	({								\
		typeof(P) probed_;					\
		bpf_probe_read_kernel(&probed_, sizeof(probed_), &(P));	\
		probed_;						\
	})
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080021
/* Blocked intervals shorter than this many microseconds are not recorded. */
#define MINBLOCK_US	1
23
24struct key_t {
25 char waker[TASK_COMM_LEN];
26 char target[TASK_COMM_LEN];
27 u32 wret;
28 u32 tret;
29};
30
31struct bpf_map_def SEC("maps") counts = {
32 .type = BPF_MAP_TYPE_HASH,
33 .key_size = sizeof(struct key_t),
34 .value_size = sizeof(u64),
35 .max_entries = 10000,
36};
37
38struct bpf_map_def SEC("maps") start = {
39 .type = BPF_MAP_TYPE_HASH,
40 .key_size = sizeof(u32),
41 .value_size = sizeof(u64),
42 .max_entries = 10000,
43};
44
45struct wokeby_t {
46 char name[TASK_COMM_LEN];
47 u32 ret;
48};
49
50struct bpf_map_def SEC("maps") wokeby = {
51 .type = BPF_MAP_TYPE_HASH,
52 .key_size = sizeof(u32),
53 .value_size = sizeof(struct wokeby_t),
54 .max_entries = 10000,
55};
56
57struct bpf_map_def SEC("maps") stackmap = {
58 .type = BPF_MAP_TYPE_STACK_TRACE,
59 .key_size = sizeof(u32),
60 .value_size = PERF_MAX_STACK_DEPTH * sizeof(u64),
61 .max_entries = 10000,
62};
63
/* Flags passed to every bpf_get_stackid() call in this file. */
#define STACKID_FLAGS	(BPF_F_FAST_STACK_CMP)
65
66SEC("kprobe/try_to_wake_up")
67int waker(struct pt_regs *ctx)
68{
69 struct task_struct *p = (void *) PT_REGS_PARM1(ctx);
Daniel Borkmann02413ca2016-04-13 00:10:53 +020070 struct wokeby_t woke;
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080071 u32 pid;
72
73 pid = _(p->pid);
74
75 bpf_get_current_comm(&woke.name, sizeof(woke.name));
76 woke.ret = bpf_get_stackid(ctx, &stackmap, STACKID_FLAGS);
77
78 bpf_map_update_elem(&wokeby, &pid, &woke, BPF_ANY);
79 return 0;
80}
81
Alexei Starovoitov3c9b1642016-04-06 18:43:30 -070082static inline int update_counts(void *ctx, u32 pid, u64 delta)
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080083{
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080084 struct wokeby_t *woke;
85 u64 zero = 0, *val;
Daniel Borkmann02413ca2016-04-13 00:10:53 +020086 struct key_t key;
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080087
Daniel Borkmann02413ca2016-04-13 00:10:53 +020088 __builtin_memset(&key.waker, 0, sizeof(key.waker));
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080089 bpf_get_current_comm(&key.target, sizeof(key.target));
90 key.tret = bpf_get_stackid(ctx, &stackmap, STACKID_FLAGS);
Daniel Borkmann02413ca2016-04-13 00:10:53 +020091 key.wret = 0;
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080092
93 woke = bpf_map_lookup_elem(&wokeby, &pid);
94 if (woke) {
95 key.wret = woke->ret;
Daniel Borkmann02413ca2016-04-13 00:10:53 +020096 __builtin_memcpy(&key.waker, woke->name, sizeof(key.waker));
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -080097 bpf_map_delete_elem(&wokeby, &pid);
98 }
99
100 val = bpf_map_lookup_elem(&counts, &key);
101 if (!val) {
102 bpf_map_update_elem(&counts, &key, &zero, BPF_NOEXIST);
103 val = bpf_map_lookup_elem(&counts, &key);
104 if (!val)
105 return 0;
106 }
107 (*val) += delta;
108 return 0;
109}
110
Alexei Starovoitov3c9b1642016-04-06 18:43:30 -0700111#if 1
112/* taken from /sys/kernel/debug/tracing/events/sched/sched_switch/format */
113struct sched_switch_args {
114 unsigned long long pad;
115 char prev_comm[16];
116 int prev_pid;
117 int prev_prio;
118 long long prev_state;
119 char next_comm[16];
120 int next_pid;
121 int next_prio;
122};
123SEC("tracepoint/sched/sched_switch")
124int oncpu(struct sched_switch_args *ctx)
125{
126 /* record previous thread sleep time */
127 u32 pid = ctx->prev_pid;
128#else
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -0800129SEC("kprobe/finish_task_switch")
130int oncpu(struct pt_regs *ctx)
131{
132 struct task_struct *p = (void *) PT_REGS_PARM1(ctx);
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -0800133 /* record previous thread sleep time */
Alexei Starovoitov3c9b1642016-04-06 18:43:30 -0700134 u32 pid = _(p->pid);
135#endif
136 u64 delta, ts, *tsp;
137
Alexei Starovoitova6ffe7b2016-02-17 19:58:59 -0800138 ts = bpf_ktime_get_ns();
139 bpf_map_update_elem(&start, &pid, &ts, BPF_ANY);
140
141 /* calculate current thread's delta time */
142 pid = bpf_get_current_pid_tgid();
143 tsp = bpf_map_lookup_elem(&start, &pid);
144 if (!tsp)
145 /* missed start or filtered */
146 return 0;
147
148 delta = bpf_ktime_get_ns() - *tsp;
149 bpf_map_delete_elem(&start, &pid);
150 delta = delta / 1000;
151 if (delta < MINBLOCK_US)
152 return 0;
153
154 return update_counts(ctx, pid, delta);
155}
156char _license[] SEC("license") = "GPL";
157u32 _version SEC("version") = LINUX_VERSION_CODE;