blob: ec96d64aec6995cbb484a77823b7e13f51a36a88 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001// SPDX-License-Identifier: GPL-2.0
Ingo Molnar0a02ad92009-09-11 12:12:54 +02002#include "builtin.h"
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02003#include "perf.h"
Arnaldo Carvalho de Melo91854f92019-08-29 14:59:50 -03004#include "perf-sys.h"
Ingo Molnar0a02ad92009-09-11 12:12:54 +02005
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02006#include "util/evlist.h"
Arnaldo Carvalho de Meloe3f42602011-11-16 17:02:54 -02007#include "util/evsel.h"
Ingo Molnar0a02ad92009-09-11 12:12:54 +02008#include "util/symbol.h"
9#include "util/thread.h"
10#include "util/header.h"
Arnaldo Carvalho de Melo94c744b2009-12-11 21:24:02 -020011#include "util/session.h"
Arnaldo Carvalho de Melo45694aa2011-11-28 08:30:20 -020012#include "util/tool.h"
Yann Droneaud57480d22014-06-30 22:28:47 +020013#include "util/cloexec.h"
Jiri Olsaa151a372016-04-12 15:29:29 +020014#include "util/thread_map.h"
Jiri Olsa8cd91192016-04-12 15:29:27 +020015#include "util/color.h"
David Ahern49394a22016-11-16 15:06:29 +090016#include "util/stat.h"
Arnaldo Carvalho de Melo6a9fa4e2019-06-25 17:31:26 -030017#include "util/string2.h"
David Ahern6c973c92016-11-16 15:06:32 +090018#include "util/callchain.h"
David Ahern853b7402016-11-29 10:15:44 -070019#include "util/time-utils.h"
Ingo Molnar0a02ad92009-09-11 12:12:54 +020020
Arnaldo Carvalho de Melofa0d9842019-08-30 12:52:25 -030021#include <subcmd/pager.h>
Josh Poimboeuf4b6ab942015-12-15 09:39:39 -060022#include <subcmd/parse-options.h>
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +020023#include "util/trace-event.h"
Ingo Molnar0a02ad92009-09-11 12:12:54 +020024
Ingo Molnar0a02ad92009-09-11 12:12:54 +020025#include "util/debug.h"
26
Arnaldo Carvalho de Melo877a7a12017-04-17 11:39:06 -030027#include <linux/kernel.h>
David Ahern49394a22016-11-16 15:06:29 +090028#include <linux/log2.h>
Arnaldo Carvalho de Melo7f7c5362019-07-04 11:32:27 -030029#include <linux/zalloc.h>
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +020030#include <sys/prctl.h>
Markus Trippelsdorf7b78f132012-04-04 10:45:27 +020031#include <sys/resource.h>
Arnaldo Carvalho de Melofd20e812017-04-17 15:23:08 -030032#include <inttypes.h>
Ingo Molnar0a02ad92009-09-11 12:12:54 +020033
Arnaldo Carvalho de Meloa43783a2017-04-18 10:46:11 -030034#include <errno.h>
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +020035#include <semaphore.h>
36#include <pthread.h>
37#include <math.h>
Yunlong Songcb06ac22015-03-31 21:46:30 +080038#include <api/fs/fs.h>
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -030039#include <linux/time64.h>
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +020040
Arnaldo Carvalho de Melo3052ba52019-06-25 17:27:31 -030041#include <linux/ctype.h>
Arnaldo Carvalho de Melo3d689ed2017-04-17 16:10:49 -030042
/* prctl() option used by the replay threads to rename themselves */
#define PR_SET_NAME	15               /* Set process name */
/* Size of the per-cpu arrays and cpu bitmaps declared in this file */
#define MAX_CPUS	4096
/* Size of task_desc::comm, terminating NUL included */
#define COMM_LEN	20
#define SYM_LEN		129
/* Fallback pid table size when kernel/pid_max cannot be read */
#define MAX_PID		1024000
Ingo Molnarec156762009-09-11 12:12:54 +020048
mingo39aeb522009-09-14 20:04:48 +020049struct sched_atom;
Ingo Molnarec156762009-09-11 12:12:54 +020050
51struct task_desc {
52 unsigned long nr;
53 unsigned long pid;
54 char comm[COMM_LEN];
55
56 unsigned long nr_events;
57 unsigned long curr_event;
mingo39aeb522009-09-14 20:04:48 +020058 struct sched_atom **atoms;
Ingo Molnarec156762009-09-11 12:12:54 +020059
60 pthread_t thread;
61 sem_t sleep_sem;
62
63 sem_t ready_for_work;
64 sem_t work_done_sem;
65
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +020066 u64 cpu_usage;
Ingo Molnarec156762009-09-11 12:12:54 +020067};
68
/* Kind of action a sched_atom stands for during replay. */
enum sched_event_type {
	SCHED_EVENT_RUN		= 0,
	SCHED_EVENT_SLEEP	= 1,
	SCHED_EVENT_WAKEUP	= 2,
	SCHED_EVENT_MIGRATION	= 3,
};
75
mingo39aeb522009-09-14 20:04:48 +020076struct sched_atom {
Ingo Molnarec156762009-09-11 12:12:54 +020077 enum sched_event_type type;
Arnaldo Carvalho de Meloeed05fe2010-04-05 12:53:45 -030078 int specific_wait;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +020079 u64 timestamp;
80 u64 duration;
Ingo Molnarec156762009-09-11 12:12:54 +020081 unsigned long nr;
Ingo Molnarec156762009-09-11 12:12:54 +020082 sem_t *wait_sem;
83 struct task_desc *wakee;
84};
85
/* One character per task state, in the bit order of the masks below */
#define TASK_STATE_TO_CHAR_STR "RSDTtZXxKWP"

/* task state bitmask, copied from include/linux/sched.h */
#define TASK_RUNNING		0x0000
#define TASK_INTERRUPTIBLE	0x0001
#define TASK_UNINTERRUPTIBLE	0x0002
#define __TASK_STOPPED		0x0004
#define __TASK_TRACED		0x0008
/* in tsk->exit_state */
#define EXIT_DEAD		0x0010
#define EXIT_ZOMBIE		0x0020
#define EXIT_TRACE		(EXIT_ZOMBIE | EXIT_DEAD)
/* in tsk->state again */
#define TASK_DEAD		0x0040
#define TASK_WAKEKILL		0x0080
#define TASK_WAKING		0x0100
#define TASK_PARKED		0x0200
103
/* State stored in work_atom::state. */
enum thread_state {
	THREAD_SLEEPING	= 0,
	THREAD_WAIT_CPU	= 1,
	THREAD_SCHED_IN	= 2,
	THREAD_IGNORE	= 3
};
110
111struct work_atom {
112 struct list_head list;
113 enum thread_state state;
Frederic Weisbeckeraa1ab9d2009-09-14 03:01:12 +0200114 u64 sched_out_time;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200115 u64 wake_up_time;
116 u64 sched_in_time;
117 u64 runtime;
118};
119
mingo39aeb522009-09-14 20:04:48 +0200120struct work_atoms {
121 struct list_head work_list;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200122 struct thread *thread;
123 struct rb_node node;
124 u64 max_lat;
Frederic Weisbecker3786310a2009-12-09 21:40:08 +0100125 u64 max_lat_at;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200126 u64 total_lat;
127 u64 nb_atoms;
128 u64 total_runtime;
Josef Bacik2f80dd42015-05-22 09:18:40 -0400129 int num_merged;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200130};
131
mingo39aeb522009-09-14 20:04:48 +0200132typedef int (*sort_fn_t)(struct work_atoms *, struct work_atoms *);
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200133
struct perf_sched;

/*
 * Set of callbacks a sub-command installs through
 * perf_sched::tp_handler.  Every callback receives the owning
 * perf_sched and returns an int.
 */
struct trace_sched_handler {
	int (*switch_event)(struct perf_sched *sched,
			    struct evsel *evsel,
			    struct perf_sample *sample,
			    struct machine *machine);

	int (*runtime_event)(struct perf_sched *sched,
			     struct evsel *evsel,
			     struct perf_sample *sample,
			     struct machine *machine);

	int (*wakeup_event)(struct perf_sched *sched,
			    struct evsel *evsel,
			    struct perf_sample *sample,
			    struct machine *machine);

	/* PERF_RECORD_FORK event, not sched_process_fork tracepoint */
	int (*fork_event)(struct perf_sched *sched,
			  union perf_event *event,
			  struct machine *machine);

	int (*migrate_task_event)(struct perf_sched *sched,
				  struct evsel *evsel,
				  struct perf_sample *sample,
				  struct machine *machine);
};
155
Jiri Olsaa151a372016-04-12 15:29:29 +0200156#define COLOR_PIDS PERF_COLOR_BLUE
Jiri Olsacf294f22016-04-12 15:29:30 +0200157#define COLOR_CPUS PERF_COLOR_BG_RED
Jiri Olsaa151a372016-04-12 15:29:29 +0200158
Jiri Olsa99623c62016-04-12 15:29:26 +0200159struct perf_sched_map {
160 DECLARE_BITMAP(comp_cpus_mask, MAX_CPUS);
161 int *comp_cpus;
162 bool comp;
Jiri Olsa9749b902019-07-21 13:23:50 +0200163 struct perf_thread_map *color_pids;
Jiri Olsaa151a372016-04-12 15:29:29 +0200164 const char *color_pids_str;
Jiri Olsaf8548392019-07-21 13:23:49 +0200165 struct perf_cpu_map *color_cpus;
Jiri Olsacf294f22016-04-12 15:29:30 +0200166 const char *color_cpus_str;
Jiri Olsaf8548392019-07-21 13:23:49 +0200167 struct perf_cpu_map *cpus;
Jiri Olsa73643bb2016-04-12 15:29:31 +0200168 const char *cpus_str;
Jiri Olsa99623c62016-04-12 15:29:26 +0200169};
170
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300171struct perf_sched {
172 struct perf_tool tool;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300173 const char *sort_order;
174 unsigned long nr_tasks;
Yunlong Songcb06ac22015-03-31 21:46:30 +0800175 struct task_desc **pid_to_task;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300176 struct task_desc **tasks;
177 const struct trace_sched_handler *tp_handler;
178 pthread_mutex_t start_work_mutex;
179 pthread_mutex_t work_done_wait_mutex;
180 int profile_cpu;
181/*
182 * Track the current task - that way we can know whether there's any
183 * weird events, such as a task being switched away that is not current.
184 */
185 int max_cpu;
186 u32 curr_pid[MAX_CPUS];
187 struct thread *curr_thread[MAX_CPUS];
188 char next_shortname1;
189 char next_shortname2;
190 unsigned int replay_repeat;
191 unsigned long nr_run_events;
192 unsigned long nr_sleep_events;
193 unsigned long nr_wakeup_events;
194 unsigned long nr_sleep_corrections;
195 unsigned long nr_run_events_optimized;
196 unsigned long targetless_wakeups;
197 unsigned long multitarget_wakeups;
198 unsigned long nr_runs;
199 unsigned long nr_timestamps;
200 unsigned long nr_unordered_timestamps;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300201 unsigned long nr_context_switch_bugs;
202 unsigned long nr_events;
203 unsigned long nr_lost_chunks;
204 unsigned long nr_lost_events;
205 u64 run_measurement_overhead;
206 u64 sleep_measurement_overhead;
207 u64 start_time;
208 u64 cpu_usage;
209 u64 runavg_cpu_usage;
210 u64 parent_cpu_usage;
211 u64 runavg_parent_cpu_usage;
212 u64 sum_runtime;
213 u64 sum_fluct;
214 u64 run_avg;
215 u64 all_runtime;
216 u64 all_count;
217 u64 cpu_last_switched[MAX_CPUS];
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800218 struct rb_root_cached atom_root, sorted_atom_root, merged_atom_root;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300219 struct list_head sort_list, cmp_pid;
Yunlong Song939cda52015-03-31 21:46:34 +0800220 bool force;
Josef Bacik2f80dd42015-05-22 09:18:40 -0400221 bool skip_merge;
Jiri Olsa99623c62016-04-12 15:29:26 +0200222 struct perf_sched_map map;
David Ahern52df1382016-11-16 15:06:30 +0900223
224 /* options for timehist command */
225 bool summary;
226 bool summary_only;
Namhyung Kim699b5b92016-12-08 23:47:52 +0900227 bool idle_hist;
David Ahern6c973c92016-11-16 15:06:32 +0900228 bool show_callchain;
229 unsigned int max_stack;
David Aherna407b062016-11-16 15:06:33 +0900230 bool show_cpu_visual;
David Ahernfc1469f2016-11-16 15:06:31 +0900231 bool show_wakeups;
Brendan Gregg292c4a82017-03-14 01:56:29 +0000232 bool show_next;
David Ahern350f54f2016-11-25 09:28:41 -0700233 bool show_migrations;
Namhyung Kim414e0502017-01-13 19:45:22 +0900234 bool show_state;
David Ahern52df1382016-11-16 15:06:30 +0900235 u64 skipped_samples;
David Ahern853b7402016-11-29 10:15:44 -0700236 const char *time_str;
237 struct perf_time_interval ptime;
Namhyung Kim9396c9c2016-12-22 15:03:50 +0900238 struct perf_time_interval hist_time;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300239};
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200240
David Ahern49394a22016-11-16 15:06:29 +0900241/* per thread run time data */
242struct thread_runtime {
243 u64 last_time; /* time of previous sched in/out event */
244 u64 dt_run; /* run time */
Namhyung Kim941bdea2017-01-13 19:45:21 +0900245 u64 dt_sleep; /* time between CPU access by sleep (off cpu) */
246 u64 dt_iowait; /* time between CPU access by iowait (off cpu) */
247 u64 dt_preempt; /* time between CPU access by preempt (off cpu) */
David Ahern49394a22016-11-16 15:06:29 +0900248 u64 dt_delay; /* time between wakeup and sched-in */
249 u64 ready_to_run; /* time of wakeup */
250
251 struct stats run_stats;
252 u64 total_run_time;
Namhyung Kim587782c2017-01-13 19:45:23 +0900253 u64 total_sleep_time;
254 u64 total_iowait_time;
255 u64 total_preempt_time;
256 u64 total_delay_time;
David Ahern350f54f2016-11-25 09:28:41 -0700257
Namhyung Kim941bdea2017-01-13 19:45:21 +0900258 int last_state;
Changbin Du8640da92018-03-06 11:37:36 +0800259
260 char shortname[3];
Changbin Du99a3c3a2018-03-06 11:37:37 +0800261 bool comm_changed;
262
David Ahern350f54f2016-11-25 09:28:41 -0700263 u64 migrations;
David Ahern49394a22016-11-16 15:06:29 +0900264};
265
266/* per event run time data */
267struct evsel_runtime {
268 u64 *last_time; /* time this event was last seen per cpu */
269 u32 ncpu; /* highest cpu slot allocated */
270};
271
Namhyung Kim3bc2fa92016-12-08 23:47:51 +0900272/* per cpu idle time data */
273struct idle_thread_runtime {
274 struct thread_runtime tr;
275 struct thread *last_thread;
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800276 struct rb_root_cached sorted_root;
Namhyung Kim3bc2fa92016-12-08 23:47:51 +0900277 struct callchain_root callchain;
278 struct callchain_cursor cursor;
279};
280
/*
 * Idle time tracking, one entry per cpu: the table of idle threads,
 * the cpu bound recorded for it and the comm given to those threads.
 */
static struct thread	**idle_threads;
static int		idle_max_cpu;
static char		idle_comm[] = "<idle>";
285
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200286static u64 get_nsecs(void)
287{
288 struct timespec ts;
289
290 clock_gettime(CLOCK_MONOTONIC, &ts);
291
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300292 return ts.tv_sec * NSEC_PER_SEC + ts.tv_nsec;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200293}
294
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300295static void burn_nsecs(struct perf_sched *sched, u64 nsecs)
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200296{
297 u64 T0 = get_nsecs(), T1;
298
299 do {
300 T1 = get_nsecs();
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300301 } while (T1 + sched->run_measurement_overhead < T0 + nsecs);
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200302}
303
304static void sleep_nsecs(u64 nsecs)
305{
306 struct timespec ts;
307
308 ts.tv_nsec = nsecs % 999999999;
309 ts.tv_sec = nsecs / 999999999;
310
311 nanosleep(&ts, NULL);
312}
313
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300314static void calibrate_run_measurement_overhead(struct perf_sched *sched)
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200315{
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300316 u64 T0, T1, delta, min_delta = NSEC_PER_SEC;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200317 int i;
318
319 for (i = 0; i < 10; i++) {
320 T0 = get_nsecs();
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300321 burn_nsecs(sched, 0);
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200322 T1 = get_nsecs();
323 delta = T1-T0;
324 min_delta = min(min_delta, delta);
325 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300326 sched->run_measurement_overhead = min_delta;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200327
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -0200328 printf("run measurement overhead: %" PRIu64 " nsecs\n", min_delta);
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200329}
330
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300331static void calibrate_sleep_measurement_overhead(struct perf_sched *sched)
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200332{
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300333 u64 T0, T1, delta, min_delta = NSEC_PER_SEC;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200334 int i;
335
336 for (i = 0; i < 10; i++) {
337 T0 = get_nsecs();
338 sleep_nsecs(10000);
339 T1 = get_nsecs();
340 delta = T1-T0;
341 min_delta = min(min_delta, delta);
342 }
343 min_delta -= 10000;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300344 sched->sleep_measurement_overhead = min_delta;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200345
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -0200346 printf("sleep measurement overhead: %" PRIu64 " nsecs\n", min_delta);
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200347}
348
mingo39aeb522009-09-14 20:04:48 +0200349static struct sched_atom *
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200350get_new_event(struct task_desc *task, u64 timestamp)
Ingo Molnarec156762009-09-11 12:12:54 +0200351{
Arnaldo Carvalho de Melo36479482009-11-24 12:05:16 -0200352 struct sched_atom *event = zalloc(sizeof(*event));
Ingo Molnarec156762009-09-11 12:12:54 +0200353 unsigned long idx = task->nr_events;
354 size_t size;
355
356 event->timestamp = timestamp;
357 event->nr = idx;
358
359 task->nr_events++;
mingo39aeb522009-09-14 20:04:48 +0200360 size = sizeof(struct sched_atom *) * task->nr_events;
361 task->atoms = realloc(task->atoms, size);
362 BUG_ON(!task->atoms);
Ingo Molnarec156762009-09-11 12:12:54 +0200363
mingo39aeb522009-09-14 20:04:48 +0200364 task->atoms[idx] = event;
Ingo Molnarec156762009-09-11 12:12:54 +0200365
366 return event;
367}
368
mingo39aeb522009-09-14 20:04:48 +0200369static struct sched_atom *last_event(struct task_desc *task)
Ingo Molnarec156762009-09-11 12:12:54 +0200370{
371 if (!task->nr_events)
372 return NULL;
373
mingo39aeb522009-09-14 20:04:48 +0200374 return task->atoms[task->nr_events - 1];
Ingo Molnarec156762009-09-11 12:12:54 +0200375}
376
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300377static void add_sched_event_run(struct perf_sched *sched, struct task_desc *task,
378 u64 timestamp, u64 duration)
Ingo Molnarec156762009-09-11 12:12:54 +0200379{
mingo39aeb522009-09-14 20:04:48 +0200380 struct sched_atom *event, *curr_event = last_event(task);
Ingo Molnarec156762009-09-11 12:12:54 +0200381
382 /*
Ingo Molnarfbf94822009-09-11 12:12:54 +0200383 * optimize an existing RUN event by merging this one
384 * to it:
385 */
Ingo Molnarec156762009-09-11 12:12:54 +0200386 if (curr_event && curr_event->type == SCHED_EVENT_RUN) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300387 sched->nr_run_events_optimized++;
Ingo Molnarec156762009-09-11 12:12:54 +0200388 curr_event->duration += duration;
389 return;
390 }
391
392 event = get_new_event(task, timestamp);
393
394 event->type = SCHED_EVENT_RUN;
395 event->duration = duration;
396
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300397 sched->nr_run_events++;
Ingo Molnarec156762009-09-11 12:12:54 +0200398}
399
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300400static void add_sched_event_wakeup(struct perf_sched *sched, struct task_desc *task,
401 u64 timestamp, struct task_desc *wakee)
Ingo Molnarec156762009-09-11 12:12:54 +0200402{
mingo39aeb522009-09-14 20:04:48 +0200403 struct sched_atom *event, *wakee_event;
Ingo Molnarec156762009-09-11 12:12:54 +0200404
405 event = get_new_event(task, timestamp);
406 event->type = SCHED_EVENT_WAKEUP;
407 event->wakee = wakee;
408
409 wakee_event = last_event(wakee);
410 if (!wakee_event || wakee_event->type != SCHED_EVENT_SLEEP) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300411 sched->targetless_wakeups++;
Ingo Molnarec156762009-09-11 12:12:54 +0200412 return;
413 }
414 if (wakee_event->wait_sem) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300415 sched->multitarget_wakeups++;
Ingo Molnarec156762009-09-11 12:12:54 +0200416 return;
417 }
418
Arnaldo Carvalho de Melo36479482009-11-24 12:05:16 -0200419 wakee_event->wait_sem = zalloc(sizeof(*wakee_event->wait_sem));
Ingo Molnarec156762009-09-11 12:12:54 +0200420 sem_init(wakee_event->wait_sem, 0, 0);
421 wakee_event->specific_wait = 1;
422 event->wait_sem = wakee_event->wait_sem;
423
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300424 sched->nr_wakeup_events++;
Ingo Molnarec156762009-09-11 12:12:54 +0200425}
426
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300427static void add_sched_event_sleep(struct perf_sched *sched, struct task_desc *task,
428 u64 timestamp, u64 task_state __maybe_unused)
Ingo Molnarec156762009-09-11 12:12:54 +0200429{
mingo39aeb522009-09-14 20:04:48 +0200430 struct sched_atom *event = get_new_event(task, timestamp);
Ingo Molnarec156762009-09-11 12:12:54 +0200431
432 event->type = SCHED_EVENT_SLEEP;
433
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300434 sched->nr_sleep_events++;
Ingo Molnarec156762009-09-11 12:12:54 +0200435}
436
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300437static struct task_desc *register_pid(struct perf_sched *sched,
438 unsigned long pid, const char *comm)
Ingo Molnarec156762009-09-11 12:12:54 +0200439{
440 struct task_desc *task;
Yunlong Songcb06ac22015-03-31 21:46:30 +0800441 static int pid_max;
Ingo Molnarec156762009-09-11 12:12:54 +0200442
Yunlong Songcb06ac22015-03-31 21:46:30 +0800443 if (sched->pid_to_task == NULL) {
444 if (sysctl__read_int("kernel/pid_max", &pid_max) < 0)
445 pid_max = MAX_PID;
446 BUG_ON((sched->pid_to_task = calloc(pid_max, sizeof(struct task_desc *))) == NULL);
447 }
Yunlong Song3a423a52015-03-31 21:46:31 +0800448 if (pid >= (unsigned long)pid_max) {
449 BUG_ON((sched->pid_to_task = realloc(sched->pid_to_task, (pid + 1) *
450 sizeof(struct task_desc *))) == NULL);
451 while (pid >= (unsigned long)pid_max)
452 sched->pid_to_task[pid_max++] = NULL;
453 }
Ingo Molnarec156762009-09-11 12:12:54 +0200454
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300455 task = sched->pid_to_task[pid];
Ingo Molnarec156762009-09-11 12:12:54 +0200456
457 if (task)
458 return task;
459
Arnaldo Carvalho de Melo36479482009-11-24 12:05:16 -0200460 task = zalloc(sizeof(*task));
Ingo Molnarec156762009-09-11 12:12:54 +0200461 task->pid = pid;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300462 task->nr = sched->nr_tasks;
Ingo Molnarec156762009-09-11 12:12:54 +0200463 strcpy(task->comm, comm);
464 /*
465 * every task starts in sleeping state - this gets ignored
466 * if there's no wakeup pointing to this sleep state:
467 */
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300468 add_sched_event_sleep(sched, task, 0, 0);
Ingo Molnarec156762009-09-11 12:12:54 +0200469
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300470 sched->pid_to_task[pid] = task;
471 sched->nr_tasks++;
Yunlong Song0755bc42015-03-31 21:46:28 +0800472 sched->tasks = realloc(sched->tasks, sched->nr_tasks * sizeof(struct task_desc *));
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300473 BUG_ON(!sched->tasks);
474 sched->tasks[task->nr] = task;
Ingo Molnarec156762009-09-11 12:12:54 +0200475
Namhyung Kimbb963e12017-02-17 17:17:38 +0900476 if (verbose > 0)
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300477 printf("registered task #%ld, PID %ld (%s)\n", sched->nr_tasks, pid, comm);
Ingo Molnarec156762009-09-11 12:12:54 +0200478
479 return task;
480}
481
482
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300483static void print_task_traces(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200484{
485 struct task_desc *task;
486 unsigned long i;
487
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300488 for (i = 0; i < sched->nr_tasks; i++) {
489 task = sched->tasks[i];
Ingo Molnarad236fd2009-09-11 12:12:54 +0200490 printf("task %6ld (%20s:%10ld), nr_events: %ld\n",
Ingo Molnarec156762009-09-11 12:12:54 +0200491 task->nr, task->comm, task->pid, task->nr_events);
492 }
493}
494
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300495static void add_cross_task_wakeups(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200496{
497 struct task_desc *task1, *task2;
498 unsigned long i, j;
499
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300500 for (i = 0; i < sched->nr_tasks; i++) {
501 task1 = sched->tasks[i];
Ingo Molnarec156762009-09-11 12:12:54 +0200502 j = i + 1;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300503 if (j == sched->nr_tasks)
Ingo Molnarec156762009-09-11 12:12:54 +0200504 j = 0;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300505 task2 = sched->tasks[j];
506 add_sched_event_wakeup(sched, task1, 0, task2);
Ingo Molnarec156762009-09-11 12:12:54 +0200507 }
508}
509
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300510static void perf_sched__process_event(struct perf_sched *sched,
511 struct sched_atom *atom)
Ingo Molnarec156762009-09-11 12:12:54 +0200512{
513 int ret = 0;
Ingo Molnarec156762009-09-11 12:12:54 +0200514
mingo39aeb522009-09-14 20:04:48 +0200515 switch (atom->type) {
Ingo Molnarec156762009-09-11 12:12:54 +0200516 case SCHED_EVENT_RUN:
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300517 burn_nsecs(sched, atom->duration);
Ingo Molnarec156762009-09-11 12:12:54 +0200518 break;
519 case SCHED_EVENT_SLEEP:
mingo39aeb522009-09-14 20:04:48 +0200520 if (atom->wait_sem)
521 ret = sem_wait(atom->wait_sem);
Ingo Molnarec156762009-09-11 12:12:54 +0200522 BUG_ON(ret);
523 break;
524 case SCHED_EVENT_WAKEUP:
mingo39aeb522009-09-14 20:04:48 +0200525 if (atom->wait_sem)
526 ret = sem_post(atom->wait_sem);
Ingo Molnarec156762009-09-11 12:12:54 +0200527 BUG_ON(ret);
528 break;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +0200529 case SCHED_EVENT_MIGRATION:
530 break;
Ingo Molnarec156762009-09-11 12:12:54 +0200531 default:
532 BUG_ON(1);
533 }
534}
535
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200536static u64 get_cpu_usage_nsec_parent(void)
Ingo Molnarec156762009-09-11 12:12:54 +0200537{
538 struct rusage ru;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200539 u64 sum;
Ingo Molnarec156762009-09-11 12:12:54 +0200540 int err;
541
542 err = getrusage(RUSAGE_SELF, &ru);
543 BUG_ON(err);
544
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300545 sum = ru.ru_utime.tv_sec * NSEC_PER_SEC + ru.ru_utime.tv_usec * NSEC_PER_USEC;
546 sum += ru.ru_stime.tv_sec * NSEC_PER_SEC + ru.ru_stime.tv_usec * NSEC_PER_USEC;
Ingo Molnarec156762009-09-11 12:12:54 +0200547
548 return sum;
549}
550
Yunlong Song939cda52015-03-31 21:46:34 +0800551static int self_open_counters(struct perf_sched *sched, unsigned long cur_task)
Ingo Molnarec156762009-09-11 12:12:54 +0200552{
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800553 struct perf_event_attr attr;
Yunlong Song939cda52015-03-31 21:46:34 +0800554 char sbuf[STRERR_BUFSIZE], info[STRERR_BUFSIZE];
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800555 int fd;
Yunlong Song939cda52015-03-31 21:46:34 +0800556 struct rlimit limit;
557 bool need_privilege = false;
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800558
559 memset(&attr, 0, sizeof(attr));
560
561 attr.type = PERF_TYPE_SOFTWARE;
562 attr.config = PERF_COUNT_SW_TASK_CLOCK;
563
Yunlong Song939cda52015-03-31 21:46:34 +0800564force_again:
Yann Droneaud57480d22014-06-30 22:28:47 +0200565 fd = sys_perf_event_open(&attr, 0, -1, -1,
566 perf_event_open_cloexec_flag());
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800567
Yunlong Song1aff59b2015-03-31 21:46:33 +0800568 if (fd < 0) {
Yunlong Song939cda52015-03-31 21:46:34 +0800569 if (errno == EMFILE) {
570 if (sched->force) {
571 BUG_ON(getrlimit(RLIMIT_NOFILE, &limit) == -1);
572 limit.rlim_cur += sched->nr_tasks - cur_task;
573 if (limit.rlim_cur > limit.rlim_max) {
574 limit.rlim_max = limit.rlim_cur;
575 need_privilege = true;
576 }
577 if (setrlimit(RLIMIT_NOFILE, &limit) == -1) {
578 if (need_privilege && errno == EPERM)
579 strcpy(info, "Need privilege\n");
580 } else
581 goto force_again;
582 } else
583 strcpy(info, "Have a try with -f option\n");
584 }
Namhyung Kim60b7d142012-09-12 11:11:06 +0900585 pr_err("Error: sys_perf_event_open() syscall returned "
Yunlong Song939cda52015-03-31 21:46:34 +0800586 "with %d (%s)\n%s", fd,
Arnaldo Carvalho de Meloc8b5f2c2016-07-06 11:56:20 -0300587 str_error_r(errno, sbuf, sizeof(sbuf)), info);
Yunlong Song1aff59b2015-03-31 21:46:33 +0800588 exit(EXIT_FAILURE);
589 }
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800590 return fd;
591}
592
593static u64 get_cpu_usage_nsec_self(int fd)
594{
595 u64 runtime;
Ingo Molnarec156762009-09-11 12:12:54 +0200596 int ret;
597
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800598 ret = read(fd, &runtime, sizeof(runtime));
599 BUG_ON(ret != sizeof(runtime));
Ingo Molnarec156762009-09-11 12:12:54 +0200600
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800601 return runtime;
Ingo Molnarec156762009-09-11 12:12:54 +0200602}
603
/*
 * Arguments handed to thread_func().  Allocated by create_tasks() and
 * freed by the new thread once it has copied the members.
 */
struct sched_thread_parms {
	struct task_desc	*task;	/* task this thread replays */
	struct perf_sched	*sched;
	int			fd;	/* counter fd from self_open_counters() */
};
609
Ingo Molnarec156762009-09-11 12:12:54 +0200610static void *thread_func(void *ctx)
611{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300612 struct sched_thread_parms *parms = ctx;
613 struct task_desc *this_task = parms->task;
614 struct perf_sched *sched = parms->sched;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200615 u64 cpu_usage_0, cpu_usage_1;
Ingo Molnarec156762009-09-11 12:12:54 +0200616 unsigned long i, ret;
617 char comm2[22];
Yunlong Song08097ab2015-03-31 21:46:32 +0800618 int fd = parms->fd;
Ingo Molnarec156762009-09-11 12:12:54 +0200619
Arnaldo Carvalho de Melo74cf2492013-12-27 16:55:14 -0300620 zfree(&parms);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300621
Ingo Molnarec156762009-09-11 12:12:54 +0200622 sprintf(comm2, ":%s", this_task->comm);
623 prctl(PR_SET_NAME, comm2);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300624 if (fd < 0)
625 return NULL;
Ingo Molnarec156762009-09-11 12:12:54 +0200626again:
627 ret = sem_post(&this_task->ready_for_work);
628 BUG_ON(ret);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300629 ret = pthread_mutex_lock(&sched->start_work_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200630 BUG_ON(ret);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300631 ret = pthread_mutex_unlock(&sched->start_work_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200632 BUG_ON(ret);
Ingo Molnarec156762009-09-11 12:12:54 +0200633
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800634 cpu_usage_0 = get_cpu_usage_nsec_self(fd);
Ingo Molnarec156762009-09-11 12:12:54 +0200635
636 for (i = 0; i < this_task->nr_events; i++) {
637 this_task->curr_event = i;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300638 perf_sched__process_event(sched, this_task->atoms[i]);
Ingo Molnarec156762009-09-11 12:12:54 +0200639 }
640
Xiao Guangrongc0c9e722009-12-09 17:51:30 +0800641 cpu_usage_1 = get_cpu_usage_nsec_self(fd);
Ingo Molnarec156762009-09-11 12:12:54 +0200642 this_task->cpu_usage = cpu_usage_1 - cpu_usage_0;
Ingo Molnarec156762009-09-11 12:12:54 +0200643 ret = sem_post(&this_task->work_done_sem);
644 BUG_ON(ret);
Ingo Molnarec156762009-09-11 12:12:54 +0200645
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300646 ret = pthread_mutex_lock(&sched->work_done_wait_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200647 BUG_ON(ret);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300648 ret = pthread_mutex_unlock(&sched->work_done_wait_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200649 BUG_ON(ret);
Ingo Molnarec156762009-09-11 12:12:54 +0200650
651 goto again;
652}
653
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300654static void create_tasks(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200655{
656 struct task_desc *task;
657 pthread_attr_t attr;
658 unsigned long i;
659 int err;
660
661 err = pthread_attr_init(&attr);
662 BUG_ON(err);
Jiri Pirko12f7e032011-01-10 14:14:23 -0200663 err = pthread_attr_setstacksize(&attr,
664 (size_t) max(16 * 1024, PTHREAD_STACK_MIN));
Ingo Molnarec156762009-09-11 12:12:54 +0200665 BUG_ON(err);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300666 err = pthread_mutex_lock(&sched->start_work_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200667 BUG_ON(err);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300668 err = pthread_mutex_lock(&sched->work_done_wait_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200669 BUG_ON(err);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300670 for (i = 0; i < sched->nr_tasks; i++) {
671 struct sched_thread_parms *parms = malloc(sizeof(*parms));
672 BUG_ON(parms == NULL);
673 parms->task = task = sched->tasks[i];
674 parms->sched = sched;
Yunlong Song939cda52015-03-31 21:46:34 +0800675 parms->fd = self_open_counters(sched, i);
Ingo Molnarec156762009-09-11 12:12:54 +0200676 sem_init(&task->sleep_sem, 0, 0);
677 sem_init(&task->ready_for_work, 0, 0);
678 sem_init(&task->work_done_sem, 0, 0);
679 task->curr_event = 0;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300680 err = pthread_create(&task->thread, &attr, thread_func, parms);
Ingo Molnarec156762009-09-11 12:12:54 +0200681 BUG_ON(err);
682 }
683}
684
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300685static void wait_for_tasks(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200686{
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200687 u64 cpu_usage_0, cpu_usage_1;
Ingo Molnarec156762009-09-11 12:12:54 +0200688 struct task_desc *task;
689 unsigned long i, ret;
690
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300691 sched->start_time = get_nsecs();
692 sched->cpu_usage = 0;
693 pthread_mutex_unlock(&sched->work_done_wait_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200694
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300695 for (i = 0; i < sched->nr_tasks; i++) {
696 task = sched->tasks[i];
Ingo Molnarec156762009-09-11 12:12:54 +0200697 ret = sem_wait(&task->ready_for_work);
698 BUG_ON(ret);
699 sem_init(&task->ready_for_work, 0, 0);
700 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300701 ret = pthread_mutex_lock(&sched->work_done_wait_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200702 BUG_ON(ret);
703
704 cpu_usage_0 = get_cpu_usage_nsec_parent();
705
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300706 pthread_mutex_unlock(&sched->start_work_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200707
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300708 for (i = 0; i < sched->nr_tasks; i++) {
709 task = sched->tasks[i];
Ingo Molnarec156762009-09-11 12:12:54 +0200710 ret = sem_wait(&task->work_done_sem);
711 BUG_ON(ret);
712 sem_init(&task->work_done_sem, 0, 0);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300713 sched->cpu_usage += task->cpu_usage;
Ingo Molnarec156762009-09-11 12:12:54 +0200714 task->cpu_usage = 0;
715 }
716
717 cpu_usage_1 = get_cpu_usage_nsec_parent();
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300718 if (!sched->runavg_cpu_usage)
719 sched->runavg_cpu_usage = sched->cpu_usage;
Yunlong Songff5f3bb2015-03-31 21:46:36 +0800720 sched->runavg_cpu_usage = (sched->runavg_cpu_usage * (sched->replay_repeat - 1) + sched->cpu_usage) / sched->replay_repeat;
Ingo Molnarec156762009-09-11 12:12:54 +0200721
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300722 sched->parent_cpu_usage = cpu_usage_1 - cpu_usage_0;
723 if (!sched->runavg_parent_cpu_usage)
724 sched->runavg_parent_cpu_usage = sched->parent_cpu_usage;
Yunlong Songff5f3bb2015-03-31 21:46:36 +0800725 sched->runavg_parent_cpu_usage = (sched->runavg_parent_cpu_usage * (sched->replay_repeat - 1) +
726 sched->parent_cpu_usage)/sched->replay_repeat;
Ingo Molnarec156762009-09-11 12:12:54 +0200727
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300728 ret = pthread_mutex_lock(&sched->start_work_mutex);
Ingo Molnarec156762009-09-11 12:12:54 +0200729 BUG_ON(ret);
730
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300731 for (i = 0; i < sched->nr_tasks; i++) {
732 task = sched->tasks[i];
Ingo Molnarec156762009-09-11 12:12:54 +0200733 sem_init(&task->sleep_sem, 0, 0);
734 task->curr_event = 0;
735 }
736}
737
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300738static void run_one_test(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200739{
Kyle McMartinfb7d0b32011-01-24 11:13:04 -0500740 u64 T0, T1, delta, avg_delta, fluct;
Ingo Molnarec156762009-09-11 12:12:54 +0200741
742 T0 = get_nsecs();
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300743 wait_for_tasks(sched);
Ingo Molnarec156762009-09-11 12:12:54 +0200744 T1 = get_nsecs();
745
746 delta = T1 - T0;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300747 sched->sum_runtime += delta;
748 sched->nr_runs++;
Ingo Molnarec156762009-09-11 12:12:54 +0200749
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300750 avg_delta = sched->sum_runtime / sched->nr_runs;
Ingo Molnarec156762009-09-11 12:12:54 +0200751 if (delta < avg_delta)
752 fluct = avg_delta - delta;
753 else
754 fluct = delta - avg_delta;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300755 sched->sum_fluct += fluct;
756 if (!sched->run_avg)
757 sched->run_avg = delta;
Yunlong Songff5f3bb2015-03-31 21:46:36 +0800758 sched->run_avg = (sched->run_avg * (sched->replay_repeat - 1) + delta) / sched->replay_repeat;
Ingo Molnarec156762009-09-11 12:12:54 +0200759
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300760 printf("#%-3ld: %0.3f, ", sched->nr_runs, (double)delta / NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200761
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300762 printf("ravg: %0.2f, ", (double)sched->run_avg / NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200763
Ingo Molnarad236fd2009-09-11 12:12:54 +0200764 printf("cpu: %0.2f / %0.2f",
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300765 (double)sched->cpu_usage / NSEC_PER_MSEC, (double)sched->runavg_cpu_usage / NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200766
767#if 0
768 /*
Ingo Molnarfbf94822009-09-11 12:12:54 +0200769 * rusage statistics done by the parent, these are less
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300770 * accurate than the sched->sum_exec_runtime based statistics:
Ingo Molnarfbf94822009-09-11 12:12:54 +0200771 */
Ingo Molnarad236fd2009-09-11 12:12:54 +0200772 printf(" [%0.2f / %0.2f]",
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300773 (double)sched->parent_cpu_usage / NSEC_PER_MSEC,
774 (double)sched->runavg_parent_cpu_usage / NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200775#endif
776
Ingo Molnarad236fd2009-09-11 12:12:54 +0200777 printf("\n");
Ingo Molnarec156762009-09-11 12:12:54 +0200778
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300779 if (sched->nr_sleep_corrections)
780 printf(" (%ld sleep corrections)\n", sched->nr_sleep_corrections);
781 sched->nr_sleep_corrections = 0;
Ingo Molnarec156762009-09-11 12:12:54 +0200782}
783
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300784static void test_calibrations(struct perf_sched *sched)
Ingo Molnarec156762009-09-11 12:12:54 +0200785{
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200786 u64 T0, T1;
Ingo Molnarec156762009-09-11 12:12:54 +0200787
788 T0 = get_nsecs();
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300789 burn_nsecs(sched, NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200790 T1 = get_nsecs();
791
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -0200792 printf("the run test took %" PRIu64 " nsecs\n", T1 - T0);
Ingo Molnarec156762009-09-11 12:12:54 +0200793
794 T0 = get_nsecs();
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -0300795 sleep_nsecs(NSEC_PER_MSEC);
Ingo Molnarec156762009-09-11 12:12:54 +0200796 T1 = get_nsecs();
797
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -0200798 printf("the sleep test took %" PRIu64 " nsecs\n", T1 - T0);
Ingo Molnarec156762009-09-11 12:12:54 +0200799}
800
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300801static int
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300802replay_wakeup_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +0200803 struct evsel *evsel, struct perf_sample *sample,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300804 struct machine *machine __maybe_unused)
Ingo Molnarec156762009-09-11 12:12:54 +0200805{
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300806 const char *comm = perf_evsel__strval(evsel, sample, "comm");
807 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200808 struct task_desc *waker, *wakee;
809
Namhyung Kimbb963e12017-02-17 17:17:38 +0900810 if (verbose > 0) {
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -0300811 printf("sched_wakeup event %p\n", evsel);
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200812
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300813 printf(" ... pid %d woke up %s/%d\n", sample->tid, comm, pid);
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200814 }
815
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -0300816 waker = register_pid(sched, sample->tid, "<unknown>");
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300817 wakee = register_pid(sched, pid, comm);
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200818
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300819 add_sched_event_wakeup(sched, waker, sample->time, wakee);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300820 return 0;
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200821}
822
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300823static int replay_switch_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +0200824 struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300825 struct perf_sample *sample,
826 struct machine *machine __maybe_unused)
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200827{
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300828 const char *prev_comm = perf_evsel__strval(evsel, sample, "prev_comm"),
829 *next_comm = perf_evsel__strval(evsel, sample, "next_comm");
830 const u32 prev_pid = perf_evsel__intval(evsel, sample, "prev_pid"),
831 next_pid = perf_evsel__intval(evsel, sample, "next_pid");
832 const u64 prev_state = perf_evsel__intval(evsel, sample, "prev_state");
Irina Tirdea1d037ca2012-09-11 01:15:03 +0300833 struct task_desc *prev, __maybe_unused *next;
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -0300834 u64 timestamp0, timestamp = sample->time;
835 int cpu = sample->cpu;
Ingo Molnarfbf94822009-09-11 12:12:54 +0200836 s64 delta;
837
Namhyung Kimbb963e12017-02-17 17:17:38 +0900838 if (verbose > 0)
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -0300839 printf("sched_switch event %p\n", evsel);
Ingo Molnarad236fd2009-09-11 12:12:54 +0200840
Ingo Molnarfbf94822009-09-11 12:12:54 +0200841 if (cpu >= MAX_CPUS || cpu < 0)
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300842 return 0;
Ingo Molnarfbf94822009-09-11 12:12:54 +0200843
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300844 timestamp0 = sched->cpu_last_switched[cpu];
Ingo Molnarfbf94822009-09-11 12:12:54 +0200845 if (timestamp0)
846 delta = timestamp - timestamp0;
847 else
848 delta = 0;
849
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300850 if (delta < 0) {
Namhyung Kim60b7d142012-09-12 11:11:06 +0900851 pr_err("hm, delta: %" PRIu64 " < 0 ?\n", delta);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300852 return -1;
853 }
Ingo Molnarfbf94822009-09-11 12:12:54 +0200854
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300855 pr_debug(" ... switch from %s/%d to %s/%d [ran %" PRIu64 " nsecs]\n",
856 prev_comm, prev_pid, next_comm, next_pid, delta);
Ingo Molnarfbf94822009-09-11 12:12:54 +0200857
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300858 prev = register_pid(sched, prev_pid, prev_comm);
859 next = register_pid(sched, next_pid, next_comm);
Ingo Molnarfbf94822009-09-11 12:12:54 +0200860
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300861 sched->cpu_last_switched[cpu] = timestamp;
Ingo Molnarfbf94822009-09-11 12:12:54 +0200862
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -0300863 add_sched_event_run(sched, prev, timestamp, delta);
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300864 add_sched_event_sleep(sched, prev, timestamp, prev_state);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300865
866 return 0;
Ingo Molnarfbf94822009-09-11 12:12:54 +0200867}
868
David Aherncb627502013-08-07 22:50:47 -0400869static int replay_fork_event(struct perf_sched *sched,
870 union perf_event *event,
871 struct machine *machine)
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200872{
David Aherncb627502013-08-07 22:50:47 -0400873 struct thread *child, *parent;
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300874
Adrian Hunter314add62013-08-27 11:23:03 +0300875 child = machine__findnew_thread(machine, event->fork.pid,
876 event->fork.tid);
877 parent = machine__findnew_thread(machine, event->fork.ppid,
878 event->fork.ptid);
David Aherncb627502013-08-07 22:50:47 -0400879
880 if (child == NULL || parent == NULL) {
881 pr_debug("thread does not exist on fork event: child %p, parent %p\n",
882 child, parent);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -0300883 goto out_put;
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200884 }
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -0300885
Namhyung Kimbb963e12017-02-17 17:17:38 +0900886 if (verbose > 0) {
David Aherncb627502013-08-07 22:50:47 -0400887 printf("fork event\n");
Frederic Weisbeckerb9c51432013-09-11 14:46:56 +0200888 printf("... parent: %s/%d\n", thread__comm_str(parent), parent->tid);
889 printf("... child: %s/%d\n", thread__comm_str(child), child->tid);
David Aherncb627502013-08-07 22:50:47 -0400890 }
891
Frederic Weisbeckerb9c51432013-09-11 14:46:56 +0200892 register_pid(sched, parent->tid, thread__comm_str(parent));
893 register_pid(sched, child->tid, thread__comm_str(child));
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -0300894out_put:
895 thread__put(child);
896 thread__put(parent);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -0300897 return 0;
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +0200898}
899
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200900struct sort_dimension {
901 const char *name;
Ingo Molnarb5fae122009-09-11 12:12:54 +0200902 sort_fn_t cmp;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +0200903 struct list_head list;
904};
905
Changbin Du8640da92018-03-06 11:37:36 +0800906/*
907 * handle runtime stats saved per thread
908 */
909static struct thread_runtime *thread__init_runtime(struct thread *thread)
910{
911 struct thread_runtime *r;
912
913 r = zalloc(sizeof(struct thread_runtime));
914 if (!r)
915 return NULL;
916
917 init_stats(&r->run_stats);
918 thread__set_priv(thread, r);
919
920 return r;
921}
922
/*
 * Return the thread_runtime stored as @thread's private data, creating it
 * on first use.  Returns NULL (after a debug message) if it had to be
 * created and the allocation failed.
 */
static struct thread_runtime *thread__get_runtime(struct thread *thread)
{
	struct thread_runtime *runtime = thread__priv(thread);

	if (runtime != NULL)
		return runtime;

	runtime = thread__init_runtime(thread);
	if (runtime == NULL)
		pr_debug("Failed to malloc memory for runtime data.\n");

	return runtime;
}
936
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200937static int
mingo39aeb522009-09-14 20:04:48 +0200938thread_lat_cmp(struct list_head *list, struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200939{
940 struct sort_dimension *sort;
941 int ret = 0;
942
Ingo Molnarb5fae122009-09-11 12:12:54 +0200943 BUG_ON(list_empty(list));
944
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200945 list_for_each_entry(sort, list, list) {
946 ret = sort->cmp(l, r);
947 if (ret)
948 return ret;
949 }
950
951 return ret;
952}
953
mingo39aeb522009-09-14 20:04:48 +0200954static struct work_atoms *
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800955thread_atoms_search(struct rb_root_cached *root, struct thread *thread,
Ingo Molnarb5fae122009-09-11 12:12:54 +0200956 struct list_head *sort_list)
957{
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800958 struct rb_node *node = root->rb_root.rb_node;
mingo39aeb522009-09-14 20:04:48 +0200959 struct work_atoms key = { .thread = thread };
Ingo Molnarb5fae122009-09-11 12:12:54 +0200960
961 while (node) {
mingo39aeb522009-09-14 20:04:48 +0200962 struct work_atoms *atoms;
Ingo Molnarb5fae122009-09-11 12:12:54 +0200963 int cmp;
964
mingo39aeb522009-09-14 20:04:48 +0200965 atoms = container_of(node, struct work_atoms, node);
Ingo Molnarb5fae122009-09-11 12:12:54 +0200966
967 cmp = thread_lat_cmp(sort_list, &key, atoms);
968 if (cmp > 0)
969 node = node->rb_left;
970 else if (cmp < 0)
971 node = node->rb_right;
972 else {
973 BUG_ON(thread != atoms->thread);
974 return atoms;
975 }
976 }
977 return NULL;
978}
979
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200980static void
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800981__thread_latency_insert(struct rb_root_cached *root, struct work_atoms *data,
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200982 struct list_head *sort_list)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200983{
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800984 struct rb_node **new = &(root->rb_root.rb_node), *parent = NULL;
985 bool leftmost = true;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200986
987 while (*new) {
mingo39aeb522009-09-14 20:04:48 +0200988 struct work_atoms *this;
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200989 int cmp;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200990
mingo39aeb522009-09-14 20:04:48 +0200991 this = container_of(*new, struct work_atoms, node);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200992 parent = *new;
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200993
994 cmp = thread_lat_cmp(sort_list, data, this);
995
996 if (cmp > 0)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +0200997 new = &((*new)->rb_left);
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -0800998 else {
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +0200999 new = &((*new)->rb_right);
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08001000 leftmost = false;
1001 }
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001002 }
1003
1004 rb_link_node(&data->node, parent, new);
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08001005 rb_insert_color_cached(&data->node, root, leftmost);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001006}
1007
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001008static int thread_atoms_insert(struct perf_sched *sched, struct thread *thread)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001009{
Arnaldo Carvalho de Melo36479482009-11-24 12:05:16 -02001010 struct work_atoms *atoms = zalloc(sizeof(*atoms));
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001011 if (!atoms) {
1012 pr_err("No memory at %s\n", __func__);
1013 return -1;
1014 }
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001015
Arnaldo Carvalho de Melof3b623b2015-03-02 22:21:35 -03001016 atoms->thread = thread__get(thread);
mingo39aeb522009-09-14 20:04:48 +02001017 INIT_LIST_HEAD(&atoms->work_list);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001018 __thread_latency_insert(&sched->atom_root, atoms, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001019 return 0;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001020}
1021
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001022static char sched_out_state(u64 prev_state)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001023{
1024 const char *str = TASK_STATE_TO_CHAR_STR;
1025
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001026 return str[prev_state];
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001027}
1028
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001029static int
mingo39aeb522009-09-14 20:04:48 +02001030add_sched_out_event(struct work_atoms *atoms,
1031 char run_state,
1032 u64 timestamp)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001033{
Arnaldo Carvalho de Melo36479482009-11-24 12:05:16 -02001034 struct work_atom *atom = zalloc(sizeof(*atom));
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001035 if (!atom) {
1036 pr_err("Non memory at %s", __func__);
1037 return -1;
1038 }
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001039
Frederic Weisbeckeraa1ab9d2009-09-14 03:01:12 +02001040 atom->sched_out_time = timestamp;
1041
mingo39aeb522009-09-14 20:04:48 +02001042 if (run_state == 'R') {
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001043 atom->state = THREAD_WAIT_CPU;
Frederic Weisbeckeraa1ab9d2009-09-14 03:01:12 +02001044 atom->wake_up_time = atom->sched_out_time;
Frederic Weisbeckerc6ced612009-09-13 00:46:19 +02001045 }
1046
mingo39aeb522009-09-14 20:04:48 +02001047 list_add_tail(&atom->list, &atoms->work_list);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001048 return 0;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001049}
1050
1051static void
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001052add_runtime_event(struct work_atoms *atoms, u64 delta,
1053 u64 timestamp __maybe_unused)
mingo39aeb522009-09-14 20:04:48 +02001054{
1055 struct work_atom *atom;
1056
1057 BUG_ON(list_empty(&atoms->work_list));
1058
1059 atom = list_entry(atoms->work_list.prev, struct work_atom, list);
1060
1061 atom->runtime += delta;
1062 atoms->total_runtime += delta;
1063}
1064
1065static void
1066add_sched_in_event(struct work_atoms *atoms, u64 timestamp)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001067{
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001068 struct work_atom *atom;
Frederic Weisbecker66685672009-09-13 01:56:25 +02001069 u64 delta;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001070
mingo39aeb522009-09-14 20:04:48 +02001071 if (list_empty(&atoms->work_list))
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001072 return;
1073
mingo39aeb522009-09-14 20:04:48 +02001074 atom = list_entry(atoms->work_list.prev, struct work_atom, list);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001075
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001076 if (atom->state != THREAD_WAIT_CPU)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001077 return;
1078
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001079 if (timestamp < atom->wake_up_time) {
1080 atom->state = THREAD_IGNORE;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001081 return;
1082 }
1083
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001084 atom->state = THREAD_SCHED_IN;
1085 atom->sched_in_time = timestamp;
Frederic Weisbecker66685672009-09-13 01:56:25 +02001086
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001087 delta = atom->sched_in_time - atom->wake_up_time;
Frederic Weisbecker66685672009-09-13 01:56:25 +02001088 atoms->total_lat += delta;
Frederic Weisbecker3786310a2009-12-09 21:40:08 +01001089 if (delta > atoms->max_lat) {
Frederic Weisbecker66685672009-09-13 01:56:25 +02001090 atoms->max_lat = delta;
Frederic Weisbecker3786310a2009-12-09 21:40:08 +01001091 atoms->max_lat_at = timestamp;
1092 }
Frederic Weisbecker66685672009-09-13 01:56:25 +02001093 atoms->nb_atoms++;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001094}
1095
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001096static int latency_switch_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001097 struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001098 struct perf_sample *sample,
1099 struct machine *machine)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001100{
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001101 const u32 prev_pid = perf_evsel__intval(evsel, sample, "prev_pid"),
1102 next_pid = perf_evsel__intval(evsel, sample, "next_pid");
1103 const u64 prev_state = perf_evsel__intval(evsel, sample, "prev_state");
mingo39aeb522009-09-14 20:04:48 +02001104 struct work_atoms *out_events, *in_events;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001105 struct thread *sched_out, *sched_in;
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -03001106 u64 timestamp0, timestamp = sample->time;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001107 int cpu = sample->cpu, err = -1;
Ingo Molnarea92ed52009-09-12 10:08:34 +02001108 s64 delta;
1109
mingo39aeb522009-09-14 20:04:48 +02001110 BUG_ON(cpu >= MAX_CPUS || cpu < 0);
Ingo Molnarea92ed52009-09-12 10:08:34 +02001111
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001112 timestamp0 = sched->cpu_last_switched[cpu];
1113 sched->cpu_last_switched[cpu] = timestamp;
Ingo Molnarea92ed52009-09-12 10:08:34 +02001114 if (timestamp0)
1115 delta = timestamp - timestamp0;
1116 else
1117 delta = 0;
1118
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001119 if (delta < 0) {
1120 pr_err("hm, delta: %" PRIu64 " < 0 ?\n", delta);
1121 return -1;
1122 }
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001123
Adrian Hunter1fcb8762014-07-14 13:02:25 +03001124 sched_out = machine__findnew_thread(machine, -1, prev_pid);
1125 sched_in = machine__findnew_thread(machine, -1, next_pid);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001126 if (sched_out == NULL || sched_in == NULL)
1127 goto out_put;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001128
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001129 out_events = thread_atoms_search(&sched->atom_root, sched_out, &sched->cmp_pid);
mingo39aeb522009-09-14 20:04:48 +02001130 if (!out_events) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001131 if (thread_atoms_insert(sched, sched_out))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001132 goto out_put;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001133 out_events = thread_atoms_search(&sched->atom_root, sched_out, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001134 if (!out_events) {
1135 pr_err("out-event: Internal tree error");
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001136 goto out_put;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001137 }
mingo39aeb522009-09-14 20:04:48 +02001138 }
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001139 if (add_sched_out_event(out_events, sched_out_state(prev_state), timestamp))
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001140 return -1;
mingo39aeb522009-09-14 20:04:48 +02001141
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001142 in_events = thread_atoms_search(&sched->atom_root, sched_in, &sched->cmp_pid);
mingo39aeb522009-09-14 20:04:48 +02001143 if (!in_events) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001144 if (thread_atoms_insert(sched, sched_in))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001145 goto out_put;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001146 in_events = thread_atoms_search(&sched->atom_root, sched_in, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001147 if (!in_events) {
1148 pr_err("in-event: Internal tree error");
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001149 goto out_put;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001150 }
mingo39aeb522009-09-14 20:04:48 +02001151 /*
1152 * Take came in we have not heard about yet,
1153 * add in an initial atom in runnable state:
1154 */
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001155 if (add_sched_out_event(in_events, 'R', timestamp))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001156 goto out_put;
mingo39aeb522009-09-14 20:04:48 +02001157 }
1158 add_sched_in_event(in_events, timestamp);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001159 err = 0;
1160out_put:
1161 thread__put(sched_out);
1162 thread__put(sched_in);
1163 return err;
mingo39aeb522009-09-14 20:04:48 +02001164}
1165
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001166static int latency_runtime_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001167 struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001168 struct perf_sample *sample,
1169 struct machine *machine)
mingo39aeb522009-09-14 20:04:48 +02001170{
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001171 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
1172 const u64 runtime = perf_evsel__intval(evsel, sample, "runtime");
Adrian Hunter1fcb8762014-07-14 13:02:25 +03001173 struct thread *thread = machine__findnew_thread(machine, -1, pid);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001174 struct work_atoms *atoms = thread_atoms_search(&sched->atom_root, thread, &sched->cmp_pid);
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -03001175 u64 timestamp = sample->time;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001176 int cpu = sample->cpu, err = -1;
1177
1178 if (thread == NULL)
1179 return -1;
mingo39aeb522009-09-14 20:04:48 +02001180
1181 BUG_ON(cpu >= MAX_CPUS || cpu < 0);
mingo39aeb522009-09-14 20:04:48 +02001182 if (!atoms) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001183 if (thread_atoms_insert(sched, thread))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001184 goto out_put;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001185 atoms = thread_atoms_search(&sched->atom_root, thread, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001186 if (!atoms) {
Namhyung Kim60b7d142012-09-12 11:11:06 +09001187 pr_err("in-event: Internal tree error");
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001188 goto out_put;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001189 }
1190 if (add_sched_out_event(atoms, 'R', timestamp))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001191 goto out_put;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001192 }
1193
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001194 add_runtime_event(atoms, runtime, timestamp);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001195 err = 0;
1196out_put:
1197 thread__put(thread);
1198 return err;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001199}
1200
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001201static int latency_wakeup_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001202 struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001203 struct perf_sample *sample,
1204 struct machine *machine)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001205{
Peter Zijlstra0680ee72014-05-12 20:19:46 +02001206 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
mingo39aeb522009-09-14 20:04:48 +02001207 struct work_atoms *atoms;
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001208 struct work_atom *atom;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001209 struct thread *wakee;
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -03001210 u64 timestamp = sample->time;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001211 int err = -1;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001212
Adrian Hunter1fcb8762014-07-14 13:02:25 +03001213 wakee = machine__findnew_thread(machine, -1, pid);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001214 if (wakee == NULL)
1215 return -1;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001216 atoms = thread_atoms_search(&sched->atom_root, wakee, &sched->cmp_pid);
Frederic Weisbecker17562202009-09-12 23:11:32 +02001217 if (!atoms) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001218 if (thread_atoms_insert(sched, wakee))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001219 goto out_put;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001220 atoms = thread_atoms_search(&sched->atom_root, wakee, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001221 if (!atoms) {
Namhyung Kim60b7d142012-09-12 11:11:06 +09001222 pr_err("wakeup-event: Internal tree error");
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001223 goto out_put;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001224 }
1225 if (add_sched_out_event(atoms, 'S', timestamp))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001226 goto out_put;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001227 }
1228
mingo39aeb522009-09-14 20:04:48 +02001229 BUG_ON(list_empty(&atoms->work_list));
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001230
mingo39aeb522009-09-14 20:04:48 +02001231 atom = list_entry(atoms->work_list.prev, struct work_atom, list);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001232
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001233 /*
Dongsheng Yang67d6259dd2014-05-13 10:38:21 +09001234 * As we do not guarantee the wakeup event happens when
1235 * task is out of run queue, also may happen when task is
1236 * on run queue and wakeup only change ->state to TASK_RUNNING,
1237 * then we should not set the ->wake_up_time when wake up a
1238 * task which is on run queue.
1239 *
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001240 * You WILL be missing events if you've recorded only
1241 * one CPU, or are only looking at only one, so don't
Dongsheng Yang67d6259dd2014-05-13 10:38:21 +09001242 * skip in this case.
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001243 */
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001244 if (sched->profile_cpu == -1 && atom->state != THREAD_SLEEPING)
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001245 goto out_ok;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001246
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001247 sched->nr_timestamps++;
Ingo Molnarea57c4f2009-09-13 18:15:54 +02001248 if (atom->sched_out_time > timestamp) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001249 sched->nr_unordered_timestamps++;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001250 goto out_ok;
Ingo Molnarea57c4f2009-09-13 18:15:54 +02001251 }
Frederic Weisbeckeraa1ab9d2009-09-14 03:01:12 +02001252
Ingo Molnarb1ffe8f2009-09-11 12:12:54 +02001253 atom->state = THREAD_WAIT_CPU;
1254 atom->wake_up_time = timestamp;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001255out_ok:
1256 err = 0;
1257out_put:
1258 thread__put(wakee);
1259 return err;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001260}
1261
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001262static int latency_migrate_task_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001263 struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001264 struct perf_sample *sample,
1265 struct machine *machine)
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001266{
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001267 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -03001268 u64 timestamp = sample->time;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001269 struct work_atoms *atoms;
1270 struct work_atom *atom;
1271 struct thread *migrant;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001272 int err = -1;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001273
1274 /*
1275 * Only need to worry about migration when profiling one CPU.
1276 */
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001277 if (sched->profile_cpu == -1)
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001278 return 0;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001279
Adrian Hunter1fcb8762014-07-14 13:02:25 +03001280 migrant = machine__findnew_thread(machine, -1, pid);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001281 if (migrant == NULL)
1282 return -1;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001283 atoms = thread_atoms_search(&sched->atom_root, migrant, &sched->cmp_pid);
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001284 if (!atoms) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001285 if (thread_atoms_insert(sched, migrant))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001286 goto out_put;
Frederic Weisbeckerb9c51432013-09-11 14:46:56 +02001287 register_pid(sched, migrant->tid, thread__comm_str(migrant));
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001288 atoms = thread_atoms_search(&sched->atom_root, migrant, &sched->cmp_pid);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001289 if (!atoms) {
Namhyung Kim60b7d142012-09-12 11:11:06 +09001290 pr_err("migration-event: Internal tree error");
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001291 goto out_put;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001292 }
1293 if (add_sched_out_event(atoms, 'R', timestamp))
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001294 goto out_put;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001295 }
1296
1297 BUG_ON(list_empty(&atoms->work_list));
1298
1299 atom = list_entry(atoms->work_list.prev, struct work_atom, list);
1300 atom->sched_in_time = atom->sched_out_time = atom->wake_up_time = timestamp;
1301
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001302 sched->nr_timestamps++;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001303
1304 if (atom->sched_out_time > timestamp)
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001305 sched->nr_unordered_timestamps++;
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001306 err = 0;
1307out_put:
1308 thread__put(migrant);
1309 return err;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001310}
1311
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001312static void output_lat_thread(struct perf_sched *sched, struct work_atoms *work_list)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001313{
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001314 int i;
1315 int ret;
Frederic Weisbecker66685672009-09-13 01:56:25 +02001316 u64 avg;
Namhyung Kim99620a52016-10-24 11:02:45 +09001317 char max_lat_at[32];
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001318
mingo39aeb522009-09-14 20:04:48 +02001319 if (!work_list->nb_atoms)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001320 return;
Ingo Molnarea57c4f2009-09-13 18:15:54 +02001321 /*
1322 * Ignore idle threads:
1323 */
Frederic Weisbeckerb9c51432013-09-11 14:46:56 +02001324 if (!strcmp(thread__comm_str(work_list->thread), "swapper"))
Ingo Molnarea57c4f2009-09-13 18:15:54 +02001325 return;
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001326
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001327 sched->all_runtime += work_list->total_runtime;
1328 sched->all_count += work_list->nb_atoms;
Frederic Weisbecker66685672009-09-13 01:56:25 +02001329
Josef Bacik2f80dd42015-05-22 09:18:40 -04001330 if (work_list->num_merged > 1)
1331 ret = printf(" %s:(%d) ", thread__comm_str(work_list->thread), work_list->num_merged);
1332 else
1333 ret = printf(" %s:%d ", thread__comm_str(work_list->thread), work_list->thread->tid);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001334
mingo08f69e62009-09-14 18:30:44 +02001335 for (i = 0; i < 24 - ret; i++)
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001336 printf(" ");
1337
mingo39aeb522009-09-14 20:04:48 +02001338 avg = work_list->total_lat / work_list->nb_atoms;
Namhyung Kim99620a52016-10-24 11:02:45 +09001339 timestamp__scnprintf_usec(work_list->max_lat_at, max_lat_at, sizeof(max_lat_at));
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001340
Namhyung Kim99620a52016-10-24 11:02:45 +09001341 printf("|%11.3f ms |%9" PRIu64 " | avg:%9.3f ms | max:%9.3f ms | max at: %13s s\n",
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -03001342 (double)work_list->total_runtime / NSEC_PER_MSEC,
1343 work_list->nb_atoms, (double)avg / NSEC_PER_MSEC,
1344 (double)work_list->max_lat / NSEC_PER_MSEC,
Namhyung Kim99620a52016-10-24 11:02:45 +09001345 max_lat_at);
Frederic Weisbeckercdce9d72009-09-12 08:06:14 +02001346}
1347
mingo39aeb522009-09-14 20:04:48 +02001348static int pid_cmp(struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001349{
Jiri Olsa0014de12015-11-02 12:10:25 +01001350 if (l->thread == r->thread)
1351 return 0;
Adrian Hunter38051232013-07-04 16:20:31 +03001352 if (l->thread->tid < r->thread->tid)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001353 return -1;
Adrian Hunter38051232013-07-04 16:20:31 +03001354 if (l->thread->tid > r->thread->tid)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001355 return 1;
Jiri Olsa0014de12015-11-02 12:10:25 +01001356 return (int)(l->thread - r->thread);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001357}
1358
mingo39aeb522009-09-14 20:04:48 +02001359static int avg_cmp(struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001360{
1361 u64 avgl, avgr;
1362
1363 if (!l->nb_atoms)
1364 return -1;
1365
1366 if (!r->nb_atoms)
1367 return 1;
1368
1369 avgl = l->total_lat / l->nb_atoms;
1370 avgr = r->total_lat / r->nb_atoms;
1371
1372 if (avgl < avgr)
1373 return -1;
1374 if (avgl > avgr)
1375 return 1;
1376
1377 return 0;
1378}
1379
mingo39aeb522009-09-14 20:04:48 +02001380static int max_cmp(struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001381{
1382 if (l->max_lat < r->max_lat)
1383 return -1;
1384 if (l->max_lat > r->max_lat)
1385 return 1;
1386
1387 return 0;
1388}
1389
mingo39aeb522009-09-14 20:04:48 +02001390static int switch_cmp(struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001391{
1392 if (l->nb_atoms < r->nb_atoms)
1393 return -1;
1394 if (l->nb_atoms > r->nb_atoms)
1395 return 1;
1396
1397 return 0;
1398}
1399
mingo39aeb522009-09-14 20:04:48 +02001400static int runtime_cmp(struct work_atoms *l, struct work_atoms *r)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001401{
1402 if (l->total_runtime < r->total_runtime)
1403 return -1;
1404 if (l->total_runtime > r->total_runtime)
1405 return 1;
1406
1407 return 0;
1408}
1409
Randy Dunlapcbef79a2009-10-05 13:17:29 -07001410static int sort_dimension__add(const char *tok, struct list_head *list)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001411{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001412 size_t i;
1413 static struct sort_dimension avg_sort_dimension = {
1414 .name = "avg",
1415 .cmp = avg_cmp,
1416 };
1417 static struct sort_dimension max_sort_dimension = {
1418 .name = "max",
1419 .cmp = max_cmp,
1420 };
1421 static struct sort_dimension pid_sort_dimension = {
1422 .name = "pid",
1423 .cmp = pid_cmp,
1424 };
1425 static struct sort_dimension runtime_sort_dimension = {
1426 .name = "runtime",
1427 .cmp = runtime_cmp,
1428 };
1429 static struct sort_dimension switch_sort_dimension = {
1430 .name = "switch",
1431 .cmp = switch_cmp,
1432 };
1433 struct sort_dimension *available_sorts[] = {
1434 &pid_sort_dimension,
1435 &avg_sort_dimension,
1436 &max_sort_dimension,
1437 &switch_sort_dimension,
1438 &runtime_sort_dimension,
1439 };
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001440
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001441 for (i = 0; i < ARRAY_SIZE(available_sorts); i++) {
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001442 if (!strcmp(available_sorts[i]->name, tok)) {
1443 list_add_tail(&available_sorts[i]->list, list);
1444
1445 return 0;
1446 }
1447 }
1448
1449 return -1;
1450}
1451
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001452static void perf_sched__sort_lat(struct perf_sched *sched)
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001453{
1454 struct rb_node *node;
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08001455 struct rb_root_cached *root = &sched->atom_root;
Josef Bacik2f80dd42015-05-22 09:18:40 -04001456again:
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001457 for (;;) {
mingo39aeb522009-09-14 20:04:48 +02001458 struct work_atoms *data;
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08001459 node = rb_first_cached(root);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001460 if (!node)
1461 break;
1462
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08001463 rb_erase_cached(node, root);
mingo39aeb522009-09-14 20:04:48 +02001464 data = rb_entry(node, struct work_atoms, node);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001465 __thread_latency_insert(&sched->sorted_atom_root, data, &sched->sort_list);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001466 }
Josef Bacik2f80dd42015-05-22 09:18:40 -04001467 if (root == &sched->atom_root) {
1468 root = &sched->merged_atom_root;
1469 goto again;
1470 }
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02001471}
1472
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001473static int process_sched_wakeup_event(struct perf_tool *tool,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001474 struct evsel *evsel,
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001475 struct perf_sample *sample,
Arnaldo Carvalho de Melo4218e672012-09-11 13:18:47 -03001476 struct machine *machine)
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001477{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001478 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001479
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001480 if (sched->tp_handler->wakeup_event)
1481 return sched->tp_handler->wakeup_event(sched, evsel, sample, machine);
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001482
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001483 return 0;
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001484}
1485
/*
 * View of the per-thread private pointer used by the map output: the
 * "color" flag is stored in, and read back from, the pointer value itself.
 */
union map_priv {
	void	*ptr;
	bool	 color;
};

/* Returns the color flag stored in @thread's private pointer. */
static bool thread__has_color(struct thread *thread)
{
	union map_priv priv;

	priv.ptr = thread__priv(thread);

	return priv.color;
}
1499
1500static struct thread*
1501map__findnew_thread(struct perf_sched *sched, struct machine *machine, pid_t pid, pid_t tid)
1502{
1503 struct thread *thread = machine__findnew_thread(machine, pid, tid);
1504 union map_priv priv = {
1505 .color = false,
1506 };
1507
1508 if (!sched->map.color_pids || !thread || thread__priv(thread))
1509 return thread;
1510
1511 if (thread_map__has(sched->map.color_pids, tid))
1512 priv.color = true;
1513
1514 thread__set_priv(thread, priv.ptr);
1515 return thread;
1516}
1517
Jiri Olsa32dcd022019-07-21 13:23:51 +02001518static int map_switch_event(struct perf_sched *sched, struct evsel *evsel,
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001519 struct perf_sample *sample, struct machine *machine)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001520{
Dongsheng Yang9d372ca2014-05-16 14:37:05 +09001521 const u32 next_pid = perf_evsel__intval(evsel, sample, "next_pid");
1522 struct thread *sched_in;
Changbin Du8640da92018-03-06 11:37:36 +08001523 struct thread_runtime *tr;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001524 int new_shortname;
Arnaldo Carvalho de Melo7f7f8d02012-08-07 11:33:42 -03001525 u64 timestamp0, timestamp = sample->time;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001526 s64 delta;
Jiri Olsa99623c62016-04-12 15:29:26 +02001527 int i, this_cpu = sample->cpu;
1528 int cpus_nr;
1529 bool new_cpu = false;
Jiri Olsa8cd91192016-04-12 15:29:27 +02001530 const char *color = PERF_COLOR_NORMAL;
Namhyung Kim99620a52016-10-24 11:02:45 +09001531 char stimestamp[32];
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001532
1533 BUG_ON(this_cpu >= MAX_CPUS || this_cpu < 0);
1534
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001535 if (this_cpu > sched->max_cpu)
1536 sched->max_cpu = this_cpu;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001537
Jiri Olsa99623c62016-04-12 15:29:26 +02001538 if (sched->map.comp) {
1539 cpus_nr = bitmap_weight(sched->map.comp_cpus_mask, MAX_CPUS);
1540 if (!test_and_set_bit(this_cpu, sched->map.comp_cpus_mask)) {
1541 sched->map.comp_cpus[cpus_nr++] = this_cpu;
1542 new_cpu = true;
1543 }
1544 } else
1545 cpus_nr = sched->max_cpu;
1546
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001547 timestamp0 = sched->cpu_last_switched[this_cpu];
1548 sched->cpu_last_switched[this_cpu] = timestamp;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001549 if (timestamp0)
1550 delta = timestamp - timestamp0;
1551 else
1552 delta = 0;
1553
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001554 if (delta < 0) {
Namhyung Kim60b7d142012-09-12 11:11:06 +09001555 pr_err("hm, delta: %" PRIu64 " < 0 ?\n", delta);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001556 return -1;
1557 }
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001558
Jiri Olsaa151a372016-04-12 15:29:29 +02001559 sched_in = map__findnew_thread(sched, machine, -1, next_pid);
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001560 if (sched_in == NULL)
1561 return -1;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001562
Changbin Du8640da92018-03-06 11:37:36 +08001563 tr = thread__get_runtime(sched_in);
1564 if (tr == NULL) {
1565 thread__put(sched_in);
1566 return -1;
1567 }
1568
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001569 sched->curr_thread[this_cpu] = thread__get(sched_in);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001570
1571 printf(" ");
1572
1573 new_shortname = 0;
Changbin Du8640da92018-03-06 11:37:36 +08001574 if (!tr->shortname[0]) {
Dongsheng6bcab4e2014-05-06 14:39:01 +09001575 if (!strcmp(thread__comm_str(sched_in), "swapper")) {
1576 /*
1577 * Don't allocate a letter-number for swapper:0
1578 * as a shortname. Instead, we use '.' for it.
1579 */
Changbin Du8640da92018-03-06 11:37:36 +08001580 tr->shortname[0] = '.';
1581 tr->shortname[1] = ' ';
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001582 } else {
Changbin Du8640da92018-03-06 11:37:36 +08001583 tr->shortname[0] = sched->next_shortname1;
1584 tr->shortname[1] = sched->next_shortname2;
Dongsheng6bcab4e2014-05-06 14:39:01 +09001585
1586 if (sched->next_shortname1 < 'Z') {
1587 sched->next_shortname1++;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001588 } else {
Dongsheng6bcab4e2014-05-06 14:39:01 +09001589 sched->next_shortname1 = 'A';
1590 if (sched->next_shortname2 < '9')
1591 sched->next_shortname2++;
1592 else
1593 sched->next_shortname2 = '0';
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001594 }
1595 }
1596 new_shortname = 1;
1597 }
1598
Jiri Olsa99623c62016-04-12 15:29:26 +02001599 for (i = 0; i < cpus_nr; i++) {
1600 int cpu = sched->map.comp ? sched->map.comp_cpus[i] : i;
Jiri Olsaa151a372016-04-12 15:29:29 +02001601 struct thread *curr_thread = sched->curr_thread[cpu];
Changbin Du8640da92018-03-06 11:37:36 +08001602 struct thread_runtime *curr_tr;
Jiri Olsaa151a372016-04-12 15:29:29 +02001603 const char *pid_color = color;
Jiri Olsacf294f22016-04-12 15:29:30 +02001604 const char *cpu_color = color;
Jiri Olsaa151a372016-04-12 15:29:29 +02001605
1606 if (curr_thread && thread__has_color(curr_thread))
1607 pid_color = COLOR_PIDS;
Jiri Olsa99623c62016-04-12 15:29:26 +02001608
Jiri Olsa73643bb2016-04-12 15:29:31 +02001609 if (sched->map.cpus && !cpu_map__has(sched->map.cpus, cpu))
1610 continue;
1611
Jiri Olsacf294f22016-04-12 15:29:30 +02001612 if (sched->map.color_cpus && cpu_map__has(sched->map.color_cpus, cpu))
1613 cpu_color = COLOR_CPUS;
1614
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001615 if (cpu != this_cpu)
Namhyung Kim1208bb22016-10-24 11:02:43 +09001616 color_fprintf(stdout, color, " ");
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001617 else
Jiri Olsacf294f22016-04-12 15:29:30 +02001618 color_fprintf(stdout, cpu_color, "*");
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001619
Changbin Du8640da92018-03-06 11:37:36 +08001620 if (sched->curr_thread[cpu]) {
1621 curr_tr = thread__get_runtime(sched->curr_thread[cpu]);
1622 if (curr_tr == NULL) {
1623 thread__put(sched_in);
1624 return -1;
1625 }
1626 color_fprintf(stdout, pid_color, "%2s ", curr_tr->shortname);
1627 } else
Jiri Olsa8cd91192016-04-12 15:29:27 +02001628 color_fprintf(stdout, color, " ");
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001629 }
1630
Jiri Olsa73643bb2016-04-12 15:29:31 +02001631 if (sched->map.cpus && !cpu_map__has(sched->map.cpus, this_cpu))
1632 goto out;
1633
Namhyung Kim99620a52016-10-24 11:02:45 +09001634 timestamp__scnprintf_usec(timestamp, stimestamp, sizeof(stimestamp));
1635 color_fprintf(stdout, color, " %12s secs ", stimestamp);
Changbin Du99a3c3a2018-03-06 11:37:37 +08001636 if (new_shortname || tr->comm_changed || (verbose > 0 && sched_in->tid)) {
Jiri Olsaa151a372016-04-12 15:29:29 +02001637 const char *pid_color = color;
1638
1639 if (thread__has_color(sched_in))
1640 pid_color = COLOR_PIDS;
1641
1642 color_fprintf(stdout, pid_color, "%s => %s:%d",
Changbin Du8640da92018-03-06 11:37:36 +08001643 tr->shortname, thread__comm_str(sched_in), sched_in->tid);
Changbin Du99a3c3a2018-03-06 11:37:37 +08001644 tr->comm_changed = false;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001645 }
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001646
Jiri Olsa99623c62016-04-12 15:29:26 +02001647 if (sched->map.comp && new_cpu)
Jiri Olsa8cd91192016-04-12 15:29:27 +02001648 color_fprintf(stdout, color, " (CPU %d)", this_cpu);
Jiri Olsa99623c62016-04-12 15:29:26 +02001649
Jiri Olsa73643bb2016-04-12 15:29:31 +02001650out:
Jiri Olsa8cd91192016-04-12 15:29:27 +02001651 color_fprintf(stdout, color, "\n");
Jiri Olsa99623c62016-04-12 15:29:26 +02001652
Arnaldo Carvalho de Melob91fc392015-04-06 20:43:22 -03001653 thread__put(sched_in);
1654
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001655 return 0;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02001656}
1657
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001658static int process_sched_switch_event(struct perf_tool *tool,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001659 struct evsel *evsel,
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001660 struct perf_sample *sample,
Arnaldo Carvalho de Melo4218e672012-09-11 13:18:47 -03001661 struct machine *machine)
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001662{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001663 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001664 int this_cpu = sample->cpu, err = 0;
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001665 u32 prev_pid = perf_evsel__intval(evsel, sample, "prev_pid"),
1666 next_pid = perf_evsel__intval(evsel, sample, "next_pid");
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001667
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001668 if (sched->curr_pid[this_cpu] != (u32)-1) {
Ingo Molnarc8a37752009-09-16 14:07:00 +02001669 /*
1670 * Are we trying to switch away a PID that is
1671 * not current?
1672 */
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001673 if (sched->curr_pid[this_cpu] != prev_pid)
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001674 sched->nr_context_switch_bugs++;
Ingo Molnarc8a37752009-09-16 14:07:00 +02001675 }
Ingo Molnarc8a37752009-09-16 14:07:00 +02001676
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001677 if (sched->tp_handler->switch_event)
1678 err = sched->tp_handler->switch_event(sched, evsel, sample, machine);
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001679
1680 sched->curr_pid[this_cpu] = next_pid;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001681 return err;
Frederic Weisbecker419ab0d2009-09-12 03:59:01 +02001682}
1683
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001684static int process_sched_runtime_event(struct perf_tool *tool,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001685 struct evsel *evsel,
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001686 struct perf_sample *sample,
Arnaldo Carvalho de Melo4218e672012-09-11 13:18:47 -03001687 struct machine *machine)
mingo39aeb522009-09-14 20:04:48 +02001688{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001689 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
mingo39aeb522009-09-14 20:04:48 +02001690
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001691 if (sched->tp_handler->runtime_event)
1692 return sched->tp_handler->runtime_event(sched, evsel, sample, machine);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001693
1694 return 0;
Ingo Molnarec156762009-09-11 12:12:54 +02001695}
1696
David Aherncb627502013-08-07 22:50:47 -04001697static int perf_sched__process_fork_event(struct perf_tool *tool,
1698 union perf_event *event,
1699 struct perf_sample *sample,
1700 struct machine *machine)
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001701{
1702 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
1703
David Aherncb627502013-08-07 22:50:47 -04001704 /* run the fork event through the perf machineruy */
1705 perf_event__process_fork(tool, event, sample, machine);
1706
1707 /* and then run additional processing needed for this command */
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001708 if (sched->tp_handler->fork_event)
David Aherncb627502013-08-07 22:50:47 -04001709 return sched->tp_handler->fork_event(sched, event, machine);
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001710
1711 return 0;
1712}
1713
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001714static int process_sched_migrate_task_event(struct perf_tool *tool,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001715 struct evsel *evsel,
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001716 struct perf_sample *sample,
Arnaldo Carvalho de Melo4218e672012-09-11 13:18:47 -03001717 struct machine *machine)
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001718{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03001719 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001720
Arnaldo Carvalho de Melo9ec3f4e2012-09-11 19:29:17 -03001721 if (sched->tp_handler->migrate_task_event)
1722 return sched->tp_handler->migrate_task_event(sched, evsel, sample, machine);
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001723
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001724 return 0;
Mike Galbraith55ffb7a2009-10-10 14:46:04 +02001725}
1726
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001727typedef int (*tracepoint_handler)(struct perf_tool *tool,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001728 struct evsel *evsel,
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001729 struct perf_sample *sample,
Arnaldo Carvalho de Melo4218e672012-09-11 13:18:47 -03001730 struct machine *machine);
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001731
Irina Tirdea1d037ca2012-09-11 01:15:03 +03001732static int perf_sched__process_tracepoint_sample(struct perf_tool *tool __maybe_unused,
1733 union perf_event *event __maybe_unused,
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001734 struct perf_sample *sample,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001735 struct evsel *evsel,
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001736 struct machine *machine)
Ingo Molnarec156762009-09-11 12:12:54 +02001737{
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001738 int err = 0;
Ingo Molnarec156762009-09-11 12:12:54 +02001739
Arnaldo Carvalho de Melo744a9712013-11-06 10:17:38 -03001740 if (evsel->handler != NULL) {
1741 tracepoint_handler f = evsel->handler;
Arnaldo Carvalho de Melo2b7fcbc2012-09-11 19:29:17 -03001742 err = f(tool, evsel, sample, machine);
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001743 }
Ingo Molnar0a02ad92009-09-11 12:12:54 +02001744
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001745 return err;
Ingo Molnar0a02ad92009-09-11 12:12:54 +02001746}
1747
Changbin Du99a3c3a2018-03-06 11:37:37 +08001748static int perf_sched__process_comm(struct perf_tool *tool __maybe_unused,
1749 union perf_event *event,
1750 struct perf_sample *sample,
1751 struct machine *machine)
1752{
1753 struct thread *thread;
1754 struct thread_runtime *tr;
1755 int err;
1756
1757 err = perf_event__process_comm(tool, event, sample, machine);
1758 if (err)
1759 return err;
1760
1761 thread = machine__find_thread(machine, sample->pid, sample->tid);
1762 if (!thread) {
1763 pr_err("Internal error: can't find thread\n");
1764 return -1;
1765 }
1766
1767 tr = thread__get_runtime(thread);
1768 if (tr == NULL) {
1769 thread__put(thread);
1770 return -1;
1771 }
1772
1773 tr->comm_changed = true;
1774 thread__put(thread);
1775
1776 return 0;
1777}
1778
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03001779static int perf_sched__read_events(struct perf_sched *sched)
Ingo Molnar0a02ad92009-09-11 12:12:54 +02001780{
Jiri Olsa32dcd022019-07-21 13:23:51 +02001781 const struct evsel_str_handler handlers[] = {
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001782 { "sched:sched_switch", process_sched_switch_event, },
1783 { "sched:sched_stat_runtime", process_sched_runtime_event, },
1784 { "sched:sched_wakeup", process_sched_wakeup_event, },
1785 { "sched:sched_wakeup_new", process_sched_wakeup_event, },
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001786 { "sched:sched_migrate_task", process_sched_migrate_task_event, },
1787 };
Arnaldo Carvalho de Meloda378962012-06-27 13:08:42 -03001788 struct perf_session *session;
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001789 struct perf_data data = {
Jiri Olsa2d4f2792019-02-21 10:41:30 +01001790 .path = input_name,
1791 .mode = PERF_DATA_MODE_READ,
1792 .force = sched->force,
Jiri Olsaf5fc14122013-10-15 16:27:32 +02001793 };
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03001794 int rc = -1;
Arnaldo Carvalho de Meloda378962012-06-27 13:08:42 -03001795
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01001796 session = perf_session__new(&data, false, &sched->tool);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001797 if (session == NULL) {
1798 pr_debug("No Memory for session\n");
1799 return -1;
1800 }
Arnaldo Carvalho de Melo94c744b2009-12-11 21:24:02 -02001801
Namhyung Kim0a7e6d12014-08-12 15:40:45 +09001802 symbol__init(&session->header.env);
Namhyung Kim04934102014-08-12 15:40:41 +09001803
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001804 if (perf_session__set_tracepoints_handlers(session, handlers))
1805 goto out_delete;
Arnaldo Carvalho de Meloee29be62011-11-28 17:57:40 -02001806
Arnaldo Carvalho de Melocee75ac2010-05-14 13:16:55 -03001807 if (perf_session__has_traces(session, "record -R")) {
Arnaldo Carvalho de Melob7b61cb2015-03-03 11:58:45 -03001808 int err = perf_session__process_events(session);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001809 if (err) {
1810 pr_err("Failed to process events, error %d", err);
1811 goto out_delete;
1812 }
Jiri Olsa4c09baf2011-08-08 23:03:34 +02001813
Arnaldo Carvalho de Melo75be9892015-02-14 14:50:11 -03001814 sched->nr_events = session->evlist->stats.nr_events[0];
1815 sched->nr_lost_events = session->evlist->stats.total_lost;
1816 sched->nr_lost_chunks = session->evlist->stats.nr_events[PERF_RECORD_LOST];
Arnaldo Carvalho de Melocee75ac2010-05-14 13:16:55 -03001817 }
Arnaldo Carvalho de Melod549c7692009-12-27 21:37:02 -02001818
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03001819 rc = 0;
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03001820out_delete:
1821 perf_session__delete(session);
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03001822 return rc;
Ingo Molnar0a02ad92009-09-11 12:12:54 +02001823}
1824
David Ahern49394a22016-11-16 15:06:29 +09001825/*
1826 * scheduling times are printed as msec.usec
1827 */
1828static inline void print_sched_time(unsigned long long nsecs, int width)
1829{
1830 unsigned long msecs;
1831 unsigned long usecs;
1832
1833 msecs = nsecs / NSEC_PER_MSEC;
1834 nsecs -= msecs * NSEC_PER_MSEC;
1835 usecs = nsecs / NSEC_PER_USEC;
1836 printf("%*lu.%03lu ", width, msecs, usecs);
1837}
1838
1839/*
1840 * returns runtime data for event, allocating memory for it the
1841 * first time it is used.
1842 */
Jiri Olsa32dcd022019-07-21 13:23:51 +02001843static struct evsel_runtime *perf_evsel__get_runtime(struct evsel *evsel)
David Ahern49394a22016-11-16 15:06:29 +09001844{
1845 struct evsel_runtime *r = evsel->priv;
1846
1847 if (r == NULL) {
1848 r = zalloc(sizeof(struct evsel_runtime));
1849 evsel->priv = r;
1850 }
1851
1852 return r;
1853}
1854
1855/*
1856 * save last time event was seen per cpu
1857 */
Jiri Olsa32dcd022019-07-21 13:23:51 +02001858static void perf_evsel__save_time(struct evsel *evsel,
David Ahern49394a22016-11-16 15:06:29 +09001859 u64 timestamp, u32 cpu)
1860{
1861 struct evsel_runtime *r = perf_evsel__get_runtime(evsel);
1862
1863 if (r == NULL)
1864 return;
1865
1866 if ((cpu >= r->ncpu) || (r->last_time == NULL)) {
1867 int i, n = __roundup_pow_of_two(cpu+1);
1868 void *p = r->last_time;
1869
1870 p = realloc(r->last_time, n * sizeof(u64));
1871 if (!p)
1872 return;
1873
1874 r->last_time = p;
1875 for (i = r->ncpu; i < n; ++i)
1876 r->last_time[i] = (u64) 0;
1877
1878 r->ncpu = n;
1879 }
1880
1881 r->last_time[cpu] = timestamp;
1882}
1883
1884/* returns last time this event was seen on the given cpu */
Jiri Olsa32dcd022019-07-21 13:23:51 +02001885static u64 perf_evsel__get_time(struct evsel *evsel, u32 cpu)
David Ahern49394a22016-11-16 15:06:29 +09001886{
1887 struct evsel_runtime *r = perf_evsel__get_runtime(evsel);
1888
1889 if ((r == NULL) || (r->last_time == NULL) || (cpu >= r->ncpu))
1890 return 0;
1891
1892 return r->last_time[cpu];
1893}
1894
Namhyung Kim9b8087d2016-12-22 15:03:48 +09001895static int comm_width = 30;
David Ahern49394a22016-11-16 15:06:29 +09001896
1897static char *timehist_get_commstr(struct thread *thread)
1898{
1899 static char str[32];
1900 const char *comm = thread__comm_str(thread);
1901 pid_t tid = thread->tid;
1902 pid_t pid = thread->pid_;
1903 int n;
1904
1905 if (pid == 0)
1906 n = scnprintf(str, sizeof(str), "%s", comm);
1907
1908 else if (tid != pid)
1909 n = scnprintf(str, sizeof(str), "%s[%d/%d]", comm, tid, pid);
1910
1911 else
1912 n = scnprintf(str, sizeof(str), "%s[%d]", comm, tid);
1913
1914 if (n > comm_width)
1915 comm_width = n;
1916
1917 return str;
1918}
1919
David Aherna407b062016-11-16 15:06:33 +09001920static void timehist_header(struct perf_sched *sched)
David Ahern49394a22016-11-16 15:06:29 +09001921{
David Aherna407b062016-11-16 15:06:33 +09001922 u32 ncpus = sched->max_cpu + 1;
1923 u32 i, j;
1924
David Ahern49394a22016-11-16 15:06:29 +09001925 printf("%15s %6s ", "time", "cpu");
1926
David Aherna407b062016-11-16 15:06:33 +09001927 if (sched->show_cpu_visual) {
1928 printf(" ");
1929 for (i = 0, j = 0; i < ncpus; ++i) {
1930 printf("%x", j++);
1931 if (j > 15)
1932 j = 0;
1933 }
1934 printf(" ");
1935 }
1936
Namhyung Kim0e6758e2016-12-22 15:03:48 +09001937 printf(" %-*s %9s %9s %9s", comm_width,
David Ahern49394a22016-11-16 15:06:29 +09001938 "task name", "wait time", "sch delay", "run time");
1939
Namhyung Kim414e0502017-01-13 19:45:22 +09001940 if (sched->show_state)
1941 printf(" %s", "state");
1942
David Ahern49394a22016-11-16 15:06:29 +09001943 printf("\n");
1944
1945 /*
1946 * units row
1947 */
1948 printf("%15s %-6s ", "", "");
1949
David Aherna407b062016-11-16 15:06:33 +09001950 if (sched->show_cpu_visual)
1951 printf(" %*s ", ncpus, "");
1952
Namhyung Kim414e0502017-01-13 19:45:22 +09001953 printf(" %-*s %9s %9s %9s", comm_width,
Namhyung Kim0e6758e2016-12-22 15:03:48 +09001954 "[tid/pid]", "(msec)", "(msec)", "(msec)");
David Ahern49394a22016-11-16 15:06:29 +09001955
Namhyung Kim414e0502017-01-13 19:45:22 +09001956 if (sched->show_state)
1957 printf(" %5s", "");
1958
1959 printf("\n");
1960
David Ahern49394a22016-11-16 15:06:29 +09001961 /*
1962 * separator
1963 */
1964 printf("%.15s %.6s ", graph_dotted_line, graph_dotted_line);
1965
David Aherna407b062016-11-16 15:06:33 +09001966 if (sched->show_cpu_visual)
1967 printf(" %.*s ", ncpus, graph_dotted_line);
1968
Namhyung Kim0e6758e2016-12-22 15:03:48 +09001969 printf(" %.*s %.9s %.9s %.9s", comm_width,
David Ahern49394a22016-11-16 15:06:29 +09001970 graph_dotted_line, graph_dotted_line, graph_dotted_line,
1971 graph_dotted_line);
1972
Namhyung Kim414e0502017-01-13 19:45:22 +09001973 if (sched->show_state)
1974 printf(" %.5s", graph_dotted_line);
1975
David Ahern49394a22016-11-16 15:06:29 +09001976 printf("\n");
1977}
1978
Namhyung Kim414e0502017-01-13 19:45:22 +09001979static char task_state_char(struct thread *thread, int state)
1980{
1981 static const char state_to_char[] = TASK_STATE_TO_CHAR_STR;
1982 unsigned bit = state ? ffs(state) : 0;
1983
1984 /* 'I' for idle */
1985 if (thread->tid == 0)
1986 return 'I';
1987
1988 return bit < sizeof(state_to_char) - 1 ? state_to_char[bit] : '?';
1989}
1990
David Ahernfc1469f2016-11-16 15:06:31 +09001991static void timehist_print_sample(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02001992 struct evsel *evsel,
David Ahernfc1469f2016-11-16 15:06:31 +09001993 struct perf_sample *sample,
David Ahern6c973c92016-11-16 15:06:32 +09001994 struct addr_location *al,
David Ahern853b7402016-11-29 10:15:44 -07001995 struct thread *thread,
Namhyung Kim414e0502017-01-13 19:45:22 +09001996 u64 t, int state)
David Ahern49394a22016-11-16 15:06:29 +09001997{
1998 struct thread_runtime *tr = thread__priv(thread);
Brendan Gregg292c4a82017-03-14 01:56:29 +00001999 const char *next_comm = perf_evsel__strval(evsel, sample, "next_comm");
2000 const u32 next_pid = perf_evsel__intval(evsel, sample, "next_pid");
David Aherna407b062016-11-16 15:06:33 +09002001 u32 max_cpus = sched->max_cpu + 1;
David Ahern49394a22016-11-16 15:06:29 +09002002 char tstr[64];
Brendan Gregg292c4a82017-03-14 01:56:29 +00002003 char nstr[30];
Namhyung Kim941bdea2017-01-13 19:45:21 +09002004 u64 wait_time;
David Ahern49394a22016-11-16 15:06:29 +09002005
David Ahern853b7402016-11-29 10:15:44 -07002006 timestamp__scnprintf_usec(t, tstr, sizeof(tstr));
David Ahern49394a22016-11-16 15:06:29 +09002007 printf("%15s [%04d] ", tstr, sample->cpu);
2008
David Aherna407b062016-11-16 15:06:33 +09002009 if (sched->show_cpu_visual) {
2010 u32 i;
2011 char c;
2012
2013 printf(" ");
2014 for (i = 0; i < max_cpus; ++i) {
2015 /* flag idle times with 'i'; others are sched events */
2016 if (i == sample->cpu)
2017 c = (thread->tid == 0) ? 'i' : 's';
2018 else
2019 c = ' ';
2020 printf("%c", c);
2021 }
2022 printf(" ");
2023 }
2024
David Ahern49394a22016-11-16 15:06:29 +09002025 printf(" %-*s ", comm_width, timehist_get_commstr(thread));
2026
Namhyung Kim941bdea2017-01-13 19:45:21 +09002027 wait_time = tr->dt_sleep + tr->dt_iowait + tr->dt_preempt;
2028 print_sched_time(wait_time, 6);
2029
David Ahern49394a22016-11-16 15:06:29 +09002030 print_sched_time(tr->dt_delay, 6);
2031 print_sched_time(tr->dt_run, 6);
David Ahernfc1469f2016-11-16 15:06:31 +09002032
Namhyung Kim414e0502017-01-13 19:45:22 +09002033 if (sched->show_state)
2034 printf(" %5c ", task_state_char(thread, state));
2035
Brendan Gregg292c4a82017-03-14 01:56:29 +00002036 if (sched->show_next) {
2037 snprintf(nstr, sizeof(nstr), "next: %s[%d]", next_comm, next_pid);
2038 printf(" %-*s", comm_width, nstr);
2039 }
2040
2041 if (sched->show_wakeups && !sched->show_next)
David Ahernfc1469f2016-11-16 15:06:31 +09002042 printf(" %-*s", comm_width, "");
2043
David Ahern6c973c92016-11-16 15:06:32 +09002044 if (thread->tid == 0)
2045 goto out;
2046
2047 if (sched->show_callchain)
2048 printf(" ");
2049
2050 sample__fprintf_sym(sample, al, 0,
2051 EVSEL__PRINT_SYM | EVSEL__PRINT_ONELINE |
Namhyung Kim2d9bbf62016-11-24 10:11:13 +09002052 EVSEL__PRINT_CALLCHAIN_ARROW |
2053 EVSEL__PRINT_SKIP_IGNORED,
David Ahern6c973c92016-11-16 15:06:32 +09002054 &callchain_cursor, stdout);
2055
2056out:
David Ahern49394a22016-11-16 15:06:29 +09002057 printf("\n");
2058}
2059
2060/*
2061 * Explanation of delta-time stats:
2062 *
2063 * t = time of current schedule out event
2064 * tprev = time of previous sched out event
2065 * also time of schedule-in event for current task
2066 * last_time = time of last sched change event for current task
2067 * (i.e, time process was last scheduled out)
2068 * ready_to_run = time of wakeup for current task
2069 *
2070 * -----|------------|------------|------------|------
2071 * last ready tprev t
2072 * time to run
2073 *
2074 * |-------- dt_wait --------|
2075 * |- dt_delay -|-- dt_run --|
2076 *
2077 * dt_run = run time of current task
2078 * dt_wait = time between last schedule out event for task and tprev
2079 * represents time spent off the cpu
2080 * dt_delay = time between wakeup and schedule-in of task
2081 */
2082
2083static void timehist_update_runtime_stats(struct thread_runtime *r,
2084 u64 t, u64 tprev)
2085{
2086 r->dt_delay = 0;
Namhyung Kim941bdea2017-01-13 19:45:21 +09002087 r->dt_sleep = 0;
2088 r->dt_iowait = 0;
2089 r->dt_preempt = 0;
David Ahern49394a22016-11-16 15:06:29 +09002090 r->dt_run = 0;
Namhyung Kim941bdea2017-01-13 19:45:21 +09002091
David Ahern49394a22016-11-16 15:06:29 +09002092 if (tprev) {
2093 r->dt_run = t - tprev;
2094 if (r->ready_to_run) {
2095 if (r->ready_to_run > tprev)
2096 pr_debug("time travel: wakeup time for task > previous sched_switch event\n");
2097 else
2098 r->dt_delay = tprev - r->ready_to_run;
2099 }
2100
2101 if (r->last_time > tprev)
2102 pr_debug("time travel: last sched out time for task > previous sched_switch event\n");
Namhyung Kim941bdea2017-01-13 19:45:21 +09002103 else if (r->last_time) {
2104 u64 dt_wait = tprev - r->last_time;
2105
2106 if (r->last_state == TASK_RUNNING)
2107 r->dt_preempt = dt_wait;
2108 else if (r->last_state == TASK_UNINTERRUPTIBLE)
2109 r->dt_iowait = dt_wait;
2110 else
2111 r->dt_sleep = dt_wait;
2112 }
David Ahern49394a22016-11-16 15:06:29 +09002113 }
2114
2115 update_stats(&r->run_stats, r->dt_run);
Namhyung Kim587782c2017-01-13 19:45:23 +09002116
2117 r->total_run_time += r->dt_run;
2118 r->total_delay_time += r->dt_delay;
2119 r->total_sleep_time += r->dt_sleep;
2120 r->total_iowait_time += r->dt_iowait;
2121 r->total_preempt_time += r->dt_preempt;
David Ahern49394a22016-11-16 15:06:29 +09002122}
2123
Namhyung Kim96039c72016-12-08 23:47:50 +09002124static bool is_idle_sample(struct perf_sample *sample,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002125 struct evsel *evsel)
David Ahern49394a22016-11-16 15:06:29 +09002126{
2127 /* pid 0 == swapper == idle task */
Namhyung Kim96039c72016-12-08 23:47:50 +09002128 if (strcmp(perf_evsel__name(evsel), "sched:sched_switch") == 0)
2129 return perf_evsel__intval(evsel, sample, "prev_pid") == 0;
David Ahern49394a22016-11-16 15:06:29 +09002130
Namhyung Kim96039c72016-12-08 23:47:50 +09002131 return sample->pid == 0;
2132}
2133
2134static void save_task_callchain(struct perf_sched *sched,
2135 struct perf_sample *sample,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002136 struct evsel *evsel,
Namhyung Kim96039c72016-12-08 23:47:50 +09002137 struct machine *machine)
2138{
2139 struct callchain_cursor *cursor = &callchain_cursor;
2140 struct thread *thread;
David Ahern6c973c92016-11-16 15:06:32 +09002141
2142 /* want main thread for process - has maps */
2143 thread = machine__findnew_thread(machine, sample->pid, sample->pid);
2144 if (thread == NULL) {
2145 pr_debug("Failed to get thread for pid %d.\n", sample->pid);
Namhyung Kim96039c72016-12-08 23:47:50 +09002146 return;
David Ahern6c973c92016-11-16 15:06:32 +09002147 }
2148
Arnaldo Carvalho de Melo4c505632018-05-28 16:07:56 -03002149 if (!sched->show_callchain || sample->callchain == NULL)
Namhyung Kim96039c72016-12-08 23:47:50 +09002150 return;
David Ahern6c973c92016-11-16 15:06:32 +09002151
2152 if (thread__resolve_callchain(thread, cursor, evsel, sample,
Namhyung Kim8388deb2016-11-24 10:11:14 +09002153 NULL, NULL, sched->max_stack + 2) != 0) {
Namhyung Kimbb963e12017-02-17 17:17:38 +09002154 if (verbose > 0)
Arnaldo Carvalho de Melo62d94b02017-06-27 11:22:31 -03002155 pr_err("Failed to resolve callchain. Skipping\n");
David Ahern6c973c92016-11-16 15:06:32 +09002156
Namhyung Kim96039c72016-12-08 23:47:50 +09002157 return;
David Ahern6c973c92016-11-16 15:06:32 +09002158 }
Namhyung Kimcdeb01b2016-11-24 10:11:12 +09002159
David Ahern6c973c92016-11-16 15:06:32 +09002160 callchain_cursor_commit(cursor);
Namhyung Kimcdeb01b2016-11-24 10:11:12 +09002161
2162 while (true) {
2163 struct callchain_cursor_node *node;
2164 struct symbol *sym;
2165
2166 node = callchain_cursor_current(cursor);
2167 if (node == NULL)
2168 break;
2169
2170 sym = node->sym;
Arnaldo Carvalho de Meloa7c38992017-02-13 16:52:15 -03002171 if (sym) {
Namhyung Kimcdeb01b2016-11-24 10:11:12 +09002172 if (!strcmp(sym->name, "schedule") ||
2173 !strcmp(sym->name, "__schedule") ||
2174 !strcmp(sym->name, "preempt_schedule"))
2175 sym->ignore = 1;
2176 }
2177
2178 callchain_cursor_advance(cursor);
2179 }
David Ahern49394a22016-11-16 15:06:29 +09002180}
2181
Namhyung Kim3bc2fa92016-12-08 23:47:51 +09002182static int init_idle_thread(struct thread *thread)
2183{
2184 struct idle_thread_runtime *itr;
2185
2186 thread__set_comm(thread, idle_comm, 0);
2187
2188 itr = zalloc(sizeof(*itr));
2189 if (itr == NULL)
2190 return -ENOMEM;
2191
2192 init_stats(&itr->tr.run_stats);
2193 callchain_init(&itr->callchain);
2194 callchain_cursor_reset(&itr->cursor);
2195 thread__set_priv(thread, itr);
2196
2197 return 0;
2198}
2199
David Ahern49394a22016-11-16 15:06:29 +09002200/*
2201 * Track idle stats per cpu by maintaining a local thread
2202 * struct for the idle task on each cpu.
2203 */
2204static int init_idle_threads(int ncpu)
2205{
Namhyung Kim3bc2fa92016-12-08 23:47:51 +09002206 int i, ret;
David Ahern49394a22016-11-16 15:06:29 +09002207
2208 idle_threads = zalloc(ncpu * sizeof(struct thread *));
2209 if (!idle_threads)
2210 return -ENOMEM;
2211
Namhyung Kimb3363522016-12-06 12:40:05 +09002212 idle_max_cpu = ncpu;
David Ahern49394a22016-11-16 15:06:29 +09002213
2214 /* allocate the actual thread struct if needed */
2215 for (i = 0; i < ncpu; ++i) {
2216 idle_threads[i] = thread__new(0, 0);
2217 if (idle_threads[i] == NULL)
2218 return -ENOMEM;
2219
Namhyung Kim3bc2fa92016-12-08 23:47:51 +09002220 ret = init_idle_thread(idle_threads[i]);
2221 if (ret < 0)
2222 return ret;
David Ahern49394a22016-11-16 15:06:29 +09002223 }
2224
2225 return 0;
2226}
2227
2228static void free_idle_threads(void)
2229{
2230 int i;
2231
2232 if (idle_threads == NULL)
2233 return;
2234
Namhyung Kimb3363522016-12-06 12:40:05 +09002235 for (i = 0; i < idle_max_cpu; ++i) {
David Ahern49394a22016-11-16 15:06:29 +09002236 if ((idle_threads[i]))
2237 thread__delete(idle_threads[i]);
2238 }
2239
2240 free(idle_threads);
2241}
2242
2243static struct thread *get_idle_thread(int cpu)
2244{
2245 /*
2246 * expand/allocate array of pointers to local thread
2247 * structs if needed
2248 */
2249 if ((cpu >= idle_max_cpu) || (idle_threads == NULL)) {
2250 int i, j = __roundup_pow_of_two(cpu+1);
2251 void *p;
2252
2253 p = realloc(idle_threads, j * sizeof(struct thread *));
2254 if (!p)
2255 return NULL;
2256
2257 idle_threads = (struct thread **) p;
Namhyung Kimb3363522016-12-06 12:40:05 +09002258 for (i = idle_max_cpu; i < j; ++i)
David Ahern49394a22016-11-16 15:06:29 +09002259 idle_threads[i] = NULL;
2260
2261 idle_max_cpu = j;
2262 }
2263
2264 /* allocate a new thread struct if needed */
2265 if (idle_threads[cpu] == NULL) {
2266 idle_threads[cpu] = thread__new(0, 0);
2267
2268 if (idle_threads[cpu]) {
Namhyung Kim3bc2fa92016-12-08 23:47:51 +09002269 if (init_idle_thread(idle_threads[cpu]) < 0)
2270 return NULL;
David Ahern49394a22016-11-16 15:06:29 +09002271 }
2272 }
2273
2274 return idle_threads[cpu];
2275}
2276
Arnaldo Carvalho de Melo4c505632018-05-28 16:07:56 -03002277static void save_idle_callchain(struct perf_sched *sched,
2278 struct idle_thread_runtime *itr,
Namhyung Kim699b5b92016-12-08 23:47:52 +09002279 struct perf_sample *sample)
2280{
Arnaldo Carvalho de Melo4c505632018-05-28 16:07:56 -03002281 if (!sched->show_callchain || sample->callchain == NULL)
Namhyung Kim699b5b92016-12-08 23:47:52 +09002282 return;
2283
2284 callchain_cursor__copy(&itr->cursor, &callchain_cursor);
2285}
2286
David Ahern6c973c92016-11-16 15:06:32 +09002287static struct thread *timehist_get_thread(struct perf_sched *sched,
2288 struct perf_sample *sample,
David Ahern49394a22016-11-16 15:06:29 +09002289 struct machine *machine,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002290 struct evsel *evsel)
David Ahern49394a22016-11-16 15:06:29 +09002291{
2292 struct thread *thread;
2293
Namhyung Kim96039c72016-12-08 23:47:50 +09002294 if (is_idle_sample(sample, evsel)) {
David Ahern49394a22016-11-16 15:06:29 +09002295 thread = get_idle_thread(sample->cpu);
2296 if (thread == NULL)
2297 pr_err("Failed to get idle thread for cpu %d.\n", sample->cpu);
2298
2299 } else {
Namhyung Kim5d92d962016-12-06 12:40:03 +09002300 /* there were samples with tid 0 but non-zero pid */
2301 thread = machine__findnew_thread(machine, sample->pid,
2302 sample->tid ?: sample->pid);
David Ahern49394a22016-11-16 15:06:29 +09002303 if (thread == NULL) {
2304 pr_debug("Failed to get thread for tid %d. skipping sample.\n",
2305 sample->tid);
2306 }
Namhyung Kim96039c72016-12-08 23:47:50 +09002307
2308 save_task_callchain(sched, sample, evsel, machine);
Namhyung Kim699b5b92016-12-08 23:47:52 +09002309 if (sched->idle_hist) {
2310 struct thread *idle;
2311 struct idle_thread_runtime *itr;
2312
2313 idle = get_idle_thread(sample->cpu);
2314 if (idle == NULL) {
2315 pr_err("Failed to get idle thread for cpu %d.\n", sample->cpu);
2316 return NULL;
2317 }
2318
2319 itr = thread__priv(idle);
2320 if (itr == NULL)
2321 return NULL;
2322
2323 itr->last_thread = thread;
2324
2325 /* copy task callchain when entering to idle */
2326 if (perf_evsel__intval(evsel, sample, "next_pid") == 0)
Arnaldo Carvalho de Melo4c505632018-05-28 16:07:56 -03002327 save_idle_callchain(sched, itr, sample);
Namhyung Kim699b5b92016-12-08 23:47:52 +09002328 }
David Ahern49394a22016-11-16 15:06:29 +09002329 }
2330
2331 return thread;
2332}
2333
David Ahern52df1382016-11-16 15:06:30 +09002334static bool timehist_skip_sample(struct perf_sched *sched,
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002335 struct thread *thread,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002336 struct evsel *evsel,
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002337 struct perf_sample *sample)
David Ahern49394a22016-11-16 15:06:29 +09002338{
2339 bool rc = false;
2340
David Ahern52df1382016-11-16 15:06:30 +09002341 if (thread__is_filtered(thread)) {
David Ahern49394a22016-11-16 15:06:29 +09002342 rc = true;
David Ahern52df1382016-11-16 15:06:30 +09002343 sched->skipped_samples++;
2344 }
David Ahern49394a22016-11-16 15:06:29 +09002345
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002346 if (sched->idle_hist) {
2347 if (strcmp(perf_evsel__name(evsel), "sched:sched_switch"))
2348 rc = true;
2349 else if (perf_evsel__intval(evsel, sample, "prev_pid") != 0 &&
2350 perf_evsel__intval(evsel, sample, "next_pid") != 0)
2351 rc = true;
2352 }
2353
David Ahern49394a22016-11-16 15:06:29 +09002354 return rc;
2355}
2356
David Ahernfc1469f2016-11-16 15:06:31 +09002357static void timehist_print_wakeup_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002358 struct evsel *evsel,
David Ahernfc1469f2016-11-16 15:06:31 +09002359 struct perf_sample *sample,
2360 struct machine *machine,
2361 struct thread *awakened)
2362{
2363 struct thread *thread;
2364 char tstr[64];
2365
2366 thread = machine__findnew_thread(machine, sample->pid, sample->tid);
2367 if (thread == NULL)
2368 return;
2369
2370 /* show wakeup unless both awakee and awaker are filtered */
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002371 if (timehist_skip_sample(sched, thread, evsel, sample) &&
2372 timehist_skip_sample(sched, awakened, evsel, sample)) {
David Ahernfc1469f2016-11-16 15:06:31 +09002373 return;
2374 }
2375
2376 timestamp__scnprintf_usec(sample->time, tstr, sizeof(tstr));
2377 printf("%15s [%04d] ", tstr, sample->cpu);
David Aherna407b062016-11-16 15:06:33 +09002378 if (sched->show_cpu_visual)
2379 printf(" %*s ", sched->max_cpu + 1, "");
David Ahernfc1469f2016-11-16 15:06:31 +09002380
2381 printf(" %-*s ", comm_width, timehist_get_commstr(thread));
2382
2383 /* dt spacer */
2384 printf(" %9s %9s %9s ", "", "", "");
2385
2386 printf("awakened: %s", timehist_get_commstr(awakened));
2387
2388 printf("\n");
2389}
2390
2391static int timehist_sched_wakeup_event(struct perf_tool *tool,
David Ahern49394a22016-11-16 15:06:29 +09002392 union perf_event *event __maybe_unused,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002393 struct evsel *evsel,
David Ahern49394a22016-11-16 15:06:29 +09002394 struct perf_sample *sample,
2395 struct machine *machine)
2396{
David Ahernfc1469f2016-11-16 15:06:31 +09002397 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
David Ahern49394a22016-11-16 15:06:29 +09002398 struct thread *thread;
2399 struct thread_runtime *tr = NULL;
2400 /* want pid of awakened task not pid in sample */
2401 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
2402
2403 thread = machine__findnew_thread(machine, 0, pid);
2404 if (thread == NULL)
2405 return -1;
2406
2407 tr = thread__get_runtime(thread);
2408 if (tr == NULL)
2409 return -1;
2410
2411 if (tr->ready_to_run == 0)
2412 tr->ready_to_run = sample->time;
2413
David Ahernfc1469f2016-11-16 15:06:31 +09002414 /* show wakeups if requested */
David Ahern853b7402016-11-29 10:15:44 -07002415 if (sched->show_wakeups &&
2416 !perf_time__skip_sample(&sched->ptime, sample->time))
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002417 timehist_print_wakeup_event(sched, evsel, sample, machine, thread);
David Ahernfc1469f2016-11-16 15:06:31 +09002418
David Ahern49394a22016-11-16 15:06:29 +09002419 return 0;
2420}
2421
David Ahern350f54f2016-11-25 09:28:41 -07002422static void timehist_print_migration_event(struct perf_sched *sched,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002423 struct evsel *evsel,
David Ahern350f54f2016-11-25 09:28:41 -07002424 struct perf_sample *sample,
2425 struct machine *machine,
2426 struct thread *migrated)
2427{
2428 struct thread *thread;
2429 char tstr[64];
2430 u32 max_cpus = sched->max_cpu + 1;
2431 u32 ocpu, dcpu;
2432
2433 if (sched->summary_only)
2434 return;
2435
2436 max_cpus = sched->max_cpu + 1;
2437 ocpu = perf_evsel__intval(evsel, sample, "orig_cpu");
2438 dcpu = perf_evsel__intval(evsel, sample, "dest_cpu");
2439
2440 thread = machine__findnew_thread(machine, sample->pid, sample->tid);
2441 if (thread == NULL)
2442 return;
2443
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002444 if (timehist_skip_sample(sched, thread, evsel, sample) &&
2445 timehist_skip_sample(sched, migrated, evsel, sample)) {
David Ahern350f54f2016-11-25 09:28:41 -07002446 return;
2447 }
2448
2449 timestamp__scnprintf_usec(sample->time, tstr, sizeof(tstr));
2450 printf("%15s [%04d] ", tstr, sample->cpu);
2451
2452 if (sched->show_cpu_visual) {
2453 u32 i;
2454 char c;
2455
2456 printf(" ");
2457 for (i = 0; i < max_cpus; ++i) {
2458 c = (i == sample->cpu) ? 'm' : ' ';
2459 printf("%c", c);
2460 }
2461 printf(" ");
2462 }
2463
2464 printf(" %-*s ", comm_width, timehist_get_commstr(thread));
2465
2466 /* dt spacer */
2467 printf(" %9s %9s %9s ", "", "", "");
2468
2469 printf("migrated: %s", timehist_get_commstr(migrated));
2470 printf(" cpu %d => %d", ocpu, dcpu);
2471
2472 printf("\n");
2473}
2474
2475static int timehist_migrate_task_event(struct perf_tool *tool,
2476 union perf_event *event __maybe_unused,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002477 struct evsel *evsel,
David Ahern350f54f2016-11-25 09:28:41 -07002478 struct perf_sample *sample,
2479 struct machine *machine)
2480{
2481 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
2482 struct thread *thread;
2483 struct thread_runtime *tr = NULL;
2484 /* want pid of migrated task not pid in sample */
2485 const u32 pid = perf_evsel__intval(evsel, sample, "pid");
2486
2487 thread = machine__findnew_thread(machine, 0, pid);
2488 if (thread == NULL)
2489 return -1;
2490
2491 tr = thread__get_runtime(thread);
2492 if (tr == NULL)
2493 return -1;
2494
2495 tr->migrations++;
2496
2497 /* show migrations if requested */
2498 timehist_print_migration_event(sched, evsel, sample, machine, thread);
2499
2500 return 0;
2501}
2502
David Ahern52df1382016-11-16 15:06:30 +09002503static int timehist_sched_change_event(struct perf_tool *tool,
David Ahern49394a22016-11-16 15:06:29 +09002504 union perf_event *event,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002505 struct evsel *evsel,
David Ahern49394a22016-11-16 15:06:29 +09002506 struct perf_sample *sample,
2507 struct machine *machine)
2508{
David Ahernfc1469f2016-11-16 15:06:31 +09002509 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
David Ahern853b7402016-11-29 10:15:44 -07002510 struct perf_time_interval *ptime = &sched->ptime;
David Ahern49394a22016-11-16 15:06:29 +09002511 struct addr_location al;
2512 struct thread *thread;
2513 struct thread_runtime *tr = NULL;
David Ahern853b7402016-11-29 10:15:44 -07002514 u64 tprev, t = sample->time;
David Ahern49394a22016-11-16 15:06:29 +09002515 int rc = 0;
Namhyung Kim414e0502017-01-13 19:45:22 +09002516 int state = perf_evsel__intval(evsel, sample, "prev_state");
2517
David Ahern49394a22016-11-16 15:06:29 +09002518
2519 if (machine__resolve(machine, &al, sample) < 0) {
2520 pr_err("problem processing %d event. skipping it\n",
2521 event->header.type);
2522 rc = -1;
2523 goto out;
2524 }
2525
David Ahern6c973c92016-11-16 15:06:32 +09002526 thread = timehist_get_thread(sched, sample, machine, evsel);
David Ahern49394a22016-11-16 15:06:29 +09002527 if (thread == NULL) {
2528 rc = -1;
2529 goto out;
2530 }
2531
Namhyung Kima4b2b6f2016-12-08 23:47:53 +09002532 if (timehist_skip_sample(sched, thread, evsel, sample))
David Ahern49394a22016-11-16 15:06:29 +09002533 goto out;
2534
2535 tr = thread__get_runtime(thread);
2536 if (tr == NULL) {
2537 rc = -1;
2538 goto out;
2539 }
2540
2541 tprev = perf_evsel__get_time(evsel, sample->cpu);
2542
David Ahern853b7402016-11-29 10:15:44 -07002543 /*
2544 * If start time given:
2545 * - sample time is under window user cares about - skip sample
2546 * - tprev is under window user cares about - reset to start of window
2547 */
2548 if (ptime->start && ptime->start > t)
2549 goto out;
2550
Namhyung Kimbdd75722016-12-22 15:03:49 +09002551 if (tprev && ptime->start > tprev)
David Ahern853b7402016-11-29 10:15:44 -07002552 tprev = ptime->start;
2553
2554 /*
2555 * If end time given:
2556 * - previous sched event is out of window - we are done
2557 * - sample time is beyond window user cares about - reset it
2558 * to close out stats for time window interest
2559 */
2560 if (ptime->end) {
2561 if (tprev > ptime->end)
2562 goto out;
2563
2564 if (t > ptime->end)
2565 t = ptime->end;
2566 }
2567
Namhyung Kim07235f82016-12-08 23:47:54 +09002568 if (!sched->idle_hist || thread->tid == 0) {
2569 timehist_update_runtime_stats(tr, t, tprev);
2570
2571 if (sched->idle_hist) {
2572 struct idle_thread_runtime *itr = (void *)tr;
2573 struct thread_runtime *last_tr;
2574
2575 BUG_ON(thread->tid != 0);
2576
2577 if (itr->last_thread == NULL)
2578 goto out;
2579
2580 /* add current idle time as last thread's runtime */
2581 last_tr = thread__get_runtime(itr->last_thread);
2582 if (last_tr == NULL)
2583 goto out;
2584
2585 timehist_update_runtime_stats(last_tr, t, tprev);
2586 /*
2587 * remove delta time of last thread as it's not updated
2588 * and otherwise it will show an invalid value next
2589 * time. we only care total run time and run stat.
2590 */
2591 last_tr->dt_run = 0;
Namhyung Kim07235f82016-12-08 23:47:54 +09002592 last_tr->dt_delay = 0;
Namhyung Kim941bdea2017-01-13 19:45:21 +09002593 last_tr->dt_sleep = 0;
2594 last_tr->dt_iowait = 0;
2595 last_tr->dt_preempt = 0;
Namhyung Kim07235f82016-12-08 23:47:54 +09002596
Namhyung Kimba957eb2016-12-08 23:47:55 +09002597 if (itr->cursor.nr)
2598 callchain_append(&itr->callchain, &itr->cursor, t - tprev);
2599
Namhyung Kim07235f82016-12-08 23:47:54 +09002600 itr->last_thread = NULL;
2601 }
2602 }
David Ahern853b7402016-11-29 10:15:44 -07002603
David Ahern52df1382016-11-16 15:06:30 +09002604 if (!sched->summary_only)
Brendan Gregg292c4a82017-03-14 01:56:29 +00002605 timehist_print_sample(sched, evsel, sample, &al, thread, t, state);
David Ahern49394a22016-11-16 15:06:29 +09002606
2607out:
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002608 if (sched->hist_time.start == 0 && t >= ptime->start)
2609 sched->hist_time.start = t;
2610 if (ptime->end == 0 || t <= ptime->end)
2611 sched->hist_time.end = t;
2612
David Ahern49394a22016-11-16 15:06:29 +09002613 if (tr) {
2614 /* time of this sched_switch event becomes last time task seen */
2615 tr->last_time = sample->time;
2616
Namhyung Kim941bdea2017-01-13 19:45:21 +09002617 /* last state is used to determine where to account wait time */
Namhyung Kim414e0502017-01-13 19:45:22 +09002618 tr->last_state = state;
Namhyung Kim941bdea2017-01-13 19:45:21 +09002619
David Ahern49394a22016-11-16 15:06:29 +09002620 /* sched out event for task so reset ready to run time */
2621 tr->ready_to_run = 0;
2622 }
2623
2624 perf_evsel__save_time(evsel, sample->time, sample->cpu);
2625
2626 return rc;
2627}
2628
/*
 * Handler for sched switch samples; forwards all arguments unchanged
 * to timehist_sched_change_event() and returns its result.
 */
static int timehist_sched_switch_event(struct perf_tool *tool,
			     union perf_event *event,
			     struct evsel *evsel,
			     struct perf_sample *sample,
			     struct machine *machine)
{
	/* @machine is used below, so it must not be marked __maybe_unused */
	return timehist_sched_change_event(tool, event, evsel, sample, machine);
}
2637
2638static int process_lost(struct perf_tool *tool __maybe_unused,
2639 union perf_event *event,
2640 struct perf_sample *sample,
2641 struct machine *machine __maybe_unused)
2642{
2643 char tstr[64];
2644
2645 timestamp__scnprintf_usec(sample->time, tstr, sizeof(tstr));
2646 printf("%15s ", tstr);
Jiri Olsa5290ed62019-08-25 20:17:46 +02002647 printf("lost %" PRI_lu64 " events on cpu %d\n", event->lost.lost, sample->cpu);
David Ahern49394a22016-11-16 15:06:29 +09002648
2649 return 0;
2650}
2651
2652
David Ahern52df1382016-11-16 15:06:30 +09002653static void print_thread_runtime(struct thread *t,
2654 struct thread_runtime *r)
2655{
2656 double mean = avg_stats(&r->run_stats);
2657 float stddev;
2658
2659 printf("%*s %5d %9" PRIu64 " ",
2660 comm_width, timehist_get_commstr(t), t->ppid,
2661 (u64) r->run_stats.n);
2662
2663 print_sched_time(r->total_run_time, 8);
2664 stddev = rel_stddev_stats(stddev_stats(&r->run_stats), mean);
2665 print_sched_time(r->run_stats.min, 6);
2666 printf(" ");
2667 print_sched_time((u64) mean, 6);
2668 printf(" ");
2669 print_sched_time(r->run_stats.max, 6);
2670 printf(" ");
2671 printf("%5.2f", stddev);
David Ahern350f54f2016-11-25 09:28:41 -07002672 printf(" %5" PRIu64, r->migrations);
David Ahern52df1382016-11-16 15:06:30 +09002673 printf("\n");
2674}
2675
Namhyung Kim587782c2017-01-13 19:45:23 +09002676static void print_thread_waittime(struct thread *t,
2677 struct thread_runtime *r)
2678{
2679 printf("%*s %5d %9" PRIu64 " ",
2680 comm_width, timehist_get_commstr(t), t->ppid,
2681 (u64) r->run_stats.n);
2682
2683 print_sched_time(r->total_run_time, 8);
2684 print_sched_time(r->total_sleep_time, 6);
2685 printf(" ");
2686 print_sched_time(r->total_iowait_time, 6);
2687 printf(" ");
2688 print_sched_time(r->total_preempt_time, 6);
2689 printf(" ");
2690 print_sched_time(r->total_delay_time, 6);
2691 printf("\n");
2692}
2693
David Ahern52df1382016-11-16 15:06:30 +09002694struct total_run_stats {
Namhyung Kim587782c2017-01-13 19:45:23 +09002695 struct perf_sched *sched;
David Ahern52df1382016-11-16 15:06:30 +09002696 u64 sched_count;
2697 u64 task_count;
2698 u64 total_run_time;
2699};
2700
2701static int __show_thread_runtime(struct thread *t, void *priv)
2702{
2703 struct total_run_stats *stats = priv;
2704 struct thread_runtime *r;
2705
2706 if (thread__is_filtered(t))
2707 return 0;
2708
2709 r = thread__priv(t);
2710 if (r && r->run_stats.n) {
2711 stats->task_count++;
2712 stats->sched_count += r->run_stats.n;
2713 stats->total_run_time += r->total_run_time;
Namhyung Kim587782c2017-01-13 19:45:23 +09002714
2715 if (stats->sched->show_state)
2716 print_thread_waittime(t, r);
2717 else
2718 print_thread_runtime(t, r);
David Ahern52df1382016-11-16 15:06:30 +09002719 }
2720
2721 return 0;
2722}
2723
2724static int show_thread_runtime(struct thread *t, void *priv)
2725{
2726 if (t->dead)
2727 return 0;
2728
2729 return __show_thread_runtime(t, priv);
2730}
2731
2732static int show_deadthread_runtime(struct thread *t, void *priv)
2733{
2734 if (!t->dead)
2735 return 0;
2736
2737 return __show_thread_runtime(t, priv);
2738}
2739
Namhyung Kimba957eb2016-12-08 23:47:55 +09002740static size_t callchain__fprintf_folded(FILE *fp, struct callchain_node *node)
2741{
2742 const char *sep = " <- ";
2743 struct callchain_list *chain;
2744 size_t ret = 0;
2745 char bf[1024];
2746 bool first;
2747
2748 if (node == NULL)
2749 return 0;
2750
2751 ret = callchain__fprintf_folded(fp, node->parent);
2752 first = (ret == 0);
2753
2754 list_for_each_entry(chain, &node->val, list) {
2755 if (chain->ip >= PERF_CONTEXT_MAX)
2756 continue;
2757 if (chain->ms.sym && chain->ms.sym->ignore)
2758 continue;
2759 ret += fprintf(fp, "%s%s", first ? "" : sep,
2760 callchain_list__sym_name(chain, bf, sizeof(bf),
2761 false));
2762 first = false;
2763 }
2764
2765 return ret;
2766}
2767
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08002768static size_t timehist_print_idlehist_callchain(struct rb_root_cached *root)
Namhyung Kimba957eb2016-12-08 23:47:55 +09002769{
2770 size_t ret = 0;
2771 FILE *fp = stdout;
2772 struct callchain_node *chain;
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08002773 struct rb_node *rb_node = rb_first_cached(root);
Namhyung Kimba957eb2016-12-08 23:47:55 +09002774
2775 printf(" %16s %8s %s\n", "Idle time (msec)", "Count", "Callchains");
2776 printf(" %.16s %.8s %.50s\n", graph_dotted_line, graph_dotted_line,
2777 graph_dotted_line);
2778
2779 while (rb_node) {
2780 chain = rb_entry(rb_node, struct callchain_node, rb_node);
2781 rb_node = rb_next(rb_node);
2782
2783 ret += fprintf(fp, " ");
2784 print_sched_time(chain->hit, 12);
2785 ret += 16; /* print_sched_time returns 2nd arg + 4 */
2786 ret += fprintf(fp, " %8d ", chain->count);
2787 ret += callchain__fprintf_folded(fp, chain);
2788 ret += fprintf(fp, "\n");
2789 }
2790
2791 return ret;
2792}
2793
David Ahern52df1382016-11-16 15:06:30 +09002794static void timehist_print_summary(struct perf_sched *sched,
2795 struct perf_session *session)
2796{
2797 struct machine *m = &session->machines.host;
2798 struct total_run_stats totals;
2799 u64 task_count;
2800 struct thread *t;
2801 struct thread_runtime *r;
2802 int i;
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002803 u64 hist_time = sched->hist_time.end - sched->hist_time.start;
David Ahern52df1382016-11-16 15:06:30 +09002804
2805 memset(&totals, 0, sizeof(totals));
Namhyung Kim587782c2017-01-13 19:45:23 +09002806 totals.sched = sched;
David Ahern52df1382016-11-16 15:06:30 +09002807
Namhyung Kim07235f82016-12-08 23:47:54 +09002808 if (sched->idle_hist) {
2809 printf("\nIdle-time summary\n");
2810 printf("%*s parent sched-out ", comm_width, "comm");
2811 printf(" idle-time min-idle avg-idle max-idle stddev migrations\n");
Namhyung Kim587782c2017-01-13 19:45:23 +09002812 } else if (sched->show_state) {
2813 printf("\nWait-time summary\n");
2814 printf("%*s parent sched-in ", comm_width, "comm");
2815 printf(" run-time sleep iowait preempt delay\n");
Namhyung Kim07235f82016-12-08 23:47:54 +09002816 } else {
2817 printf("\nRuntime summary\n");
2818 printf("%*s parent sched-in ", comm_width, "comm");
2819 printf(" run-time min-run avg-run max-run stddev migrations\n");
2820 }
David Ahern52df1382016-11-16 15:06:30 +09002821 printf("%*s (count) ", comm_width, "");
Namhyung Kim587782c2017-01-13 19:45:23 +09002822 printf(" (msec) (msec) (msec) (msec) %s\n",
2823 sched->show_state ? "(msec)" : "%");
David Ahern350f54f2016-11-25 09:28:41 -07002824 printf("%.117s\n", graph_dotted_line);
David Ahern52df1382016-11-16 15:06:30 +09002825
2826 machine__for_each_thread(m, show_thread_runtime, &totals);
2827 task_count = totals.task_count;
2828 if (!task_count)
2829 printf("<no still running tasks>\n");
2830
2831 printf("\nTerminated tasks:\n");
2832 machine__for_each_thread(m, show_deadthread_runtime, &totals);
2833 if (task_count == totals.task_count)
2834 printf("<no terminated tasks>\n");
2835
2836 /* CPU idle stats not tracked when samples were skipped */
Namhyung Kim07235f82016-12-08 23:47:54 +09002837 if (sched->skipped_samples && !sched->idle_hist)
David Ahern52df1382016-11-16 15:06:30 +09002838 return;
2839
2840 printf("\nIdle stats:\n");
Namhyung Kimb3363522016-12-06 12:40:05 +09002841 for (i = 0; i < idle_max_cpu; ++i) {
David Ahern52df1382016-11-16 15:06:30 +09002842 t = idle_threads[i];
2843 if (!t)
2844 continue;
2845
2846 r = thread__priv(t);
2847 if (r && r->run_stats.n) {
2848 totals.sched_count += r->run_stats.n;
2849 printf(" CPU %2d idle for ", i);
2850 print_sched_time(r->total_run_time, 6);
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002851 printf(" msec (%6.2f%%)\n", 100.0 * r->total_run_time / hist_time);
David Ahern52df1382016-11-16 15:06:30 +09002852 } else
2853 printf(" CPU %2d idle entire time window\n", i);
2854 }
2855
Arnaldo Carvalho de Melo4c505632018-05-28 16:07:56 -03002856 if (sched->idle_hist && sched->show_callchain) {
Namhyung Kimba957eb2016-12-08 23:47:55 +09002857 callchain_param.mode = CHAIN_FOLDED;
2858 callchain_param.value = CCVAL_PERIOD;
2859
2860 callchain_register_param(&callchain_param);
2861
2862 printf("\nIdle stats by callchain:\n");
2863 for (i = 0; i < idle_max_cpu; ++i) {
2864 struct idle_thread_runtime *itr;
2865
2866 t = idle_threads[i];
2867 if (!t)
2868 continue;
2869
2870 itr = thread__priv(t);
2871 if (itr == NULL)
2872 continue;
2873
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08002874 callchain_param.sort(&itr->sorted_root.rb_root, &itr->callchain,
Namhyung Kimba957eb2016-12-08 23:47:55 +09002875 0, &callchain_param);
2876
2877 printf(" CPU %2d:", i);
2878 print_sched_time(itr->tr.total_run_time, 6);
2879 printf(" msec\n");
2880 timehist_print_idlehist_callchain(&itr->sorted_root);
2881 printf("\n");
2882 }
2883 }
2884
David Ahern52df1382016-11-16 15:06:30 +09002885 printf("\n"
2886 " Total number of unique tasks: %" PRIu64 "\n"
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002887 "Total number of context switches: %" PRIu64 "\n",
David Ahern52df1382016-11-16 15:06:30 +09002888 totals.task_count, totals.sched_count);
2889
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002890 printf(" Total run time (msec): ");
David Ahern52df1382016-11-16 15:06:30 +09002891 print_sched_time(totals.total_run_time, 2);
2892 printf("\n");
Namhyung Kim9396c9c2016-12-22 15:03:50 +09002893
2894 printf(" Total scheduling time (msec): ");
2895 print_sched_time(hist_time, 2);
2896 printf(" (x %d)\n", sched->max_cpu);
David Ahern52df1382016-11-16 15:06:30 +09002897}
2898
/*
 * Signature of the per-evsel handlers invoked by
 * perf_timehist__process_sample().  Note the argument order: the evsel
 * comes before the sample.
 */
typedef int (*sched_handler)(struct perf_tool *tool,
			     union perf_event *event,
			     struct evsel *evsel,
			     struct perf_sample *sample,
			     struct machine *machine);
2904
2905static int perf_timehist__process_sample(struct perf_tool *tool,
2906 union perf_event *event,
2907 struct perf_sample *sample,
Jiri Olsa32dcd022019-07-21 13:23:51 +02002908 struct evsel *evsel,
David Ahern49394a22016-11-16 15:06:29 +09002909 struct machine *machine)
2910{
2911 struct perf_sched *sched = container_of(tool, struct perf_sched, tool);
2912 int err = 0;
2913 int this_cpu = sample->cpu;
2914
2915 if (this_cpu > sched->max_cpu)
2916 sched->max_cpu = this_cpu;
2917
2918 if (evsel->handler != NULL) {
2919 sched_handler f = evsel->handler;
2920
2921 err = f(tool, event, evsel, sample, machine);
2922 }
2923
2924 return err;
2925}
2926
David Ahern6c973c92016-11-16 15:06:32 +09002927static int timehist_check_attr(struct perf_sched *sched,
Jiri Olsa63503db2019-07-21 13:23:52 +02002928 struct evlist *evlist)
David Ahern6c973c92016-11-16 15:06:32 +09002929{
Jiri Olsa32dcd022019-07-21 13:23:51 +02002930 struct evsel *evsel;
David Ahern6c973c92016-11-16 15:06:32 +09002931 struct evsel_runtime *er;
2932
Jiri Olsace9036a2019-07-21 13:24:23 +02002933 list_for_each_entry(evsel, &evlist->core.entries, core.node) {
David Ahern6c973c92016-11-16 15:06:32 +09002934 er = perf_evsel__get_runtime(evsel);
2935 if (er == NULL) {
2936 pr_err("Failed to allocate memory for evsel runtime data\n");
2937 return -1;
2938 }
2939
Arnaldo Carvalho de Melo27de9b22018-05-28 16:00:29 -03002940 if (sched->show_callchain && !evsel__has_callchain(evsel)) {
David Ahern6c973c92016-11-16 15:06:32 +09002941 pr_info("Samples do not have callchains.\n");
2942 sched->show_callchain = 0;
2943 symbol_conf.use_callchain = 0;
2944 }
2945 }
2946
2947 return 0;
2948}
2949
David Ahern49394a22016-11-16 15:06:29 +09002950static int perf_sched__timehist(struct perf_sched *sched)
2951{
Jiri Olsa32dcd022019-07-21 13:23:51 +02002952 const struct evsel_str_handler handlers[] = {
David Ahern49394a22016-11-16 15:06:29 +09002953 { "sched:sched_switch", timehist_sched_switch_event, },
2954 { "sched:sched_wakeup", timehist_sched_wakeup_event, },
2955 { "sched:sched_wakeup_new", timehist_sched_wakeup_event, },
2956 };
Jiri Olsa32dcd022019-07-21 13:23:51 +02002957 const struct evsel_str_handler migrate_handlers[] = {
David Ahern350f54f2016-11-25 09:28:41 -07002958 { "sched:sched_migrate_task", timehist_migrate_task_event, },
2959 };
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01002960 struct perf_data data = {
Jiri Olsa2d4f2792019-02-21 10:41:30 +01002961 .path = input_name,
2962 .mode = PERF_DATA_MODE_READ,
2963 .force = sched->force,
David Ahern49394a22016-11-16 15:06:29 +09002964 };
2965
2966 struct perf_session *session;
Jiri Olsa63503db2019-07-21 13:23:52 +02002967 struct evlist *evlist;
David Ahern49394a22016-11-16 15:06:29 +09002968 int err = -1;
2969
2970 /*
2971 * event handlers for timehist option
2972 */
2973 sched->tool.sample = perf_timehist__process_sample;
2974 sched->tool.mmap = perf_event__process_mmap;
2975 sched->tool.comm = perf_event__process_comm;
2976 sched->tool.exit = perf_event__process_exit;
2977 sched->tool.fork = perf_event__process_fork;
2978 sched->tool.lost = process_lost;
2979 sched->tool.attr = perf_event__process_attr;
2980 sched->tool.tracing_data = perf_event__process_tracing_data;
2981 sched->tool.build_id = perf_event__process_build_id;
2982
2983 sched->tool.ordered_events = true;
2984 sched->tool.ordering_requires_timestamps = true;
2985
David Ahern6c973c92016-11-16 15:06:32 +09002986 symbol_conf.use_callchain = sched->show_callchain;
2987
Jiri Olsa8ceb41d2017-01-23 22:07:59 +01002988 session = perf_session__new(&data, false, &sched->tool);
David Ahern49394a22016-11-16 15:06:29 +09002989 if (session == NULL)
2990 return -ENOMEM;
2991
David Ahern52df1382016-11-16 15:06:30 +09002992 evlist = session->evlist;
2993
David Ahern49394a22016-11-16 15:06:29 +09002994 symbol__init(&session->header.env);
2995
David Ahern853b7402016-11-29 10:15:44 -07002996 if (perf_time__parse_str(&sched->ptime, sched->time_str) != 0) {
2997 pr_err("Invalid time string\n");
2998 return -EINVAL;
2999 }
3000
David Ahern6c973c92016-11-16 15:06:32 +09003001 if (timehist_check_attr(sched, evlist) != 0)
3002 goto out;
3003
David Ahern49394a22016-11-16 15:06:29 +09003004 setup_pager();
3005
3006 /* setup per-evsel handlers */
3007 if (perf_session__set_tracepoints_handlers(session, handlers))
3008 goto out;
3009
David Ahernf45bf8d2016-11-29 13:39:48 -07003010 /* sched_switch event at a minimum needs to exist */
3011 if (!perf_evlist__find_tracepoint_by_name(session->evlist,
3012 "sched:sched_switch")) {
3013 pr_err("No sched_switch events found. Have you run 'perf sched record'?\n");
David Ahern49394a22016-11-16 15:06:29 +09003014 goto out;
David Ahernf45bf8d2016-11-29 13:39:48 -07003015 }
David Ahern49394a22016-11-16 15:06:29 +09003016
David Ahern350f54f2016-11-25 09:28:41 -07003017 if (sched->show_migrations &&
3018 perf_session__set_tracepoints_handlers(session, migrate_handlers))
3019 goto out;
3020
David Ahern49394a22016-11-16 15:06:29 +09003021 /* pre-allocate struct for per-CPU idle stats */
3022 sched->max_cpu = session->header.env.nr_cpus_online;
3023 if (sched->max_cpu == 0)
3024 sched->max_cpu = 4;
3025 if (init_idle_threads(sched->max_cpu))
3026 goto out;
3027
David Ahern52df1382016-11-16 15:06:30 +09003028 /* summary_only implies summary option, but don't overwrite summary if set */
3029 if (sched->summary_only)
3030 sched->summary = sched->summary_only;
3031
3032 if (!sched->summary_only)
David Aherna407b062016-11-16 15:06:33 +09003033 timehist_header(sched);
David Ahern49394a22016-11-16 15:06:29 +09003034
3035 err = perf_session__process_events(session);
3036 if (err) {
3037 pr_err("Failed to process events, error %d", err);
3038 goto out;
3039 }
3040
David Ahern52df1382016-11-16 15:06:30 +09003041 sched->nr_events = evlist->stats.nr_events[0];
3042 sched->nr_lost_events = evlist->stats.total_lost;
3043 sched->nr_lost_chunks = evlist->stats.nr_events[PERF_RECORD_LOST];
3044
3045 if (sched->summary)
3046 timehist_print_summary(sched, session);
3047
David Ahern49394a22016-11-16 15:06:29 +09003048out:
3049 free_idle_threads();
3050 perf_session__delete(session);
3051
3052 return err;
3053}
3054
3055
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003056static void print_bad_events(struct perf_sched *sched)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003057{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003058 if (sched->nr_unordered_timestamps && sched->nr_timestamps) {
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003059 printf(" INFO: %.3f%% unordered timestamps (%ld out of %ld)\n",
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003060 (double)sched->nr_unordered_timestamps/(double)sched->nr_timestamps*100.0,
3061 sched->nr_unordered_timestamps, sched->nr_timestamps);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003062 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003063 if (sched->nr_lost_events && sched->nr_events) {
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003064 printf(" INFO: %.3f%% lost events (%ld out of %ld, in %ld chunks)\n",
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003065 (double)sched->nr_lost_events/(double)sched->nr_events * 100.0,
3066 sched->nr_lost_events, sched->nr_events, sched->nr_lost_chunks);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003067 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003068 if (sched->nr_context_switch_bugs && sched->nr_timestamps) {
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003069 printf(" INFO: %.3f%% context switch bugs (%ld out of %ld)",
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003070 (double)sched->nr_context_switch_bugs/(double)sched->nr_timestamps*100.0,
3071 sched->nr_context_switch_bugs, sched->nr_timestamps);
3072 if (sched->nr_lost_events)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003073 printf(" (due to lost events?)");
3074 printf("\n");
3075 }
3076}
3077
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003078static void __merge_work_atoms(struct rb_root_cached *root, struct work_atoms *data)
Josef Bacik2f80dd42015-05-22 09:18:40 -04003079{
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003080 struct rb_node **new = &(root->rb_root.rb_node), *parent = NULL;
Josef Bacik2f80dd42015-05-22 09:18:40 -04003081 struct work_atoms *this;
3082 const char *comm = thread__comm_str(data->thread), *this_comm;
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003083 bool leftmost = true;
Josef Bacik2f80dd42015-05-22 09:18:40 -04003084
3085 while (*new) {
3086 int cmp;
3087
3088 this = container_of(*new, struct work_atoms, node);
3089 parent = *new;
3090
3091 this_comm = thread__comm_str(this->thread);
3092 cmp = strcmp(comm, this_comm);
3093 if (cmp > 0) {
3094 new = &((*new)->rb_left);
3095 } else if (cmp < 0) {
3096 new = &((*new)->rb_right);
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003097 leftmost = false;
Josef Bacik2f80dd42015-05-22 09:18:40 -04003098 } else {
3099 this->num_merged++;
3100 this->total_runtime += data->total_runtime;
3101 this->nb_atoms += data->nb_atoms;
3102 this->total_lat += data->total_lat;
3103 list_splice(&data->work_list, &this->work_list);
3104 if (this->max_lat < data->max_lat) {
3105 this->max_lat = data->max_lat;
3106 this->max_lat_at = data->max_lat_at;
3107 }
3108 zfree(&data);
3109 return;
3110 }
3111 }
3112
3113 data->num_merged++;
3114 rb_link_node(&data->node, parent, new);
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003115 rb_insert_color_cached(&data->node, root, leftmost);
Josef Bacik2f80dd42015-05-22 09:18:40 -04003116}
3117
3118static void perf_sched__merge_lat(struct perf_sched *sched)
3119{
3120 struct work_atoms *data;
3121 struct rb_node *node;
3122
3123 if (sched->skip_merge)
3124 return;
3125
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003126 while ((node = rb_first_cached(&sched->atom_root))) {
3127 rb_erase_cached(node, &sched->atom_root);
Josef Bacik2f80dd42015-05-22 09:18:40 -04003128 data = rb_entry(node, struct work_atoms, node);
3129 __merge_work_atoms(&sched->merged_atom_root, data);
3130 }
3131}
3132
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003133static int perf_sched__lat(struct perf_sched *sched)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003134{
3135 struct rb_node *next;
3136
3137 setup_pager();
David Ahernad9def72013-08-07 22:50:44 -04003138
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03003139 if (perf_sched__read_events(sched))
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03003140 return -1;
David Ahernad9def72013-08-07 22:50:44 -04003141
Josef Bacik2f80dd42015-05-22 09:18:40 -04003142 perf_sched__merge_lat(sched);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003143 perf_sched__sort_lat(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003144
Ramkumar Ramachandra80790e02014-03-17 10:18:21 -04003145 printf("\n -----------------------------------------------------------------------------------------------------------------\n");
3146 printf(" Task | Runtime ms | Switches | Average delay ms | Maximum delay ms | Maximum delay at |\n");
3147 printf(" -----------------------------------------------------------------------------------------------------------------\n");
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003148
Davidlohr Buesocb4c13a2018-12-06 11:18:19 -08003149 next = rb_first_cached(&sched->sorted_atom_root);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003150
3151 while (next) {
3152 struct work_atoms *work_list;
3153
3154 work_list = rb_entry(next, struct work_atoms, node);
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003155 output_lat_thread(sched, work_list);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003156 next = rb_next(next);
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03003157 thread__zput(work_list->thread);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003158 }
3159
Ramkumar Ramachandra80790e02014-03-17 10:18:21 -04003160 printf(" -----------------------------------------------------------------------------------------------------------------\n");
Arnaldo Carvalho de Melo9486aa32011-01-22 20:37:02 -02003161 printf(" TOTAL: |%11.3f ms |%9" PRIu64 " |\n",
Arnaldo Carvalho de Melo4fc76e42016-08-08 12:23:49 -03003162 (double)sched->all_runtime / NSEC_PER_MSEC, sched->all_count);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003163
3164 printf(" ---------------------------------------------------\n");
3165
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003166 print_bad_events(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003167 printf("\n");
3168
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03003169 return 0;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003170}
3171
Jiri Olsa99623c62016-04-12 15:29:26 +02003172static int setup_map_cpus(struct perf_sched *sched)
3173{
Jiri Olsaf8548392019-07-21 13:23:49 +02003174 struct perf_cpu_map *map;
Jiri Olsa73643bb2016-04-12 15:29:31 +02003175
Jiri Olsa99623c62016-04-12 15:29:26 +02003176 sched->max_cpu = sysconf(_SC_NPROCESSORS_CONF);
3177
3178 if (sched->map.comp) {
3179 sched->map.comp_cpus = zalloc(sched->max_cpu * sizeof(int));
Jiri Olsacf294f22016-04-12 15:29:30 +02003180 if (!sched->map.comp_cpus)
3181 return -1;
Jiri Olsa99623c62016-04-12 15:29:26 +02003182 }
3183
Jiri Olsa73643bb2016-04-12 15:29:31 +02003184 if (!sched->map.cpus_str)
3185 return 0;
3186
Jiri Olsa9c3516d2019-07-21 13:24:30 +02003187 map = perf_cpu_map__new(sched->map.cpus_str);
Jiri Olsa73643bb2016-04-12 15:29:31 +02003188 if (!map) {
3189 pr_err("failed to get cpus map from %s\n", sched->map.cpus_str);
3190 return -1;
3191 }
3192
3193 sched->map.cpus = map;
Jiri Olsa99623c62016-04-12 15:29:26 +02003194 return 0;
3195}
3196
Jiri Olsaa151a372016-04-12 15:29:29 +02003197static int setup_color_pids(struct perf_sched *sched)
3198{
Jiri Olsa9749b902019-07-21 13:23:50 +02003199 struct perf_thread_map *map;
Jiri Olsaa151a372016-04-12 15:29:29 +02003200
3201 if (!sched->map.color_pids_str)
3202 return 0;
3203
3204 map = thread_map__new_by_tid_str(sched->map.color_pids_str);
3205 if (!map) {
3206 pr_err("failed to get thread map from %s\n", sched->map.color_pids_str);
3207 return -1;
3208 }
3209
3210 sched->map.color_pids = map;
3211 return 0;
3212}
3213
Jiri Olsacf294f22016-04-12 15:29:30 +02003214static int setup_color_cpus(struct perf_sched *sched)
3215{
Jiri Olsaf8548392019-07-21 13:23:49 +02003216 struct perf_cpu_map *map;
Jiri Olsacf294f22016-04-12 15:29:30 +02003217
3218 if (!sched->map.color_cpus_str)
3219 return 0;
3220
Jiri Olsa9c3516d2019-07-21 13:24:30 +02003221 map = perf_cpu_map__new(sched->map.color_cpus_str);
Jiri Olsacf294f22016-04-12 15:29:30 +02003222 if (!map) {
3223 pr_err("failed to get thread map from %s\n", sched->map.color_cpus_str);
3224 return -1;
3225 }
3226
3227 sched->map.color_cpus = map;
3228 return 0;
3229}
3230
/*
 * Implementation of 'perf sched map': set up the CPU and colouring maps,
 * read the events (the map itself is produced while they are processed)
 * and print any data-quality notes.
 *
 * Returns 0 on success, -1 if setup or event reading fails.
 */
static int perf_sched__map(struct perf_sched *sched)
{
	/* the setup steps run in this order and stop at the first failure */
	if (setup_map_cpus(sched) ||
	    setup_color_pids(sched) ||
	    setup_color_cpus(sched))
		return -1;

	setup_pager();

	if (perf_sched__read_events(sched) != 0)
		return -1;

	print_bad_events(sched);
	return 0;
}
3248
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003249static int perf_sched__replay(struct perf_sched *sched)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003250{
3251 unsigned long i;
3252
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003253 calibrate_run_measurement_overhead(sched);
3254 calibrate_sleep_measurement_overhead(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003255
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003256 test_calibrations(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003257
Arnaldo Carvalho de Meloae536ac2015-03-02 22:28:41 -03003258 if (perf_sched__read_events(sched))
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03003259 return -1;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003260
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003261 printf("nr_run_events: %ld\n", sched->nr_run_events);
3262 printf("nr_sleep_events: %ld\n", sched->nr_sleep_events);
3263 printf("nr_wakeup_events: %ld\n", sched->nr_wakeup_events);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003264
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003265 if (sched->targetless_wakeups)
3266 printf("target-less wakeups: %ld\n", sched->targetless_wakeups);
3267 if (sched->multitarget_wakeups)
3268 printf("multi-target wakeups: %ld\n", sched->multitarget_wakeups);
3269 if (sched->nr_run_events_optimized)
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003270 printf("run atoms optimized: %ld\n",
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003271 sched->nr_run_events_optimized);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003272
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003273 print_task_traces(sched);
3274 add_cross_task_wakeups(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003275
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003276 create_tasks(sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003277 printf("------------------------------------------------------------\n");
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003278 for (i = 0; i < sched->replay_repeat; i++)
3279 run_one_test(sched);
Arnaldo Carvalho de Meloa116e052012-09-08 22:53:06 -03003280
3281 return 0;
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003282}
3283
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003284static void setup_sorting(struct perf_sched *sched, const struct option *options,
3285 const char * const usage_msg[])
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02003286{
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003287 char *tmp, *tok, *str = strdup(sched->sort_order);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02003288
3289 for (tok = strtok_r(str, ", ", &tmp);
3290 tok; tok = strtok_r(NULL, ", ", &tmp)) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003291 if (sort_dimension__add(tok, &sched->sort_list) < 0) {
Namhyung Kimc7118362015-10-25 00:49:27 +09003292 usage_with_options_msg(usage_msg, options,
3293 "Unknown --sort key: `%s'", tok);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02003294 }
3295 }
3296
3297 free(str);
3298
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003299 sort_dimension__add("pid", &sched->cmp_pid);
Frederic Weisbeckerdaa1d7a2009-09-13 03:36:29 +02003300}
3301
/*
 * Implementation of 'perf sched record': run cmd_record() with the fixed
 * set of scheduler tracepoints followed by the user's own arguments
 * (argv[1..argc-1]).
 *
 * Returns the result of cmd_record(), or -ENOMEM if the argument vector
 * cannot be built.
 */
static int __cmd_record(int argc, const char **argv)
{
	unsigned int rec_argc, i, j;
	const char **rec_argv;
	char **owned;
	int ret;
	const char * const record_args[] = {
		"record",
		"-a",
		"-R",
		"-m", "1024",
		"-c", "1",
		"-e", "sched:sched_switch",
		"-e", "sched:sched_stat_wait",
		"-e", "sched:sched_stat_sleep",
		"-e", "sched:sched_stat_iowait",
		"-e", "sched:sched_stat_runtime",
		"-e", "sched:sched_process_fork",
		"-e", "sched:sched_wakeup",
		"-e", "sched:sched_wakeup_new",
		"-e", "sched:sched_migrate_task",
	};

	rec_argc = ARRAY_SIZE(record_args) + argc - 1;
	rec_argv = calloc(rec_argc + 1, sizeof(char *));

	if (rec_argv == NULL)
		return -ENOMEM;

	/*
	 * Keep a private list of the duplicated strings: the callee receives
	 * rec_argv and may rearrange it, so the copies are freed through this
	 * list rather than through rec_argv.
	 */
	owned = calloc(ARRAY_SIZE(record_args), sizeof(char *));
	if (owned == NULL) {
		free(rec_argv);
		return -ENOMEM;
	}

	for (i = 0; i < ARRAY_SIZE(record_args); i++) {
		owned[i] = strdup(record_args[i]);
		if (owned[i] == NULL) {
			ret = -ENOMEM;
			goto out;
		}
		rec_argv[i] = owned[i];
	}

	for (j = 1; j < (unsigned int)argc; j++, i++)
		rec_argv[i] = argv[j];

	BUG_ON(i != rec_argc);

	ret = cmd_record(i, rec_argv);

out:
	/* entries never duplicated are still NULL from calloc(); free(NULL) is fine */
	for (i = 0; i < ARRAY_SIZE(record_args); i++)
		free(owned[i]);
	free(owned);
	free(rec_argv);

	return ret;
}
3339
Arnaldo Carvalho de Melob0ad8ea2017-03-27 11:47:20 -03003340int cmd_sched(int argc, const char **argv)
Ingo Molnar0a02ad92009-09-11 12:12:54 +02003341{
Rasmus Villemoes49b8e2b2018-11-03 00:06:23 +01003342 static const char default_sort_order[] = "avg, max, switch, runtime";
Adrian Hunter8a39df82013-10-22 10:34:15 +03003343 struct perf_sched sched = {
3344 .tool = {
3345 .sample = perf_sched__process_tracepoint_sample,
Changbin Du99a3c3a2018-03-06 11:37:37 +08003346 .comm = perf_sched__process_comm,
Hari Bathinif3b36142017-03-08 02:11:43 +05303347 .namespaces = perf_event__process_namespaces,
Adrian Hunter8a39df82013-10-22 10:34:15 +03003348 .lost = perf_event__process_lost,
3349 .fork = perf_sched__process_fork_event,
Jiri Olsa0a8cb852014-07-06 14:18:21 +02003350 .ordered_events = true,
Adrian Hunter8a39df82013-10-22 10:34:15 +03003351 },
3352 .cmp_pid = LIST_HEAD_INIT(sched.cmp_pid),
3353 .sort_list = LIST_HEAD_INIT(sched.sort_list),
3354 .start_work_mutex = PTHREAD_MUTEX_INITIALIZER,
3355 .work_done_wait_mutex = PTHREAD_MUTEX_INITIALIZER,
Adrian Hunter8a39df82013-10-22 10:34:15 +03003356 .sort_order = default_sort_order,
3357 .replay_repeat = 10,
3358 .profile_cpu = -1,
3359 .next_shortname1 = 'A',
3360 .next_shortname2 = '0',
Josef Bacik2f80dd42015-05-22 09:18:40 -04003361 .skip_merge = 0,
David Ahern6c973c92016-11-16 15:06:32 +09003362 .show_callchain = 1,
3363 .max_stack = 5,
Adrian Hunter8a39df82013-10-22 10:34:15 +03003364 };
Namhyung Kim77f02f42016-10-24 12:00:03 +09003365 const struct option sched_options[] = {
3366 OPT_STRING('i', "input", &input_name, "file",
3367 "input file name"),
3368 OPT_INCR('v', "verbose", &verbose,
3369 "be more verbose (show symbol address, etc)"),
3370 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
3371 "dump raw trace in ASCII"),
Namhyung Kim6fa94252016-12-06 12:40:01 +09003372 OPT_BOOLEAN('f', "force", &sched.force, "don't complain, do it"),
Namhyung Kim77f02f42016-10-24 12:00:03 +09003373 OPT_END()
3374 };
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003375 const struct option latency_options[] = {
3376 OPT_STRING('s', "sort", &sched.sort_order, "key[,key2...]",
3377 "sort by key(s): runtime, switch, avg, max"),
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003378 OPT_INTEGER('C', "CPU", &sched.profile_cpu,
3379 "CPU to profile on"),
Josef Bacik2f80dd42015-05-22 09:18:40 -04003380 OPT_BOOLEAN('p', "pids", &sched.skip_merge,
3381 "latency stats per pid instead of per comm"),
Namhyung Kim77f02f42016-10-24 12:00:03 +09003382 OPT_PARENT(sched_options)
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003383 };
3384 const struct option replay_options[] = {
3385 OPT_UINTEGER('r', "repeat", &sched.replay_repeat,
3386 "repeat the workload replay N times (-1: infinite)"),
Namhyung Kim77f02f42016-10-24 12:00:03 +09003387 OPT_PARENT(sched_options)
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003388 };
Jiri Olsa99623c62016-04-12 15:29:26 +02003389 const struct option map_options[] = {
3390 OPT_BOOLEAN(0, "compact", &sched.map.comp,
3391 "map output in compact mode"),
Jiri Olsaa151a372016-04-12 15:29:29 +02003392 OPT_STRING(0, "color-pids", &sched.map.color_pids_str, "pids",
3393 "highlight given pids in map"),
Jiri Olsacf294f22016-04-12 15:29:30 +02003394 OPT_STRING(0, "color-cpus", &sched.map.color_cpus_str, "cpus",
3395 "highlight given CPUs in map"),
Jiri Olsa73643bb2016-04-12 15:29:31 +02003396 OPT_STRING(0, "cpus", &sched.map.cpus_str, "cpus",
3397 "display given CPUs in map"),
Namhyung Kim77f02f42016-10-24 12:00:03 +09003398 OPT_PARENT(sched_options)
Jiri Olsa99623c62016-04-12 15:29:26 +02003399 };
David Ahern49394a22016-11-16 15:06:29 +09003400 const struct option timehist_options[] = {
3401 OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
3402 "file", "vmlinux pathname"),
3403 OPT_STRING(0, "kallsyms", &symbol_conf.kallsyms_name,
3404 "file", "kallsyms pathname"),
David Ahern6c973c92016-11-16 15:06:32 +09003405 OPT_BOOLEAN('g', "call-graph", &sched.show_callchain,
3406 "Display call chains if present (default on)"),
3407 OPT_UINTEGER(0, "max-stack", &sched.max_stack,
3408 "Maximum number of functions to display backtrace."),
David Ahern49394a22016-11-16 15:06:29 +09003409 OPT_STRING(0, "symfs", &symbol_conf.symfs, "directory",
3410 "Look for files with symbols relative to this directory"),
David Ahern52df1382016-11-16 15:06:30 +09003411 OPT_BOOLEAN('s', "summary", &sched.summary_only,
3412 "Show only syscall summary with statistics"),
3413 OPT_BOOLEAN('S', "with-summary", &sched.summary,
3414 "Show all syscalls and summary with statistics"),
David Ahernfc1469f2016-11-16 15:06:31 +09003415 OPT_BOOLEAN('w', "wakeups", &sched.show_wakeups, "Show wakeup events"),
Brendan Gregg292c4a82017-03-14 01:56:29 +00003416 OPT_BOOLEAN('n', "next", &sched.show_next, "Show next task"),
David Ahern350f54f2016-11-25 09:28:41 -07003417 OPT_BOOLEAN('M', "migrations", &sched.show_migrations, "Show migration events"),
David Aherna407b062016-11-16 15:06:33 +09003418 OPT_BOOLEAN('V', "cpu-visual", &sched.show_cpu_visual, "Add CPU visual"),
Namhyung Kim07235f82016-12-08 23:47:54 +09003419 OPT_BOOLEAN('I', "idle-hist", &sched.idle_hist, "Show idle events only"),
David Ahern853b7402016-11-29 10:15:44 -07003420 OPT_STRING(0, "time", &sched.time_str, "str",
3421 "Time span for analysis (start,stop)"),
Namhyung Kim414e0502017-01-13 19:45:22 +09003422 OPT_BOOLEAN(0, "state", &sched.show_state, "Show task state when sched-out"),
David Ahern0f59d7a2017-09-01 10:49:12 -07003423 OPT_STRING('p', "pid", &symbol_conf.pid_list_str, "pid[,pid...]",
3424 "analyze events only for given process id(s)"),
3425 OPT_STRING('t', "tid", &symbol_conf.tid_list_str, "tid[,tid...]",
3426 "analyze events only for given thread id(s)"),
David Ahern49394a22016-11-16 15:06:29 +09003427 OPT_PARENT(sched_options)
3428 };
3429
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003430 const char * const latency_usage[] = {
3431 "perf sched latency [<options>]",
3432 NULL
3433 };
3434 const char * const replay_usage[] = {
3435 "perf sched replay [<options>]",
3436 NULL
3437 };
Jiri Olsa99623c62016-04-12 15:29:26 +02003438 const char * const map_usage[] = {
3439 "perf sched map [<options>]",
3440 NULL
3441 };
David Ahern49394a22016-11-16 15:06:29 +09003442 const char * const timehist_usage[] = {
3443 "perf sched timehist [<options>]",
3444 NULL
3445 };
Ramkumar Ramachandraa83edb22014-03-14 23:17:54 -04003446 const char *const sched_subcommands[] = { "record", "latency", "map",
David Ahern49394a22016-11-16 15:06:29 +09003447 "replay", "script",
3448 "timehist", NULL };
Ramkumar Ramachandraa83edb22014-03-14 23:17:54 -04003449 const char *sched_usage[] = {
3450 NULL,
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003451 NULL
3452 };
3453 struct trace_sched_handler lat_ops = {
3454 .wakeup_event = latency_wakeup_event,
3455 .switch_event = latency_switch_event,
3456 .runtime_event = latency_runtime_event,
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003457 .migrate_task_event = latency_migrate_task_event,
3458 };
3459 struct trace_sched_handler map_ops = {
3460 .switch_event = map_switch_event,
3461 };
3462 struct trace_sched_handler replay_ops = {
3463 .wakeup_event = replay_wakeup_event,
3464 .switch_event = replay_switch_event,
3465 .fork_event = replay_fork_event,
3466 };
Adrian Hunter156a2b02013-10-22 10:34:16 +03003467 unsigned int i;
3468
3469 for (i = 0; i < ARRAY_SIZE(sched.curr_pid); i++)
3470 sched.curr_pid[i] = -1;
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003471
Ramkumar Ramachandraa83edb22014-03-14 23:17:54 -04003472 argc = parse_options_subcommand(argc, argv, sched_options, sched_subcommands,
3473 sched_usage, PARSE_OPT_STOP_AT_NON_OPTION);
Ingo Molnarf2858d82009-09-11 12:12:54 +02003474 if (!argc)
3475 usage_with_options(sched_usage, sched_options);
3476
Xiao Guangrongc0777c52009-12-07 12:04:49 +08003477 /*
Ingo Molnar133dc4c2010-11-16 18:45:39 +01003478 * Aliased to 'perf script' for now:
Xiao Guangrongc0777c52009-12-07 12:04:49 +08003479 */
Ingo Molnar133dc4c2010-11-16 18:45:39 +01003480 if (!strcmp(argv[0], "script"))
Arnaldo Carvalho de Melob0ad8ea2017-03-27 11:47:20 -03003481 return cmd_script(argc, argv);
Xiao Guangrongc0777c52009-12-07 12:04:49 +08003482
Ingo Molnar1fc35b22009-09-13 09:44:29 +02003483 if (!strncmp(argv[0], "rec", 3)) {
3484 return __cmd_record(argc, argv);
3485 } else if (!strncmp(argv[0], "lat", 3)) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003486 sched.tp_handler = &lat_ops;
Ingo Molnarf2858d82009-09-11 12:12:54 +02003487 if (argc > 1) {
3488 argc = parse_options(argc, argv, latency_options, latency_usage, 0);
3489 if (argc)
3490 usage_with_options(latency_usage, latency_options);
Ingo Molnarf2858d82009-09-11 12:12:54 +02003491 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003492 setup_sorting(&sched, latency_options, latency_usage);
3493 return perf_sched__lat(&sched);
Ingo Molnar0ec04e12009-09-16 17:40:48 +02003494 } else if (!strcmp(argv[0], "map")) {
Jiri Olsa99623c62016-04-12 15:29:26 +02003495 if (argc) {
Jiri Olsaa151a372016-04-12 15:29:29 +02003496 argc = parse_options(argc, argv, map_options, map_usage, 0);
Jiri Olsa99623c62016-04-12 15:29:26 +02003497 if (argc)
3498 usage_with_options(map_usage, map_options);
3499 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003500 sched.tp_handler = &map_ops;
3501 setup_sorting(&sched, latency_options, latency_usage);
3502 return perf_sched__map(&sched);
Ingo Molnarf2858d82009-09-11 12:12:54 +02003503 } else if (!strncmp(argv[0], "rep", 3)) {
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003504 sched.tp_handler = &replay_ops;
Ingo Molnarf2858d82009-09-11 12:12:54 +02003505 if (argc) {
3506 argc = parse_options(argc, argv, replay_options, replay_usage, 0);
3507 if (argc)
3508 usage_with_options(replay_usage, replay_options);
3509 }
Arnaldo Carvalho de Melo0e9b07e2012-09-11 17:29:27 -03003510 return perf_sched__replay(&sched);
David Ahern49394a22016-11-16 15:06:29 +09003511 } else if (!strcmp(argv[0], "timehist")) {
3512 if (argc) {
3513 argc = parse_options(argc, argv, timehist_options,
3514 timehist_usage, 0);
3515 if (argc)
3516 usage_with_options(timehist_usage, timehist_options);
3517 }
Brendan Gregg292c4a82017-03-14 01:56:29 +00003518 if ((sched.show_wakeups || sched.show_next) &&
3519 sched.summary_only) {
3520 pr_err(" Error: -s and -[n|w] are mutually exclusive.\n");
David Ahernfc1469f2016-11-16 15:06:31 +09003521 parse_options_usage(timehist_usage, timehist_options, "s", true);
Brendan Gregg292c4a82017-03-14 01:56:29 +00003522 if (sched.show_wakeups)
3523 parse_options_usage(NULL, timehist_options, "w", true);
3524 if (sched.show_next)
3525 parse_options_usage(NULL, timehist_options, "n", true);
David Ahernfc1469f2016-11-16 15:06:31 +09003526 return -EINVAL;
3527 }
3528
David Ahern49394a22016-11-16 15:06:29 +09003529 return perf_sched__timehist(&sched);
Ingo Molnarf2858d82009-09-11 12:12:54 +02003530 } else {
3531 usage_with_options(sched_usage, sched_options);
Ingo Molnar0a02ad92009-09-11 12:12:54 +02003532 }
3533
Ingo Molnarec156762009-09-11 12:12:54 +02003534 return 0;
Ingo Molnar0a02ad92009-09-11 12:12:54 +02003535}