blob: bc0b309c3f19e2ce7e07b2d0419d9157d423497a [file] [log] [blame]
#include <linux/cgroup.h>
#include <linux/slab.h>
#include <linux/percpu.h>
#include <linux/spinlock.h>
#include <linux/cpumask.h>
#include <linux/seq_file.h>
#include <linux/rcupdate.h>
#include <linux/kernel_stat.h>
#include <linux/err.h>

#include <asm/irq_regs.h>

#include "sched.h"
12
13/*
14 * CPU accounting code for task groups.
15 *
16 * Based on the work by Paul Menage (menage@google.com) and Balbir Singh
17 * (balbir@in.ibm.com).
18 */
19
/*
 * Index of each accounted execution mode. The values are used directly as
 * indices into cpuacct_usage::usages[] and cpuacct_stat_desc[].
 */
enum cpuacct_stat_index {
	CPUACCT_STAT_USER = 0,		/* time spent in user mode */
	CPUACCT_STAT_SYSTEM = 1,	/* time spent in kernel mode */

	/* Number of real stats; also used as the "sum of all stats" index. */
	CPUACCT_STAT_NSTATS,
};
27
Zhao Lei9acacc22016-06-20 17:37:18 +080028static const char * const cpuacct_stat_desc[] = {
29 [CPUACCT_STAT_USER] = "user",
30 [CPUACCT_STAT_SYSTEM] = "system",
Dongsheng Yangd7400372016-03-22 16:37:08 +080031};
32
33struct cpuacct_usage {
Zhao Lei9acacc22016-06-20 17:37:18 +080034 u64 usages[CPUACCT_STAT_NSTATS];
Dongsheng Yangd7400372016-03-22 16:37:08 +080035};
36
Li Zefand1712792013-03-29 14:38:13 +080037/* track cpu usage of a group of tasks and its child groups */
38struct cpuacct {
39 struct cgroup_subsys_state css;
40 /* cpuusage holds pointer to a u64-type object on every cpu */
Dongsheng Yangd7400372016-03-22 16:37:08 +080041 struct cpuacct_usage __percpu *cpuusage;
Li Zefand1712792013-03-29 14:38:13 +080042 struct kernel_cpustat __percpu *cpustat;
43};
44
Tejun Heoa7c6d552013-08-08 20:11:23 -040045static inline struct cpuacct *css_ca(struct cgroup_subsys_state *css)
46{
47 return css ? container_of(css, struct cpuacct, css) : NULL;
48}
49
Li Zefand1712792013-03-29 14:38:13 +080050/* return cpu accounting group to which this task belongs */
51static inline struct cpuacct *task_ca(struct task_struct *tsk)
52{
Tejun Heo073219e2014-02-08 10:36:58 -050053 return css_ca(task_css(tsk, cpuacct_cgrp_id));
Li Zefand1712792013-03-29 14:38:13 +080054}
55
Li Zefand1712792013-03-29 14:38:13 +080056static inline struct cpuacct *parent_ca(struct cpuacct *ca)
57{
Tejun Heo5c9d5352014-05-16 13:22:48 -040058 return css_ca(ca->css.parent);
Li Zefand1712792013-03-29 14:38:13 +080059}
60
Dongsheng Yangd7400372016-03-22 16:37:08 +080061static DEFINE_PER_CPU(struct cpuacct_usage, root_cpuacct_cpuusage);
Li Zefan14c6d3c2013-03-29 14:44:04 +080062static struct cpuacct root_cpuacct = {
63 .cpustat = &kernel_cpustat,
64 .cpuusage = &root_cpuacct_cpuusage,
65};
Li Zefan2e76c242013-03-29 14:36:31 +080066
67/* create a new cpu accounting group */
Tejun Heoeb954192013-08-08 20:11:23 -040068static struct cgroup_subsys_state *
69cpuacct_css_alloc(struct cgroup_subsys_state *parent_css)
Li Zefan2e76c242013-03-29 14:36:31 +080070{
71 struct cpuacct *ca;
72
Tejun Heoeb954192013-08-08 20:11:23 -040073 if (!parent_css)
Li Zefan2e76c242013-03-29 14:36:31 +080074 return &root_cpuacct.css;
75
76 ca = kzalloc(sizeof(*ca), GFP_KERNEL);
77 if (!ca)
78 goto out;
79
Dongsheng Yangd7400372016-03-22 16:37:08 +080080 ca->cpuusage = alloc_percpu(struct cpuacct_usage);
Li Zefan2e76c242013-03-29 14:36:31 +080081 if (!ca->cpuusage)
82 goto out_free_ca;
83
84 ca->cpustat = alloc_percpu(struct kernel_cpustat);
85 if (!ca->cpustat)
86 goto out_free_cpuusage;
87
88 return &ca->css;
89
90out_free_cpuusage:
91 free_percpu(ca->cpuusage);
92out_free_ca:
93 kfree(ca);
94out:
95 return ERR_PTR(-ENOMEM);
96}
97
98/* destroy an existing cpu accounting group */
Tejun Heoeb954192013-08-08 20:11:23 -040099static void cpuacct_css_free(struct cgroup_subsys_state *css)
Li Zefan2e76c242013-03-29 14:36:31 +0800100{
Tejun Heoeb954192013-08-08 20:11:23 -0400101 struct cpuacct *ca = css_ca(css);
Li Zefan2e76c242013-03-29 14:36:31 +0800102
103 free_percpu(ca->cpustat);
104 free_percpu(ca->cpuusage);
105 kfree(ca);
106}
107
Dongsheng Yangd7400372016-03-22 16:37:08 +0800108static u64 cpuacct_cpuusage_read(struct cpuacct *ca, int cpu,
Zhao Lei9acacc22016-06-20 17:37:18 +0800109 enum cpuacct_stat_index index)
Li Zefan2e76c242013-03-29 14:36:31 +0800110{
Dongsheng Yangd7400372016-03-22 16:37:08 +0800111 struct cpuacct_usage *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
Li Zefan2e76c242013-03-29 14:36:31 +0800112 u64 data;
113
Dongsheng Yangd7400372016-03-22 16:37:08 +0800114 /*
Zhao Lei9acacc22016-06-20 17:37:18 +0800115 * We allow index == CPUACCT_STAT_NSTATS here to read
Dongsheng Yangd7400372016-03-22 16:37:08 +0800116 * the sum of suages.
117 */
Zhao Lei9acacc22016-06-20 17:37:18 +0800118 BUG_ON(index > CPUACCT_STAT_NSTATS);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800119
Li Zefan2e76c242013-03-29 14:36:31 +0800120#ifndef CONFIG_64BIT
121 /*
122 * Take rq->lock to make 64-bit read safe on 32-bit platforms.
123 */
124 raw_spin_lock_irq(&cpu_rq(cpu)->lock);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800125#endif
126
Zhao Lei9acacc22016-06-20 17:37:18 +0800127 if (index == CPUACCT_STAT_NSTATS) {
Dongsheng Yangd7400372016-03-22 16:37:08 +0800128 int i = 0;
129
130 data = 0;
Zhao Lei9acacc22016-06-20 17:37:18 +0800131 for (i = 0; i < CPUACCT_STAT_NSTATS; i++)
Dongsheng Yangd7400372016-03-22 16:37:08 +0800132 data += cpuusage->usages[i];
133 } else {
134 data = cpuusage->usages[index];
135 }
136
137#ifndef CONFIG_64BIT
Li Zefan2e76c242013-03-29 14:36:31 +0800138 raw_spin_unlock_irq(&cpu_rq(cpu)->lock);
Li Zefan2e76c242013-03-29 14:36:31 +0800139#endif
140
141 return data;
142}
143
144static void cpuacct_cpuusage_write(struct cpuacct *ca, int cpu, u64 val)
145{
Dongsheng Yangd7400372016-03-22 16:37:08 +0800146 struct cpuacct_usage *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
147 int i;
Li Zefan2e76c242013-03-29 14:36:31 +0800148
149#ifndef CONFIG_64BIT
150 /*
151 * Take rq->lock to make 64-bit write safe on 32-bit platforms.
152 */
153 raw_spin_lock_irq(&cpu_rq(cpu)->lock);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800154#endif
155
Zhao Lei9acacc22016-06-20 17:37:18 +0800156 for (i = 0; i < CPUACCT_STAT_NSTATS; i++)
Dongsheng Yangd7400372016-03-22 16:37:08 +0800157 cpuusage->usages[i] = val;
158
159#ifndef CONFIG_64BIT
Li Zefan2e76c242013-03-29 14:36:31 +0800160 raw_spin_unlock_irq(&cpu_rq(cpu)->lock);
Li Zefan2e76c242013-03-29 14:36:31 +0800161#endif
162}
163
164/* return total cpu usage (in nanoseconds) of a group */
Dongsheng Yangd7400372016-03-22 16:37:08 +0800165static u64 __cpuusage_read(struct cgroup_subsys_state *css,
Zhao Lei9acacc22016-06-20 17:37:18 +0800166 enum cpuacct_stat_index index)
Li Zefan2e76c242013-03-29 14:36:31 +0800167{
Tejun Heo182446d2013-08-08 20:11:24 -0400168 struct cpuacct *ca = css_ca(css);
Li Zefan2e76c242013-03-29 14:36:31 +0800169 u64 totalcpuusage = 0;
170 int i;
171
Zhao Lei5ca37262016-03-22 16:37:07 +0800172 for_each_possible_cpu(i)
Dongsheng Yangd7400372016-03-22 16:37:08 +0800173 totalcpuusage += cpuacct_cpuusage_read(ca, i, index);
Li Zefan2e76c242013-03-29 14:36:31 +0800174
175 return totalcpuusage;
176}
177
Dongsheng Yangd7400372016-03-22 16:37:08 +0800178static u64 cpuusage_user_read(struct cgroup_subsys_state *css,
179 struct cftype *cft)
180{
Zhao Lei9acacc22016-06-20 17:37:18 +0800181 return __cpuusage_read(css, CPUACCT_STAT_USER);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800182}
183
184static u64 cpuusage_sys_read(struct cgroup_subsys_state *css,
185 struct cftype *cft)
186{
Zhao Lei9acacc22016-06-20 17:37:18 +0800187 return __cpuusage_read(css, CPUACCT_STAT_SYSTEM);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800188}
189
190static u64 cpuusage_read(struct cgroup_subsys_state *css, struct cftype *cft)
191{
Zhao Lei9acacc22016-06-20 17:37:18 +0800192 return __cpuusage_read(css, CPUACCT_STAT_NSTATS);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800193}
194
Tejun Heo182446d2013-08-08 20:11:24 -0400195static int cpuusage_write(struct cgroup_subsys_state *css, struct cftype *cft,
Dongsheng Yang1a736b72015-12-21 19:14:42 +0800196 u64 val)
Li Zefan2e76c242013-03-29 14:36:31 +0800197{
Tejun Heo182446d2013-08-08 20:11:24 -0400198 struct cpuacct *ca = css_ca(css);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800199 int cpu;
Li Zefan2e76c242013-03-29 14:36:31 +0800200
Dongsheng Yang1a736b72015-12-21 19:14:42 +0800201 /*
202 * Only allow '0' here to do a reset.
203 */
Dongsheng Yangd7400372016-03-22 16:37:08 +0800204 if (val)
205 return -EINVAL;
Li Zefan2e76c242013-03-29 14:36:31 +0800206
Dongsheng Yangd7400372016-03-22 16:37:08 +0800207 for_each_possible_cpu(cpu)
208 cpuacct_cpuusage_write(ca, cpu, 0);
Li Zefan2e76c242013-03-29 14:36:31 +0800209
Dongsheng Yangd7400372016-03-22 16:37:08 +0800210 return 0;
Li Zefan2e76c242013-03-29 14:36:31 +0800211}
212
Dongsheng Yangd7400372016-03-22 16:37:08 +0800213static int __cpuacct_percpu_seq_show(struct seq_file *m,
Zhao Lei9acacc22016-06-20 17:37:18 +0800214 enum cpuacct_stat_index index)
Li Zefan2e76c242013-03-29 14:36:31 +0800215{
Tejun Heo2da8ca82013-12-05 12:28:04 -0500216 struct cpuacct *ca = css_ca(seq_css(m));
Li Zefan2e76c242013-03-29 14:36:31 +0800217 u64 percpu;
218 int i;
219
Zhao Lei5ca37262016-03-22 16:37:07 +0800220 for_each_possible_cpu(i) {
Dongsheng Yangd7400372016-03-22 16:37:08 +0800221 percpu = cpuacct_cpuusage_read(ca, i, index);
Li Zefan2e76c242013-03-29 14:36:31 +0800222 seq_printf(m, "%llu ", (unsigned long long) percpu);
223 }
224 seq_printf(m, "\n");
225 return 0;
226}
227
Dongsheng Yangd7400372016-03-22 16:37:08 +0800228static int cpuacct_percpu_user_seq_show(struct seq_file *m, void *V)
229{
Zhao Lei9acacc22016-06-20 17:37:18 +0800230 return __cpuacct_percpu_seq_show(m, CPUACCT_STAT_USER);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800231}
232
233static int cpuacct_percpu_sys_seq_show(struct seq_file *m, void *V)
234{
Zhao Lei9acacc22016-06-20 17:37:18 +0800235 return __cpuacct_percpu_seq_show(m, CPUACCT_STAT_SYSTEM);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800236}
237
238static int cpuacct_percpu_seq_show(struct seq_file *m, void *V)
239{
Zhao Lei9acacc22016-06-20 17:37:18 +0800240 return __cpuacct_percpu_seq_show(m, CPUACCT_STAT_NSTATS);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800241}
242
Zhao Lei277a13e2016-06-20 17:37:20 +0800243static int cpuacct_all_seq_show(struct seq_file *m, void *V)
244{
245 struct cpuacct *ca = css_ca(seq_css(m));
246 int index;
247 int cpu;
248
249 seq_puts(m, "cpu");
250 for (index = 0; index < CPUACCT_STAT_NSTATS; index++)
251 seq_printf(m, " %s", cpuacct_stat_desc[index]);
252 seq_puts(m, "\n");
253
254 for_each_possible_cpu(cpu) {
255 struct cpuacct_usage *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
256
257 seq_printf(m, "%d", cpu);
258
259 for (index = 0; index < CPUACCT_STAT_NSTATS; index++) {
260#ifndef CONFIG_64BIT
261 /*
262 * Take rq->lock to make 64-bit read safe on 32-bit
263 * platforms.
264 */
265 raw_spin_lock_irq(&cpu_rq(cpu)->lock);
266#endif
267
268 seq_printf(m, " %llu", cpuusage->usages[index]);
269
270#ifndef CONFIG_64BIT
271 raw_spin_unlock_irq(&cpu_rq(cpu)->lock);
272#endif
273 }
274 seq_puts(m, "\n");
275 }
276 return 0;
277}
278
Tejun Heo2da8ca82013-12-05 12:28:04 -0500279static int cpuacct_stats_show(struct seq_file *sf, void *v)
Li Zefan2e76c242013-03-29 14:36:31 +0800280{
Tejun Heo2da8ca82013-12-05 12:28:04 -0500281 struct cpuacct *ca = css_ca(seq_css(sf));
Zhao Lei8e546bf2016-06-20 17:37:19 +0800282 s64 val[CPUACCT_STAT_NSTATS];
Li Zefan2e76c242013-03-29 14:36:31 +0800283 int cpu;
Zhao Lei8e546bf2016-06-20 17:37:19 +0800284 int stat;
Li Zefan2e76c242013-03-29 14:36:31 +0800285
Zhao Lei8e546bf2016-06-20 17:37:19 +0800286 memset(val, 0, sizeof(val));
Zhao Lei5ca37262016-03-22 16:37:07 +0800287 for_each_possible_cpu(cpu) {
Zhao Lei8e546bf2016-06-20 17:37:19 +0800288 u64 *cpustat = per_cpu_ptr(ca->cpustat, cpu)->cpustat;
Li Zefan2e76c242013-03-29 14:36:31 +0800289
Zhao Lei8e546bf2016-06-20 17:37:19 +0800290 val[CPUACCT_STAT_USER] += cpustat[CPUTIME_USER];
291 val[CPUACCT_STAT_USER] += cpustat[CPUTIME_NICE];
292 val[CPUACCT_STAT_SYSTEM] += cpustat[CPUTIME_SYSTEM];
293 val[CPUACCT_STAT_SYSTEM] += cpustat[CPUTIME_IRQ];
294 val[CPUACCT_STAT_SYSTEM] += cpustat[CPUTIME_SOFTIRQ];
Li Zefan2e76c242013-03-29 14:36:31 +0800295 }
296
Zhao Lei8e546bf2016-06-20 17:37:19 +0800297 for (stat = 0; stat < CPUACCT_STAT_NSTATS; stat++) {
298 seq_printf(sf, "%s %lld\n",
299 cpuacct_stat_desc[stat],
300 cputime64_to_clock_t(val[stat]));
301 }
Li Zefan2e76c242013-03-29 14:36:31 +0800302
303 return 0;
304}
305
306static struct cftype files[] = {
307 {
308 .name = "usage",
309 .read_u64 = cpuusage_read,
310 .write_u64 = cpuusage_write,
311 },
312 {
Dongsheng Yangd7400372016-03-22 16:37:08 +0800313 .name = "usage_user",
314 .read_u64 = cpuusage_user_read,
315 },
316 {
317 .name = "usage_sys",
318 .read_u64 = cpuusage_sys_read,
319 },
320 {
Li Zefan2e76c242013-03-29 14:36:31 +0800321 .name = "usage_percpu",
Tejun Heo2da8ca82013-12-05 12:28:04 -0500322 .seq_show = cpuacct_percpu_seq_show,
Li Zefan2e76c242013-03-29 14:36:31 +0800323 },
324 {
Dongsheng Yangd7400372016-03-22 16:37:08 +0800325 .name = "usage_percpu_user",
326 .seq_show = cpuacct_percpu_user_seq_show,
327 },
328 {
329 .name = "usage_percpu_sys",
330 .seq_show = cpuacct_percpu_sys_seq_show,
331 },
332 {
Zhao Lei277a13e2016-06-20 17:37:20 +0800333 .name = "usage_all",
334 .seq_show = cpuacct_all_seq_show,
335 },
336 {
Li Zefan2e76c242013-03-29 14:36:31 +0800337 .name = "stat",
Tejun Heo2da8ca82013-12-05 12:28:04 -0500338 .seq_show = cpuacct_stats_show,
Li Zefan2e76c242013-03-29 14:36:31 +0800339 },
340 { } /* terminate */
341};
342
343/*
344 * charge this task's execution time to its accounting group.
345 *
346 * called with rq->lock held.
347 */
348void cpuacct_charge(struct task_struct *tsk, u64 cputime)
349{
350 struct cpuacct *ca;
Zhao Lei9acacc22016-06-20 17:37:18 +0800351 int index = CPUACCT_STAT_SYSTEM;
Anton Blanchardbd928832016-04-06 21:59:50 +1000352 struct pt_regs *regs = task_pt_regs(tsk);
Dongsheng Yangd7400372016-03-22 16:37:08 +0800353
Anton Blanchardbd928832016-04-06 21:59:50 +1000354 if (regs && user_mode(regs))
Zhao Lei9acacc22016-06-20 17:37:18 +0800355 index = CPUACCT_STAT_USER;
Li Zefan2e76c242013-03-29 14:36:31 +0800356
357 rcu_read_lock();
Dongsheng Yangd7400372016-03-22 16:37:08 +0800358
Zhao Lei73e6aaf2016-03-17 12:19:43 +0800359 for (ca = task_ca(tsk); ca; ca = parent_ca(ca))
Dongsheng Yangd7400372016-03-22 16:37:08 +0800360 this_cpu_ptr(ca->cpuusage)->usages[index] += cputime;
361
Li Zefan2e76c242013-03-29 14:36:31 +0800362 rcu_read_unlock();
363}
364
Li Zefan1966aaf2013-03-29 14:37:06 +0800365/*
366 * Add user/system time to cpuacct.
367 *
368 * Note: it's the caller that updates the account of the root cgroup.
369 */
Zhao Lei73e6aaf2016-03-17 12:19:43 +0800370void cpuacct_account_field(struct task_struct *tsk, int index, u64 val)
Li Zefan1966aaf2013-03-29 14:37:06 +0800371{
Li Zefan1966aaf2013-03-29 14:37:06 +0800372 struct cpuacct *ca;
373
Li Zefan1966aaf2013-03-29 14:37:06 +0800374 rcu_read_lock();
Zhao Lei73e6aaf2016-03-17 12:19:43 +0800375 for (ca = task_ca(tsk); ca != &root_cpuacct; ca = parent_ca(ca))
376 this_cpu_ptr(ca->cpustat)->cpustat[index] += val;
Li Zefan1966aaf2013-03-29 14:37:06 +0800377 rcu_read_unlock();
378}
379
Tejun Heo073219e2014-02-08 10:36:58 -0500380struct cgroup_subsys cpuacct_cgrp_subsys = {
Li Zefan621e2de2013-03-29 14:44:15 +0800381 .css_alloc = cpuacct_css_alloc,
382 .css_free = cpuacct_css_free,
Tejun Heo55779642014-07-15 11:05:09 -0400383 .legacy_cftypes = files,
Tejun Heob38e42e2016-02-23 10:00:50 -0500384 .early_init = true,
Li Zefan2e76c242013-03-29 14:36:31 +0800385};