blob: f6926a149a71d40ed9d4f061f01c04766de3e5f9 [file] [log] [blame]
Li Zefan2e76c242013-03-29 14:36:31 +08001#include <linux/cgroup.h>
2#include <linux/slab.h>
3#include <linux/percpu.h>
4#include <linux/spinlock.h>
5#include <linux/cpumask.h>
6#include <linux/seq_file.h>
7#include <linux/rcupdate.h>
8#include <linux/kernel_stat.h>
Ingo Molnarb329fd52013-04-10 15:10:50 +02009#include <linux/err.h>
Li Zefan2e76c242013-03-29 14:36:31 +080010
11#include "sched.h"
12
13/*
14 * CPU accounting code for task groups.
15 *
16 * Based on the work by Paul Menage (menage@google.com) and Balbir Singh
17 * (balbir@in.ibm.com).
18 */
19
/*
 * Indices of the per-group statistics: time spent by the tasks of the
 * cpu accounting group executing in ...
 */
enum cpuacct_stat_index {
	CPUACCT_STAT_USER,	/* ... user mode */
	CPUACCT_STAT_SYSTEM,	/* ... kernel mode */

	CPUACCT_STAT_NSTATS,	/* number of entries above; keep last */
};
27
28/* track cpu usage of a group of tasks and its child groups */
29struct cpuacct {
30 struct cgroup_subsys_state css;
31 /* cpuusage holds pointer to a u64-type object on every cpu */
32 u64 __percpu *cpuusage;
33 struct kernel_cpustat __percpu *cpustat;
34};
35
Tejun Heoa7c6d552013-08-08 20:11:23 -040036static inline struct cpuacct *css_ca(struct cgroup_subsys_state *css)
37{
38 return css ? container_of(css, struct cpuacct, css) : NULL;
39}
40
Li Zefand1712792013-03-29 14:38:13 +080041/* return cpu accounting group corresponding to this container */
42static inline struct cpuacct *cgroup_ca(struct cgroup *cgrp)
43{
Tejun Heoa7c6d552013-08-08 20:11:23 -040044 return css_ca(cgroup_css(cgrp, cpuacct_subsys_id));
Li Zefand1712792013-03-29 14:38:13 +080045}
46
47/* return cpu accounting group to which this task belongs */
48static inline struct cpuacct *task_ca(struct task_struct *tsk)
49{
Tejun Heoa7c6d552013-08-08 20:11:23 -040050 return css_ca(task_css(tsk, cpuacct_subsys_id));
Li Zefand1712792013-03-29 14:38:13 +080051}
52
Li Zefand1712792013-03-29 14:38:13 +080053static inline struct cpuacct *parent_ca(struct cpuacct *ca)
54{
Tejun Heo63876982013-08-08 20:11:23 -040055 return css_ca(css_parent(&ca->css));
Li Zefand1712792013-03-29 14:38:13 +080056}
57
Li Zefan7943e152013-03-29 14:43:46 +080058static DEFINE_PER_CPU(u64, root_cpuacct_cpuusage);
Li Zefan14c6d3c2013-03-29 14:44:04 +080059static struct cpuacct root_cpuacct = {
60 .cpustat = &kernel_cpustat,
61 .cpuusage = &root_cpuacct_cpuusage,
62};
Li Zefan2e76c242013-03-29 14:36:31 +080063
64/* create a new cpu accounting group */
65static struct cgroup_subsys_state *cpuacct_css_alloc(struct cgroup *cgrp)
66{
67 struct cpuacct *ca;
68
69 if (!cgrp->parent)
70 return &root_cpuacct.css;
71
72 ca = kzalloc(sizeof(*ca), GFP_KERNEL);
73 if (!ca)
74 goto out;
75
76 ca->cpuusage = alloc_percpu(u64);
77 if (!ca->cpuusage)
78 goto out_free_ca;
79
80 ca->cpustat = alloc_percpu(struct kernel_cpustat);
81 if (!ca->cpustat)
82 goto out_free_cpuusage;
83
84 return &ca->css;
85
86out_free_cpuusage:
87 free_percpu(ca->cpuusage);
88out_free_ca:
89 kfree(ca);
90out:
91 return ERR_PTR(-ENOMEM);
92}
93
94/* destroy an existing cpu accounting group */
95static void cpuacct_css_free(struct cgroup *cgrp)
96{
97 struct cpuacct *ca = cgroup_ca(cgrp);
98
99 free_percpu(ca->cpustat);
100 free_percpu(ca->cpuusage);
101 kfree(ca);
102}
103
104static u64 cpuacct_cpuusage_read(struct cpuacct *ca, int cpu)
105{
106 u64 *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
107 u64 data;
108
109#ifndef CONFIG_64BIT
110 /*
111 * Take rq->lock to make 64-bit read safe on 32-bit platforms.
112 */
113 raw_spin_lock_irq(&cpu_rq(cpu)->lock);
114 data = *cpuusage;
115 raw_spin_unlock_irq(&cpu_rq(cpu)->lock);
116#else
117 data = *cpuusage;
118#endif
119
120 return data;
121}
122
123static void cpuacct_cpuusage_write(struct cpuacct *ca, int cpu, u64 val)
124{
125 u64 *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
126
127#ifndef CONFIG_64BIT
128 /*
129 * Take rq->lock to make 64-bit write safe on 32-bit platforms.
130 */
131 raw_spin_lock_irq(&cpu_rq(cpu)->lock);
132 *cpuusage = val;
133 raw_spin_unlock_irq(&cpu_rq(cpu)->lock);
134#else
135 *cpuusage = val;
136#endif
137}
138
139/* return total cpu usage (in nanoseconds) of a group */
140static u64 cpuusage_read(struct cgroup *cgrp, struct cftype *cft)
141{
142 struct cpuacct *ca = cgroup_ca(cgrp);
143 u64 totalcpuusage = 0;
144 int i;
145
146 for_each_present_cpu(i)
147 totalcpuusage += cpuacct_cpuusage_read(ca, i);
148
149 return totalcpuusage;
150}
151
152static int cpuusage_write(struct cgroup *cgrp, struct cftype *cftype,
153 u64 reset)
154{
155 struct cpuacct *ca = cgroup_ca(cgrp);
156 int err = 0;
157 int i;
158
159 if (reset) {
160 err = -EINVAL;
161 goto out;
162 }
163
164 for_each_present_cpu(i)
165 cpuacct_cpuusage_write(ca, i, 0);
166
167out:
168 return err;
169}
170
171static int cpuacct_percpu_seq_read(struct cgroup *cgroup, struct cftype *cft,
172 struct seq_file *m)
173{
174 struct cpuacct *ca = cgroup_ca(cgroup);
175 u64 percpu;
176 int i;
177
178 for_each_present_cpu(i) {
179 percpu = cpuacct_cpuusage_read(ca, i);
180 seq_printf(m, "%llu ", (unsigned long long) percpu);
181 }
182 seq_printf(m, "\n");
183 return 0;
184}
185
186static const char * const cpuacct_stat_desc[] = {
187 [CPUACCT_STAT_USER] = "user",
188 [CPUACCT_STAT_SYSTEM] = "system",
189};
190
191static int cpuacct_stats_show(struct cgroup *cgrp, struct cftype *cft,
192 struct cgroup_map_cb *cb)
193{
194 struct cpuacct *ca = cgroup_ca(cgrp);
195 int cpu;
196 s64 val = 0;
197
198 for_each_online_cpu(cpu) {
199 struct kernel_cpustat *kcpustat = per_cpu_ptr(ca->cpustat, cpu);
200 val += kcpustat->cpustat[CPUTIME_USER];
201 val += kcpustat->cpustat[CPUTIME_NICE];
202 }
203 val = cputime64_to_clock_t(val);
204 cb->fill(cb, cpuacct_stat_desc[CPUACCT_STAT_USER], val);
205
206 val = 0;
207 for_each_online_cpu(cpu) {
208 struct kernel_cpustat *kcpustat = per_cpu_ptr(ca->cpustat, cpu);
209 val += kcpustat->cpustat[CPUTIME_SYSTEM];
210 val += kcpustat->cpustat[CPUTIME_IRQ];
211 val += kcpustat->cpustat[CPUTIME_SOFTIRQ];
212 }
213
214 val = cputime64_to_clock_t(val);
215 cb->fill(cb, cpuacct_stat_desc[CPUACCT_STAT_SYSTEM], val);
216
217 return 0;
218}
219
220static struct cftype files[] = {
221 {
222 .name = "usage",
223 .read_u64 = cpuusage_read,
224 .write_u64 = cpuusage_write,
225 },
226 {
227 .name = "usage_percpu",
228 .read_seq_string = cpuacct_percpu_seq_read,
229 },
230 {
231 .name = "stat",
232 .read_map = cpuacct_stats_show,
233 },
234 { } /* terminate */
235};
236
237/*
238 * charge this task's execution time to its accounting group.
239 *
240 * called with rq->lock held.
241 */
242void cpuacct_charge(struct task_struct *tsk, u64 cputime)
243{
244 struct cpuacct *ca;
245 int cpu;
246
Li Zefan2e76c242013-03-29 14:36:31 +0800247 cpu = task_cpu(tsk);
248
249 rcu_read_lock();
250
251 ca = task_ca(tsk);
252
Li Zefan543bc0e2013-03-29 14:37:29 +0800253 while (true) {
Li Zefan2e76c242013-03-29 14:36:31 +0800254 u64 *cpuusage = per_cpu_ptr(ca->cpuusage, cpu);
255 *cpuusage += cputime;
Li Zefan543bc0e2013-03-29 14:37:29 +0800256
257 ca = parent_ca(ca);
258 if (!ca)
259 break;
Li Zefan2e76c242013-03-29 14:36:31 +0800260 }
261
262 rcu_read_unlock();
263}
264
Li Zefan1966aaf2013-03-29 14:37:06 +0800265/*
266 * Add user/system time to cpuacct.
267 *
268 * Note: it's the caller that updates the account of the root cgroup.
269 */
270void cpuacct_account_field(struct task_struct *p, int index, u64 val)
271{
272 struct kernel_cpustat *kcpustat;
273 struct cpuacct *ca;
274
Li Zefan1966aaf2013-03-29 14:37:06 +0800275 rcu_read_lock();
276 ca = task_ca(p);
Li Zefan5f40d802013-03-29 14:37:43 +0800277 while (ca != &root_cpuacct) {
Li Zefan1966aaf2013-03-29 14:37:06 +0800278 kcpustat = this_cpu_ptr(ca->cpustat);
279 kcpustat->cpustat[index] += val;
Tejun Heo63876982013-08-08 20:11:23 -0400280 ca = parent_ca(ca);
Li Zefan1966aaf2013-03-29 14:37:06 +0800281 }
282 rcu_read_unlock();
283}
284
Li Zefan2e76c242013-03-29 14:36:31 +0800285struct cgroup_subsys cpuacct_subsys = {
Li Zefan621e2de2013-03-29 14:44:15 +0800286 .name = "cpuacct",
287 .css_alloc = cpuacct_css_alloc,
288 .css_free = cpuacct_css_free,
289 .subsys_id = cpuacct_subsys_id,
290 .base_cftypes = files,
291 .early_init = 1,
Li Zefan2e76c242013-03-29 14:36:31 +0800292};