#include <linux/cgroup.h>
#include <linux/slab.h>
#include <linux/percpu.h>
#include <linux/spinlock.h>
#include <linux/cpumask.h>
#include <linux/seq_file.h>
#include <linux/rcupdate.h>
#include <linux/kernel_stat.h>
#include <linux/err.h>

#include "sched.h"
/*
 * CPU accounting code for task groups.
 *
 * Based on the work by Paul Menage (menage@google.com) and Balbir Singh
 * (balbir@in.ibm.com).
 */
/* Time spent by the tasks of the cpu accounting group executing in ... */
enum cpuacct_stat_index {
	CPUACCT_STAT_USER,	/* ... user mode */
	CPUACCT_STAT_SYSTEM,	/* ... kernel mode */

	/* NOTE(review): trailing count entry restored from upstream; confirm */
	CPUACCT_STAT_NSTATS,
};
28 /* track cpu usage of a group of tasks and its child groups */
30 struct cgroup_subsys_state css
;
31 /* cpuusage holds pointer to a u64-type object on every cpu */
32 u64 __percpu
*cpuusage
;
33 struct kernel_cpustat __percpu
*cpustat
;
36 static inline struct cpuacct
*css_ca(struct cgroup_subsys_state
*css
)
38 return css
? container_of(css
, struct cpuacct
, css
) : NULL
;
41 /* return cpu accounting group corresponding to this container */
42 static inline struct cpuacct
*cgroup_ca(struct cgroup
*cgrp
)
44 return css_ca(cgroup_css(cgrp
, cpuacct_subsys_id
));
47 /* return cpu accounting group to which this task belongs */
48 static inline struct cpuacct
*task_ca(struct task_struct
*tsk
)
50 return css_ca(task_css(tsk
, cpuacct_subsys_id
));
53 static inline struct cpuacct
*__parent_ca(struct cpuacct
*ca
)
55 return cgroup_ca(ca
->css
.cgroup
->parent
);
58 static inline struct cpuacct
*parent_ca(struct cpuacct
*ca
)
60 if (!ca
->css
.cgroup
->parent
)
62 return cgroup_ca(ca
->css
.cgroup
->parent
);
65 static DEFINE_PER_CPU(u64
, root_cpuacct_cpuusage
);
66 static struct cpuacct root_cpuacct
= {
67 .cpustat
= &kernel_cpustat
,
68 .cpuusage
= &root_cpuacct_cpuusage
,
71 /* create a new cpu accounting group */
72 static struct cgroup_subsys_state
*cpuacct_css_alloc(struct cgroup
*cgrp
)
77 return &root_cpuacct
.css
;
79 ca
= kzalloc(sizeof(*ca
), GFP_KERNEL
);
83 ca
->cpuusage
= alloc_percpu(u64
);
87 ca
->cpustat
= alloc_percpu(struct kernel_cpustat
);
89 goto out_free_cpuusage
;
94 free_percpu(ca
->cpuusage
);
98 return ERR_PTR(-ENOMEM
);
101 /* destroy an existing cpu accounting group */
102 static void cpuacct_css_free(struct cgroup
*cgrp
)
104 struct cpuacct
*ca
= cgroup_ca(cgrp
);
106 free_percpu(ca
->cpustat
);
107 free_percpu(ca
->cpuusage
);
111 static u64
cpuacct_cpuusage_read(struct cpuacct
*ca
, int cpu
)
113 u64
*cpuusage
= per_cpu_ptr(ca
->cpuusage
, cpu
);
118 * Take rq->lock to make 64-bit read safe on 32-bit platforms.
120 raw_spin_lock_irq(&cpu_rq(cpu
)->lock
);
122 raw_spin_unlock_irq(&cpu_rq(cpu
)->lock
);
130 static void cpuacct_cpuusage_write(struct cpuacct
*ca
, int cpu
, u64 val
)
132 u64
*cpuusage
= per_cpu_ptr(ca
->cpuusage
, cpu
);
136 * Take rq->lock to make 64-bit write safe on 32-bit platforms.
138 raw_spin_lock_irq(&cpu_rq(cpu
)->lock
);
140 raw_spin_unlock_irq(&cpu_rq(cpu
)->lock
);
146 /* return total cpu usage (in nanoseconds) of a group */
147 static u64
cpuusage_read(struct cgroup
*cgrp
, struct cftype
*cft
)
149 struct cpuacct
*ca
= cgroup_ca(cgrp
);
150 u64 totalcpuusage
= 0;
153 for_each_present_cpu(i
)
154 totalcpuusage
+= cpuacct_cpuusage_read(ca
, i
);
156 return totalcpuusage
;
159 static int cpuusage_write(struct cgroup
*cgrp
, struct cftype
*cftype
,
162 struct cpuacct
*ca
= cgroup_ca(cgrp
);
171 for_each_present_cpu(i
)
172 cpuacct_cpuusage_write(ca
, i
, 0);
178 static int cpuacct_percpu_seq_read(struct cgroup
*cgroup
, struct cftype
*cft
,
181 struct cpuacct
*ca
= cgroup_ca(cgroup
);
185 for_each_present_cpu(i
) {
186 percpu
= cpuacct_cpuusage_read(ca
, i
);
187 seq_printf(m
, "%llu ", (unsigned long long) percpu
);
193 static const char * const cpuacct_stat_desc
[] = {
194 [CPUACCT_STAT_USER
] = "user",
195 [CPUACCT_STAT_SYSTEM
] = "system",
198 static int cpuacct_stats_show(struct cgroup
*cgrp
, struct cftype
*cft
,
199 struct cgroup_map_cb
*cb
)
201 struct cpuacct
*ca
= cgroup_ca(cgrp
);
205 for_each_online_cpu(cpu
) {
206 struct kernel_cpustat
*kcpustat
= per_cpu_ptr(ca
->cpustat
, cpu
);
207 val
+= kcpustat
->cpustat
[CPUTIME_USER
];
208 val
+= kcpustat
->cpustat
[CPUTIME_NICE
];
210 val
= cputime64_to_clock_t(val
);
211 cb
->fill(cb
, cpuacct_stat_desc
[CPUACCT_STAT_USER
], val
);
214 for_each_online_cpu(cpu
) {
215 struct kernel_cpustat
*kcpustat
= per_cpu_ptr(ca
->cpustat
, cpu
);
216 val
+= kcpustat
->cpustat
[CPUTIME_SYSTEM
];
217 val
+= kcpustat
->cpustat
[CPUTIME_IRQ
];
218 val
+= kcpustat
->cpustat
[CPUTIME_SOFTIRQ
];
221 val
= cputime64_to_clock_t(val
);
222 cb
->fill(cb
, cpuacct_stat_desc
[CPUACCT_STAT_SYSTEM
], val
);
227 static struct cftype files
[] = {
230 .read_u64
= cpuusage_read
,
231 .write_u64
= cpuusage_write
,
234 .name
= "usage_percpu",
235 .read_seq_string
= cpuacct_percpu_seq_read
,
239 .read_map
= cpuacct_stats_show
,
245 * charge this task's execution time to its accounting group.
247 * called with rq->lock held.
249 void cpuacct_charge(struct task_struct
*tsk
, u64 cputime
)
261 u64
*cpuusage
= per_cpu_ptr(ca
->cpuusage
, cpu
);
262 *cpuusage
+= cputime
;
273 * Add user/system time to cpuacct.
275 * Note: it's the caller that updates the account of the root cgroup.
277 void cpuacct_account_field(struct task_struct
*p
, int index
, u64 val
)
279 struct kernel_cpustat
*kcpustat
;
284 while (ca
!= &root_cpuacct
) {
285 kcpustat
= this_cpu_ptr(ca
->cpustat
);
286 kcpustat
->cpustat
[index
] += val
;
287 ca
= __parent_ca(ca
);
292 struct cgroup_subsys cpuacct_subsys
= {
294 .css_alloc
= cpuacct_css_alloc
,
295 .css_free
= cpuacct_css_free
,
296 .subsys_id
= cpuacct_subsys_id
,
297 .base_cftypes
= files
,