]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - security/device_cgroup.c
ipv4: convert dst_metrics.refcnt from atomic_t to refcount_t
[mirror_ubuntu-artful-kernel.git] / security / device_cgroup.c
CommitLineData
08ce5f16 1/*
47c59803 2 * device_cgroup.c - device cgroup subsystem
08ce5f16
SH
3 *
4 * Copyright 2007 IBM Corp
5 */
6
7#include <linux/device_cgroup.h>
8#include <linux/cgroup.h>
9#include <linux/ctype.h>
b6450630 10#include <linux/export.h>
08ce5f16
SH
11#include <linux/list.h>
12#include <linux/uaccess.h>
29486df3 13#include <linux/seq_file.h>
5a0e3ad6 14#include <linux/slab.h>
47c59803 15#include <linux/rcupdate.h>
b4046f00 16#include <linux/mutex.h>
08ce5f16
SH
17
/* Access bits kept in dev_exception_item.access; they may be OR-ed together. */
#define ACC_MKNOD 1
#define ACC_READ 2
#define ACC_WRITE 4
#define ACC_MASK (ACC_MKNOD | ACC_READ | ACC_WRITE)

/* Device type values kept in dev_exception_item.type. */
#define DEV_BLOCK 1
#define DEV_CHAR 2
#define DEV_ALL 4 /* this represents all devices */

/* Taken around every update of a cgroup's behavior or exception list. */
static DEFINE_MUTEX(devcgroup_mutex);

/*
 * Default policy of a device cgroup.  The exception list is interpreted
 * relative to it: with DEVCG_DEFAULT_ALLOW the exceptions are the denied
 * devices, with DEVCG_DEFAULT_DENY they are the allowed ones.
 * DEVCG_DEFAULT_NONE is what css_alloc and css_offline set; is_devcg_online()
 * treats it as "not online".
 */
enum devcg_behavior {
	DEVCG_DEFAULT_NONE,
	DEVCG_DEFAULT_ALLOW,
	DEVCG_DEFAULT_DENY,
};
34
/*
 * exception list locking rules:
 * hold devcgroup_mutex for update/read.
 * hold rcu_read_lock() for read.
 */

/*
 * One entry of a cgroup's exception list: a device (or a wildcard range of
 * devices) together with the access bits the exception applies to.
 */
struct dev_exception_item {
	/* device numbers; the matchers treat ~0 as "any major/minor" */
	u32 major, minor;
	/* DEV_BLOCK or DEV_CHAR */
	short type;
	/* OR of ACC_READ, ACC_WRITE and ACC_MKNOD */
	short access;
	/* link in dev_cgroup.exceptions */
	struct list_head list;
	/* handed to kfree_rcu() when the entry is unlinked */
	struct rcu_head rcu;
};
48
/* Per-cgroup state of the devices controller. */
struct dev_cgroup {
	/* embedded css; css_to_devcgroup() maps it back with container_of() */
	struct cgroup_subsys_state css;
	/* list of struct dev_exception_item, linked through their ->list */
	struct list_head exceptions;
	/* default policy the exceptions are relative to */
	enum devcg_behavior behavior;
};
54
b66862f7
PE
55static inline struct dev_cgroup *css_to_devcgroup(struct cgroup_subsys_state *s)
56{
a7c6d554 57 return s ? container_of(s, struct dev_cgroup, css) : NULL;
b66862f7
PE
58}
59
f92523e3
PM
60static inline struct dev_cgroup *task_devcgroup(struct task_struct *task)
61{
073219e9 62 return css_to_devcgroup(task_css(task, devices_cgrp_id));
f92523e3
PM
63}
64
08ce5f16 65/*
b4046f00 66 * called under devcgroup_mutex
08ce5f16 67 */
db9aeca9 68static int dev_exceptions_copy(struct list_head *dest, struct list_head *orig)
08ce5f16 69{
db9aeca9 70 struct dev_exception_item *ex, *tmp, *new;
08ce5f16 71
4b1c7840
TH
72 lockdep_assert_held(&devcgroup_mutex);
73
db9aeca9
AR
74 list_for_each_entry(ex, orig, list) {
75 new = kmemdup(ex, sizeof(*ex), GFP_KERNEL);
08ce5f16
SH
76 if (!new)
77 goto free_and_exit;
08ce5f16
SH
78 list_add_tail(&new->list, dest);
79 }
80
81 return 0;
82
83free_and_exit:
db9aeca9
AR
84 list_for_each_entry_safe(ex, tmp, dest, list) {
85 list_del(&ex->list);
86 kfree(ex);
08ce5f16
SH
87 }
88 return -ENOMEM;
89}
90
08ce5f16 91/*
b4046f00 92 * called under devcgroup_mutex
08ce5f16 93 */
db9aeca9
AR
94static int dev_exception_add(struct dev_cgroup *dev_cgroup,
95 struct dev_exception_item *ex)
08ce5f16 96{
db9aeca9 97 struct dev_exception_item *excopy, *walk;
08ce5f16 98
4b1c7840
TH
99 lockdep_assert_held(&devcgroup_mutex);
100
db9aeca9
AR
101 excopy = kmemdup(ex, sizeof(*ex), GFP_KERNEL);
102 if (!excopy)
08ce5f16
SH
103 return -ENOMEM;
104
db9aeca9
AR
105 list_for_each_entry(walk, &dev_cgroup->exceptions, list) {
106 if (walk->type != ex->type)
d1ee2971 107 continue;
db9aeca9 108 if (walk->major != ex->major)
d1ee2971 109 continue;
db9aeca9 110 if (walk->minor != ex->minor)
d1ee2971
PE
111 continue;
112
db9aeca9
AR
113 walk->access |= ex->access;
114 kfree(excopy);
115 excopy = NULL;
d1ee2971
PE
116 }
117
db9aeca9
AR
118 if (excopy != NULL)
119 list_add_tail_rcu(&excopy->list, &dev_cgroup->exceptions);
08ce5f16
SH
120 return 0;
121}
122
123/*
b4046f00 124 * called under devcgroup_mutex
08ce5f16 125 */
db9aeca9
AR
126static void dev_exception_rm(struct dev_cgroup *dev_cgroup,
127 struct dev_exception_item *ex)
08ce5f16 128{
db9aeca9 129 struct dev_exception_item *walk, *tmp;
08ce5f16 130
4b1c7840
TH
131 lockdep_assert_held(&devcgroup_mutex);
132
db9aeca9
AR
133 list_for_each_entry_safe(walk, tmp, &dev_cgroup->exceptions, list) {
134 if (walk->type != ex->type)
08ce5f16 135 continue;
db9aeca9 136 if (walk->major != ex->major)
08ce5f16 137 continue;
db9aeca9 138 if (walk->minor != ex->minor)
08ce5f16
SH
139 continue;
140
db9aeca9 141 walk->access &= ~ex->access;
08ce5f16 142 if (!walk->access) {
4efd1a1b 143 list_del_rcu(&walk->list);
6034f7e6 144 kfree_rcu(walk, rcu);
08ce5f16
SH
145 }
146 }
08ce5f16
SH
147}
148
53eb8c82
JS
149static void __dev_exception_clean(struct dev_cgroup *dev_cgroup)
150{
151 struct dev_exception_item *ex, *tmp;
152
153 list_for_each_entry_safe(ex, tmp, &dev_cgroup->exceptions, list) {
154 list_del_rcu(&ex->list);
155 kfree_rcu(ex, rcu);
156 }
157}
158
868539a3 159/**
db9aeca9
AR
160 * dev_exception_clean - frees all entries of the exception list
161 * @dev_cgroup: dev_cgroup with the exception list to be cleaned
868539a3
AR
162 *
163 * called under devcgroup_mutex
164 */
db9aeca9 165static void dev_exception_clean(struct dev_cgroup *dev_cgroup)
868539a3 166{
4b1c7840
TH
167 lockdep_assert_held(&devcgroup_mutex);
168
53eb8c82 169 __dev_exception_clean(dev_cgroup);
868539a3
AR
170}
171
bd2953eb
AR
172static inline bool is_devcg_online(const struct dev_cgroup *devcg)
173{
174 return (devcg->behavior != DEVCG_DEFAULT_NONE);
175}
176
1909554c
AR
177/**
178 * devcgroup_online - initializes devcgroup's behavior and exceptions based on
179 * parent's
eb95419b 180 * @css: css getting online
1909554c
AR
181 * returns 0 in case of success, error code otherwise
182 */
eb95419b 183static int devcgroup_online(struct cgroup_subsys_state *css)
1909554c 184{
eb95419b 185 struct dev_cgroup *dev_cgroup = css_to_devcgroup(css);
5c9d535b 186 struct dev_cgroup *parent_dev_cgroup = css_to_devcgroup(css->parent);
1909554c
AR
187 int ret = 0;
188
189 mutex_lock(&devcgroup_mutex);
1909554c
AR
190
191 if (parent_dev_cgroup == NULL)
192 dev_cgroup->behavior = DEVCG_DEFAULT_ALLOW;
193 else {
194 ret = dev_exceptions_copy(&dev_cgroup->exceptions,
195 &parent_dev_cgroup->exceptions);
196 if (!ret)
197 dev_cgroup->behavior = parent_dev_cgroup->behavior;
198 }
199 mutex_unlock(&devcgroup_mutex);
200
201 return ret;
202}
203
eb95419b 204static void devcgroup_offline(struct cgroup_subsys_state *css)
1909554c 205{
eb95419b 206 struct dev_cgroup *dev_cgroup = css_to_devcgroup(css);
1909554c
AR
207
208 mutex_lock(&devcgroup_mutex);
209 dev_cgroup->behavior = DEVCG_DEFAULT_NONE;
210 mutex_unlock(&devcgroup_mutex);
211}
212
08ce5f16
SH
213/*
214 * called from kernel/cgroup.c with cgroup_lock() held.
215 */
eb95419b
TH
216static struct cgroup_subsys_state *
217devcgroup_css_alloc(struct cgroup_subsys_state *parent_css)
08ce5f16 218{
1909554c 219 struct dev_cgroup *dev_cgroup;
08ce5f16
SH
220
221 dev_cgroup = kzalloc(sizeof(*dev_cgroup), GFP_KERNEL);
222 if (!dev_cgroup)
223 return ERR_PTR(-ENOMEM);
db9aeca9 224 INIT_LIST_HEAD(&dev_cgroup->exceptions);
1909554c 225 dev_cgroup->behavior = DEVCG_DEFAULT_NONE;
08ce5f16 226
08ce5f16
SH
227 return &dev_cgroup->css;
228}
229
/* Release a dev_cgroup: free its remaining exceptions, then the cgroup itself. */
static void devcgroup_css_free(struct cgroup_subsys_state *css)
{
	struct dev_cgroup *devcg = css_to_devcgroup(css);

	__dev_exception_clean(devcg);
	kfree(devcg);
}
237
/* Values stored in cftype.private to tell the control files apart. */
#define DEVCG_ALLOW 1
#define DEVCG_DENY 2
#define DEVCG_LIST 3

/* Size of the buffers set_majmin() prints a major/minor number (or "*") into. */
#define MAJMINLEN 13
/* Size of the buffer set_access() fills: up to three letters plus a NUL. */
#define ACCLEN 4
08ce5f16
SH
244
245static void set_access(char *acc, short access)
246{
247 int idx = 0;
29486df3 248 memset(acc, 0, ACCLEN);
08ce5f16
SH
249 if (access & ACC_READ)
250 acc[idx++] = 'r';
251 if (access & ACC_WRITE)
252 acc[idx++] = 'w';
253 if (access & ACC_MKNOD)
254 acc[idx++] = 'm';
255}
256
257static char type_to_char(short type)
258{
259 if (type == DEV_ALL)
260 return 'a';
261 if (type == DEV_CHAR)
262 return 'c';
263 if (type == DEV_BLOCK)
264 return 'b';
265 return 'X';
266}
267
/*
 * Print a major or minor number into @str: the wildcard value ~0 becomes
 * "*", any other value is printed in decimal.  @str must be large enough
 * for the result (callers in this file pass MAJMINLEN bytes).
 */
static void set_majmin(char *str, unsigned m)
{
	if (m != ~0) {
		sprintf(str, "%u", m);
		return;
	}

	strcpy(str, "*");
}
275
2da8ca82 276static int devcgroup_seq_show(struct seq_file *m, void *v)
08ce5f16 277{
2da8ca82 278 struct dev_cgroup *devcgroup = css_to_devcgroup(seq_css(m));
db9aeca9 279 struct dev_exception_item *ex;
29486df3 280 char maj[MAJMINLEN], min[MAJMINLEN], acc[ACCLEN];
08ce5f16 281
4efd1a1b 282 rcu_read_lock();
ad676077
AR
283 /*
284 * To preserve the compatibility:
285 * - Only show the "all devices" when the default policy is to allow
286 * - List the exceptions in case the default policy is to deny
287 * This way, the file remains as a "whitelist of devices"
288 */
5b7aa7d5 289 if (devcgroup->behavior == DEVCG_DEFAULT_ALLOW) {
ad676077
AR
290 set_access(acc, ACC_MASK);
291 set_majmin(maj, ~0);
292 set_majmin(min, ~0);
293 seq_printf(m, "%c %s:%s %s\n", type_to_char(DEV_ALL),
29486df3 294 maj, min, acc);
ad676077 295 } else {
db9aeca9
AR
296 list_for_each_entry_rcu(ex, &devcgroup->exceptions, list) {
297 set_access(acc, ex->access);
298 set_majmin(maj, ex->major);
299 set_majmin(min, ex->minor);
300 seq_printf(m, "%c %s:%s %s\n", type_to_char(ex->type),
ad676077
AR
301 maj, min, acc);
302 }
08ce5f16 303 }
4efd1a1b 304 rcu_read_unlock();
08ce5f16 305
29486df3 306 return 0;
08ce5f16
SH
307}
308
ad676077 309/**
f5f3cf6f 310 * match_exception - iterates the exception list trying to find a complete match
79d71974
AR
311 * @exceptions: list of exceptions
312 * @type: device type (DEV_BLOCK or DEV_CHAR)
313 * @major: device file major number, ~0 to match all
314 * @minor: device file minor number, ~0 to match all
315 * @access: permission mask (ACC_READ, ACC_WRITE, ACC_MKNOD)
316 *
f5f3cf6f
AR
317 * It is considered a complete match if an exception is found that will
318 * contain the entire range of provided parameters.
319 *
320 * Return: true in case it matches an exception completely
08ce5f16 321 */
79d71974
AR
322static bool match_exception(struct list_head *exceptions, short type,
323 u32 major, u32 minor, short access)
08ce5f16 324{
db9aeca9 325 struct dev_exception_item *ex;
08ce5f16 326
79d71974
AR
327 list_for_each_entry_rcu(ex, exceptions, list) {
328 if ((type & DEV_BLOCK) && !(ex->type & DEV_BLOCK))
329 continue;
330 if ((type & DEV_CHAR) && !(ex->type & DEV_CHAR))
331 continue;
332 if (ex->major != ~0 && ex->major != major)
333 continue;
334 if (ex->minor != ~0 && ex->minor != minor)
335 continue;
336 /* provided access cannot have more than the exception rule */
337 if (access & (~ex->access))
338 continue;
339 return true;
340 }
341 return false;
342}
343
344/**
f5f3cf6f 345 * match_exception_partial - iterates the exception list trying to find a partial match
79d71974
AR
346 * @exceptions: list of exceptions
347 * @type: device type (DEV_BLOCK or DEV_CHAR)
348 * @major: device file major number, ~0 to match all
349 * @minor: device file minor number, ~0 to match all
350 * @access: permission mask (ACC_READ, ACC_WRITE, ACC_MKNOD)
351 *
f5f3cf6f
AR
352 * It is considered a partial match if an exception's range is found to
353 * contain *any* of the devices specified by provided parameters. This is
354 * used to make sure no extra access is being granted that is forbidden by
355 * any of the exception list.
356 *
357 * Return: true in case the provided range mat matches an exception completely
79d71974
AR
358 */
359static bool match_exception_partial(struct list_head *exceptions, short type,
360 u32 major, u32 minor, short access)
361{
362 struct dev_exception_item *ex;
4b1c7840 363
79d71974
AR
364 list_for_each_entry_rcu(ex, exceptions, list) {
365 if ((type & DEV_BLOCK) && !(ex->type & DEV_BLOCK))
08ce5f16 366 continue;
79d71974 367 if ((type & DEV_CHAR) && !(ex->type & DEV_CHAR))
08ce5f16 368 continue;
79d71974
AR
369 /*
370 * We must be sure that both the exception and the provided
371 * range aren't masking all devices
372 */
373 if (ex->major != ~0 && major != ~0 && ex->major != major)
08ce5f16 374 continue;
79d71974 375 if (ex->minor != ~0 && minor != ~0 && ex->minor != minor)
08ce5f16 376 continue;
79d71974
AR
377 /*
378 * In order to make sure the provided range isn't matching
379 * an exception, all its access bits shouldn't match the
380 * exception's access bits
381 */
382 if (!(access & ex->access))
08ce5f16 383 continue;
79d71974 384 return true;
08ce5f16 385 }
79d71974
AR
386 return false;
387}
388
389/**
f5f3cf6f 390 * verify_new_ex - verifies if a new exception is allowed by parent cgroup's permissions
79d71974
AR
391 * @dev_cgroup: dev cgroup to be tested against
392 * @refex: new exception
393 * @behavior: behavior of the exception's dev_cgroup
f5f3cf6f
AR
394 *
395 * This is used to make sure a child cgroup won't have more privileges
396 * than its parent
79d71974
AR
397 */
398static bool verify_new_ex(struct dev_cgroup *dev_cgroup,
399 struct dev_exception_item *refex,
400 enum devcg_behavior behavior)
401{
402 bool match = false;
403
f78f5b90 404 RCU_LOCKDEP_WARN(!rcu_read_lock_held() &&
dc3a04d5 405 !lockdep_is_held(&devcgroup_mutex),
f78f5b90 406 "device_cgroup:verify_new_ex called without proper synchronization");
ad676077 407
c39a2a30
AR
408 if (dev_cgroup->behavior == DEVCG_DEFAULT_ALLOW) {
409 if (behavior == DEVCG_DEFAULT_ALLOW) {
79d71974
AR
410 /*
411 * new exception in the child doesn't matter, only
412 * adding extra restrictions
413 */
c39a2a30
AR
414 return true;
415 } else {
79d71974
AR
416 /*
417 * new exception in the child will add more devices
418 * that can be acessed, so it can't match any of
419 * parent's exceptions, even slightly
420 */
421 match = match_exception_partial(&dev_cgroup->exceptions,
422 refex->type,
423 refex->major,
424 refex->minor,
425 refex->access);
426
c39a2a30 427 if (match)
c39a2a30 428 return false;
26898fdf 429 return true;
c39a2a30 430 }
26898fdf 431 } else {
79d71974
AR
432 /*
433 * Only behavior == DEVCG_DEFAULT_DENY allowed here, therefore
434 * the new exception will add access to more devices and must
435 * be contained completely in an parent's exception to be
436 * allowed
437 */
438 match = match_exception(&dev_cgroup->exceptions, refex->type,
439 refex->major, refex->minor,
440 refex->access);
441
c39a2a30
AR
442 if (match)
443 /* parent has an exception that matches the proposed */
26898fdf 444 return true;
c39a2a30
AR
445 else
446 return false;
26898fdf
AR
447 }
448 return false;
08ce5f16
SH
449}
450
451/*
452 * parent_has_perm:
db9aeca9 453 * when adding a new allow rule to a device exception list, the rule
08ce5f16
SH
454 * must be allowed in the parent device
455 */
f92523e3 456static int parent_has_perm(struct dev_cgroup *childcg,
db9aeca9 457 struct dev_exception_item *ex)
08ce5f16 458{
5c9d535b 459 struct dev_cgroup *parent = css_to_devcgroup(childcg->css.parent);
08ce5f16 460
63876986 461 if (!parent)
08ce5f16 462 return 1;
79d71974 463 return verify_new_ex(parent, ex, childcg->behavior);
08ce5f16
SH
464}
465
d2c2b11c
AR
466/**
467 * parent_allows_removal - verify if it's ok to remove an exception
468 * @childcg: child cgroup from where the exception will be removed
469 * @ex: exception being removed
470 *
471 * When removing an exception in cgroups with default ALLOW policy, it must
472 * be checked if removing it will give the child cgroup more access than the
473 * parent.
474 *
475 * Return: true if it's ok to remove exception, false otherwise
476 */
477static bool parent_allows_removal(struct dev_cgroup *childcg,
478 struct dev_exception_item *ex)
479{
5c9d535b 480 struct dev_cgroup *parent = css_to_devcgroup(childcg->css.parent);
d2c2b11c
AR
481
482 if (!parent)
483 return true;
484
485 /* It's always allowed to remove access to devices */
486 if (childcg->behavior == DEVCG_DEFAULT_DENY)
487 return true;
488
489 /*
490 * Make sure you're not removing part or a whole exception existing in
491 * the parent cgroup
492 */
493 return !match_exception_partial(&parent->exceptions, ex->type,
494 ex->major, ex->minor, ex->access);
495}
496
4cef7299
AR
497/**
498 * may_allow_all - checks if it's possible to change the behavior to
499 * allow based on parent's rules.
500 * @parent: device cgroup's parent
501 * returns: != 0 in case it's allowed, 0 otherwise
502 */
503static inline int may_allow_all(struct dev_cgroup *parent)
504{
64e10477
AR
505 if (!parent)
506 return 1;
4cef7299
AR
507 return parent->behavior == DEVCG_DEFAULT_ALLOW;
508}
509
bd2953eb
AR
510/**
511 * revalidate_active_exceptions - walks through the active exception list and
512 * revalidates the exceptions based on parent's
513 * behavior and exceptions. The exceptions that
514 * are no longer valid will be removed.
515 * Called with devcgroup_mutex held.
516 * @devcg: cgroup which exceptions will be checked
517 *
518 * This is one of the three key functions for hierarchy implementation.
519 * This function is responsible for re-evaluating all the cgroup's active
520 * exceptions due to a parent's exception change.
521 * Refer to Documentation/cgroups/devices.txt for more details.
522 */
523static void revalidate_active_exceptions(struct dev_cgroup *devcg)
524{
525 struct dev_exception_item *ex;
526 struct list_head *this, *tmp;
527
528 list_for_each_safe(this, tmp, &devcg->exceptions) {
529 ex = container_of(this, struct dev_exception_item, list);
530 if (!parent_has_perm(devcg, ex))
531 dev_exception_rm(devcg, ex);
532 }
533}
534
bd2953eb
AR
535/**
536 * propagate_exception - propagates a new exception to the children
537 * @devcg_root: device cgroup that added a new exception
538 * @ex: new exception to be propagated
539 *
540 * returns: 0 in case of success, != 0 in case of error
541 */
542static int propagate_exception(struct dev_cgroup *devcg_root,
543 struct dev_exception_item *ex)
544{
492eb21b 545 struct cgroup_subsys_state *pos;
bd2953eb 546 int rc = 0;
bd2953eb 547
d591fb56 548 rcu_read_lock();
bd2953eb 549
492eb21b
TH
550 css_for_each_descendant_pre(pos, &devcg_root->css) {
551 struct dev_cgroup *devcg = css_to_devcgroup(pos);
d591fb56
TH
552
553 /*
554 * Because devcgroup_mutex is held, no devcg will become
555 * online or offline during the tree walk (see on/offline
556 * methods), and online ones are safe to access outside RCU
557 * read lock without bumping refcnt.
558 */
bd8815a6 559 if (pos == &devcg_root->css || !is_devcg_online(devcg))
d591fb56
TH
560 continue;
561
562 rcu_read_unlock();
bd2953eb
AR
563
564 /*
565 * in case both root's behavior and devcg is allow, a new
566 * restriction means adding to the exception list
567 */
568 if (devcg_root->behavior == DEVCG_DEFAULT_ALLOW &&
569 devcg->behavior == DEVCG_DEFAULT_ALLOW) {
570 rc = dev_exception_add(devcg, ex);
571 if (rc)
572 break;
573 } else {
574 /*
575 * in the other possible cases:
576 * root's behavior: allow, devcg's: deny
577 * root's behavior: deny, devcg's: deny
578 * the exception will be removed
579 */
580 dev_exception_rm(devcg, ex);
581 }
582 revalidate_active_exceptions(devcg);
583
d591fb56 584 rcu_read_lock();
bd2953eb 585 }
d591fb56
TH
586
587 rcu_read_unlock();
bd2953eb
AR
588 return rc;
589}
590
/*
 * Modify the exception list using allow/deny rules.
 * CAP_SYS_ADMIN is needed for this.  It's at least separate from CAP_MKNOD
 * so we can give a container CAP_MKNOD to let it create devices but not
 * modify the exception list.
 * It seems likely we'll want to add a CAP_CONTAINER capability to allow
 * us to also grant CAP_SYS_ADMIN to containers without giving away the
 * device exception list controls, but for now we'll stick with CAP_SYS_ADMIN
 *
 * Taking rules away is always allowed (given CAP_SYS_ADMIN).  Granting
 * new access is only allowed if you're in the top-level cgroup, or your
 * parent cgroup has the access you're asking for.
 *
 * @buffer is parsed as "<type> <major>:<minor> <access>", where <type> is
 * 'a', 'b' or 'c', <major> and <minor> are decimal numbers or '*', and
 * <access> is made of up to three of the letters 'r', 'w' and 'm'.  For
 * type 'a' nothing after the first character is parsed.  @filetype is
 * DEVCG_ALLOW or DEVCG_DENY, depending on the file that was written.
 *
 * Returns 0 on success or a negative errno (-EPERM, -EINVAL, -ENOMEM).
 * The only caller in this file invokes it with devcgroup_mutex held.
 */
static int devcgroup_update_access(struct dev_cgroup *devcgroup,
				   int filetype, char *buffer)
{
	const char *b;
	/* room for 11 digits plus the terminating NUL; a u32 needs at most 10 */
	char temp[12];
	int count, rc = 0;
	struct dev_exception_item ex;
	struct dev_cgroup *parent = css_to_devcgroup(devcgroup->css.parent);

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	memset(&ex, 0, sizeof(ex));
	b = buffer;

	/* first character: device type, or 'a' to reset the whole policy */
	switch (*b) {
	case 'a':
		switch (filetype) {
		case DEVCG_ALLOW:
			/* refused while the cgroup has online children */
			if (css_has_online_children(&devcgroup->css))
				return -EINVAL;

			if (!may_allow_all(parent))
				return -EPERM;
			dev_exception_clean(devcgroup);
			devcgroup->behavior = DEVCG_DEFAULT_ALLOW;
			if (!parent)
				break;

			/* start over from a copy of the parent's exceptions */
			rc = dev_exceptions_copy(&devcgroup->exceptions,
						 &parent->exceptions);
			if (rc)
				return rc;
			break;
		case DEVCG_DENY:
			/* refused while the cgroup has online children */
			if (css_has_online_children(&devcgroup->css))
				return -EINVAL;

			dev_exception_clean(devcgroup);
			devcgroup->behavior = DEVCG_DEFAULT_DENY;
			break;
		default:
			return -EINVAL;
		}
		return 0;
	case 'b':
		ex.type = DEV_BLOCK;
		break;
	case 'c':
		ex.type = DEV_CHAR;
		break;
	default:
		return -EINVAL;
	}
	b++;
	if (!isspace(*b))
		return -EINVAL;
	b++;

	/* read major */
	if (*b == '*') {
		ex.major = ~0;
		b++;
	} else if (isdigit(*b)) {
		/*
		 * Copy the run of digits into temp.  If the run is longer
		 * than temp can hold, b is left on a digit and the ':' check
		 * below rejects the input.
		 */
		memset(temp, 0, sizeof(temp));
		for (count = 0; count < sizeof(temp) - 1; count++) {
			temp[count] = *b;
			b++;
			if (!isdigit(*b))
				break;
		}
		rc = kstrtou32(temp, 10, &ex.major);
		if (rc)
			return -EINVAL;
	} else {
		return -EINVAL;
	}
	if (*b != ':')
		return -EINVAL;
	b++;

	/* read minor */
	if (*b == '*') {
		ex.minor = ~0;
		b++;
	} else if (isdigit(*b)) {
		/* same digit-run copy as for the major number */
		memset(temp, 0, sizeof(temp));
		for (count = 0; count < sizeof(temp) - 1; count++) {
			temp[count] = *b;
			b++;
			if (!isdigit(*b))
				break;
		}
		rc = kstrtou32(temp, 10, &ex.minor);
		if (rc)
			return -EINVAL;
	} else {
		return -EINVAL;
	}
	if (!isspace(*b))
		return -EINVAL;

	/* read up to three access letters; a newline or NUL ends the list */
	for (b++, count = 0; count < 3; count++, b++) {
		switch (*b) {
		case 'r':
			ex.access |= ACC_READ;
			break;
		case 'w':
			ex.access |= ACC_WRITE;
			break;
		case 'm':
			ex.access |= ACC_MKNOD;
			break;
		case '\n':
		case '\0':
			/* forces the loop condition to fail */
			count = 3;
			break;
		default:
			return -EINVAL;
		}
	}

	switch (filetype) {
	case DEVCG_ALLOW:
		/*
		 * If the default policy is to allow by default, try to remove
		 * a matching exception instead. And be silent about it: we
		 * don't want to break compatibility
		 */
		if (devcgroup->behavior == DEVCG_DEFAULT_ALLOW) {
			/* Check if the parent allows removing it first */
			if (!parent_allows_removal(devcgroup, &ex))
				return -EPERM;
			dev_exception_rm(devcgroup, &ex);
			break;
		}

		if (!parent_has_perm(devcgroup, &ex))
			return -EPERM;
		rc = dev_exception_add(devcgroup, &ex);
		break;
	case DEVCG_DENY:
		/*
		 * If the default policy is to deny by default, try to remove
		 * a matching exception instead. And be silent about it: we
		 * don't want to break compatibility
		 */
		if (devcgroup->behavior == DEVCG_DEFAULT_DENY)
			dev_exception_rm(devcgroup, &ex);
		else
			rc = dev_exception_add(devcgroup, &ex);

		if (rc)
			break;
		/* we only propagate new restrictions */
		rc = propagate_exception(devcgroup, &ex);
		break;
	default:
		rc = -EINVAL;
	}
	return rc;
}
08ce5f16 763
451af504
TH
764static ssize_t devcgroup_access_write(struct kernfs_open_file *of,
765 char *buf, size_t nbytes, loff_t off)
f92523e3
PM
766{
767 int retval;
b4046f00
LZ
768
769 mutex_lock(&devcgroup_mutex);
451af504
TH
770 retval = devcgroup_update_access(css_to_devcgroup(of_css(of)),
771 of_cft(of)->private, strstrip(buf));
b4046f00 772 mutex_unlock(&devcgroup_mutex);
451af504 773 return retval ?: nbytes;
08ce5f16
SH
774}
775
/*
 * Control files of the controller.  "allow" and "deny" share one write
 * handler, which reads ->private to tell them apart; "list" is read through
 * the seq_file show handler.
 */
static struct cftype dev_cgroup_files[] = {
	{
		.name = "allow",
		.write = devcgroup_access_write,
		.private = DEVCG_ALLOW,
	},
	{
		.name = "deny",
		.write = devcgroup_access_write,
		.private = DEVCG_DENY,
	},
	{
		.name = "list",
		.seq_show = devcgroup_seq_show,
		.private = DEVCG_LIST,
	},
	{ }	/* terminate */
};
794
/*
 * Subsystem descriptor: the css lifecycle callbacks defined in this file
 * plus the control files, which are installed as legacy cftypes.
 */
struct cgroup_subsys devices_cgrp_subsys = {
	.css_alloc = devcgroup_css_alloc,
	.css_free = devcgroup_css_free,
	.css_online = devcgroup_online,
	.css_offline = devcgroup_offline,
	.legacy_cftypes = dev_cgroup_files,
};
802
ad676077
AR
803/**
804 * __devcgroup_check_permission - checks if an inode operation is permitted
805 * @dev_cgroup: the dev cgroup to be tested against
806 * @type: device type
807 * @major: device major number
808 * @minor: device minor number
809 * @access: combination of ACC_WRITE, ACC_READ and ACC_MKNOD
810 *
811 * returns 0 on success, -EPERM case the operation is not permitted
812 */
8c9506d1 813static int __devcgroup_check_permission(short type, u32 major, u32 minor,
ad676077 814 short access)
08ce5f16 815{
8c9506d1 816 struct dev_cgroup *dev_cgroup;
79d71974 817 bool rc;
36fd71d2 818
ad676077 819 rcu_read_lock();
8c9506d1 820 dev_cgroup = task_devcgroup(current);
79d71974
AR
821 if (dev_cgroup->behavior == DEVCG_DEFAULT_ALLOW)
822 /* Can't match any of the exceptions, even partially */
823 rc = !match_exception_partial(&dev_cgroup->exceptions,
824 type, major, minor, access);
825 else
826 /* Need to match completely one exception to be allowed */
827 rc = match_exception(&dev_cgroup->exceptions, type, major,
828 minor, access);
ad676077 829 rcu_read_unlock();
cd500819 830
ad676077
AR
831 if (!rc)
832 return -EPERM;
36fd71d2 833
ad676077
AR
834 return 0;
835}
08ce5f16 836
ad676077
AR
837int __devcgroup_inode_permission(struct inode *inode, int mask)
838{
ad676077
AR
839 short type, access = 0;
840
841 if (S_ISBLK(inode->i_mode))
842 type = DEV_BLOCK;
843 if (S_ISCHR(inode->i_mode))
844 type = DEV_CHAR;
845 if (mask & MAY_WRITE)
846 access |= ACC_WRITE;
847 if (mask & MAY_READ)
848 access |= ACC_READ;
849
8c9506d1
JS
850 return __devcgroup_check_permission(type, imajor(inode), iminor(inode),
851 access);
08ce5f16 852}
b6450630 853EXPORT_SYMBOL_GPL(__devcgroup_inode_permission);
08ce5f16
SH
854
855int devcgroup_inode_mknod(int mode, dev_t dev)
856{
ad676077 857 short type;
08ce5f16 858
0b82ac37
SH
859 if (!S_ISBLK(mode) && !S_ISCHR(mode))
860 return 0;
861
ad676077
AR
862 if (S_ISBLK(mode))
863 type = DEV_BLOCK;
864 else
865 type = DEV_CHAR;
36fd71d2 866
8c9506d1
JS
867 return __devcgroup_check_permission(type, MAJOR(dev), MINOR(dev),
868 ACC_MKNOD);
36fd71d2 869
08ce5f16 870}