]> git.ipfire.org Git - people/arne_f/kernel.git/blame - security/device_cgroup.c
device_cgroup: rework device access check and exception checking
[people/arne_f/kernel.git] / security / device_cgroup.c
CommitLineData
08ce5f16 1/*
47c59803 2 * device_cgroup.c - device cgroup subsystem
08ce5f16
SH
3 *
4 * Copyright 2007 IBM Corp
5 */
6
7#include <linux/device_cgroup.h>
8#include <linux/cgroup.h>
9#include <linux/ctype.h>
10#include <linux/list.h>
11#include <linux/uaccess.h>
29486df3 12#include <linux/seq_file.h>
5a0e3ad6 13#include <linux/slab.h>
47c59803 14#include <linux/rcupdate.h>
b4046f00 15#include <linux/mutex.h>
08ce5f16
SH
16
/* Access bits carried in dev_exception_item.access */
#define ACC_MKNOD	0x1
#define ACC_READ	0x2
#define ACC_WRITE	0x4
#define ACC_MASK	(ACC_MKNOD | ACC_READ | ACC_WRITE)

/* Device classes carried in dev_exception_item.type */
#define DEV_BLOCK	0x1
#define DEV_CHAR	0x2
#define DEV_ALL		0x4	/* this represents all devices */
25
b4046f00
LZ
/* Held around every update of a device cgroup's behavior or exception list. */
static DEFINE_MUTEX(devcgroup_mutex);
27
c39a2a30
AR
/*
 * Default policy of a device cgroup.  It decides how the cgroup's
 * exception list is interpreted by the permission checks.
 */
enum devcg_behavior {
	/* set at allocation and when going offline; means "not online" */
	DEVCG_DEFAULT_NONE,
	/* access is granted unless an exception overlaps the request */
	DEVCG_DEFAULT_ALLOW,
	/* access is refused unless an exception fully covers the request */
	DEVCG_DEFAULT_DENY,
};
33
08ce5f16 34/*
db9aeca9 35 * exception list locking rules:
b4046f00 36 * hold devcgroup_mutex for update/read.
47c59803 37 * hold rcu_read_lock() for read.
08ce5f16
SH
38 */
39
db9aeca9 40struct dev_exception_item {
08ce5f16
SH
41 u32 major, minor;
42 short type;
43 short access;
44 struct list_head list;
4efd1a1b 45 struct rcu_head rcu;
08ce5f16
SH
46};
47
48struct dev_cgroup {
49 struct cgroup_subsys_state css;
db9aeca9 50 struct list_head exceptions;
c39a2a30 51 enum devcg_behavior behavior;
08ce5f16
SH
52};
53
b66862f7
PE
54static inline struct dev_cgroup *css_to_devcgroup(struct cgroup_subsys_state *s)
55{
a7c6d554 56 return s ? container_of(s, struct dev_cgroup, css) : NULL;
b66862f7
PE
57}
58
f92523e3
PM
59static inline struct dev_cgroup *task_devcgroup(struct task_struct *task)
60{
073219e9 61 return css_to_devcgroup(task_css(task, devices_cgrp_id));
f92523e3
PM
62}
63
08ce5f16 64/*
b4046f00 65 * called under devcgroup_mutex
08ce5f16 66 */
db9aeca9 67static int dev_exceptions_copy(struct list_head *dest, struct list_head *orig)
08ce5f16 68{
db9aeca9 69 struct dev_exception_item *ex, *tmp, *new;
08ce5f16 70
4b1c7840
TH
71 lockdep_assert_held(&devcgroup_mutex);
72
db9aeca9
AR
73 list_for_each_entry(ex, orig, list) {
74 new = kmemdup(ex, sizeof(*ex), GFP_KERNEL);
08ce5f16
SH
75 if (!new)
76 goto free_and_exit;
08ce5f16
SH
77 list_add_tail(&new->list, dest);
78 }
79
80 return 0;
81
82free_and_exit:
db9aeca9
AR
83 list_for_each_entry_safe(ex, tmp, dest, list) {
84 list_del(&ex->list);
85 kfree(ex);
08ce5f16
SH
86 }
87 return -ENOMEM;
88}
89
08ce5f16 90/*
b4046f00 91 * called under devcgroup_mutex
08ce5f16 92 */
db9aeca9
AR
93static int dev_exception_add(struct dev_cgroup *dev_cgroup,
94 struct dev_exception_item *ex)
08ce5f16 95{
db9aeca9 96 struct dev_exception_item *excopy, *walk;
08ce5f16 97
4b1c7840
TH
98 lockdep_assert_held(&devcgroup_mutex);
99
db9aeca9
AR
100 excopy = kmemdup(ex, sizeof(*ex), GFP_KERNEL);
101 if (!excopy)
08ce5f16
SH
102 return -ENOMEM;
103
db9aeca9
AR
104 list_for_each_entry(walk, &dev_cgroup->exceptions, list) {
105 if (walk->type != ex->type)
d1ee2971 106 continue;
db9aeca9 107 if (walk->major != ex->major)
d1ee2971 108 continue;
db9aeca9 109 if (walk->minor != ex->minor)
d1ee2971
PE
110 continue;
111
db9aeca9
AR
112 walk->access |= ex->access;
113 kfree(excopy);
114 excopy = NULL;
d1ee2971
PE
115 }
116
db9aeca9
AR
117 if (excopy != NULL)
118 list_add_tail_rcu(&excopy->list, &dev_cgroup->exceptions);
08ce5f16
SH
119 return 0;
120}
121
122/*
b4046f00 123 * called under devcgroup_mutex
08ce5f16 124 */
db9aeca9
AR
125static void dev_exception_rm(struct dev_cgroup *dev_cgroup,
126 struct dev_exception_item *ex)
08ce5f16 127{
db9aeca9 128 struct dev_exception_item *walk, *tmp;
08ce5f16 129
4b1c7840
TH
130 lockdep_assert_held(&devcgroup_mutex);
131
db9aeca9
AR
132 list_for_each_entry_safe(walk, tmp, &dev_cgroup->exceptions, list) {
133 if (walk->type != ex->type)
08ce5f16 134 continue;
db9aeca9 135 if (walk->major != ex->major)
08ce5f16 136 continue;
db9aeca9 137 if (walk->minor != ex->minor)
08ce5f16
SH
138 continue;
139
db9aeca9 140 walk->access &= ~ex->access;
08ce5f16 141 if (!walk->access) {
4efd1a1b 142 list_del_rcu(&walk->list);
6034f7e6 143 kfree_rcu(walk, rcu);
08ce5f16
SH
144 }
145 }
08ce5f16
SH
146}
147
53eb8c82
JS
148static void __dev_exception_clean(struct dev_cgroup *dev_cgroup)
149{
150 struct dev_exception_item *ex, *tmp;
151
152 list_for_each_entry_safe(ex, tmp, &dev_cgroup->exceptions, list) {
153 list_del_rcu(&ex->list);
154 kfree_rcu(ex, rcu);
155 }
156}
157
868539a3 158/**
db9aeca9
AR
159 * dev_exception_clean - frees all entries of the exception list
160 * @dev_cgroup: dev_cgroup with the exception list to be cleaned
868539a3
AR
161 *
162 * called under devcgroup_mutex
163 */
db9aeca9 164static void dev_exception_clean(struct dev_cgroup *dev_cgroup)
868539a3 165{
4b1c7840
TH
166 lockdep_assert_held(&devcgroup_mutex);
167
53eb8c82 168 __dev_exception_clean(dev_cgroup);
868539a3
AR
169}
170
bd2953eb
AR
171static inline bool is_devcg_online(const struct dev_cgroup *devcg)
172{
173 return (devcg->behavior != DEVCG_DEFAULT_NONE);
174}
175
1909554c
AR
176/**
177 * devcgroup_online - initializes devcgroup's behavior and exceptions based on
178 * parent's
eb95419b 179 * @css: css getting online
1909554c
AR
180 * returns 0 in case of success, error code otherwise
181 */
eb95419b 182static int devcgroup_online(struct cgroup_subsys_state *css)
1909554c 183{
eb95419b
TH
184 struct dev_cgroup *dev_cgroup = css_to_devcgroup(css);
185 struct dev_cgroup *parent_dev_cgroup = css_to_devcgroup(css_parent(css));
1909554c
AR
186 int ret = 0;
187
188 mutex_lock(&devcgroup_mutex);
1909554c
AR
189
190 if (parent_dev_cgroup == NULL)
191 dev_cgroup->behavior = DEVCG_DEFAULT_ALLOW;
192 else {
193 ret = dev_exceptions_copy(&dev_cgroup->exceptions,
194 &parent_dev_cgroup->exceptions);
195 if (!ret)
196 dev_cgroup->behavior = parent_dev_cgroup->behavior;
197 }
198 mutex_unlock(&devcgroup_mutex);
199
200 return ret;
201}
202
eb95419b 203static void devcgroup_offline(struct cgroup_subsys_state *css)
1909554c 204{
eb95419b 205 struct dev_cgroup *dev_cgroup = css_to_devcgroup(css);
1909554c
AR
206
207 mutex_lock(&devcgroup_mutex);
208 dev_cgroup->behavior = DEVCG_DEFAULT_NONE;
209 mutex_unlock(&devcgroup_mutex);
210}
211
08ce5f16
SH
212/*
213 * called from kernel/cgroup.c with cgroup_lock() held.
214 */
eb95419b
TH
215static struct cgroup_subsys_state *
216devcgroup_css_alloc(struct cgroup_subsys_state *parent_css)
08ce5f16 217{
1909554c 218 struct dev_cgroup *dev_cgroup;
08ce5f16
SH
219
220 dev_cgroup = kzalloc(sizeof(*dev_cgroup), GFP_KERNEL);
221 if (!dev_cgroup)
222 return ERR_PTR(-ENOMEM);
db9aeca9 223 INIT_LIST_HEAD(&dev_cgroup->exceptions);
1909554c 224 dev_cgroup->behavior = DEVCG_DEFAULT_NONE;
08ce5f16 225
08ce5f16
SH
226 return &dev_cgroup->css;
227}
228
/* Release a device cgroup: drop all of its exceptions, then the struct. */
static void devcgroup_css_free(struct cgroup_subsys_state *css)
{
	struct dev_cgroup *devcg = css_to_devcgroup(css);

	__dev_exception_clean(devcg);
	kfree(devcg);
}
236
/* Identifiers of the control files, stored in cftype.private */
#define DEVCG_ALLOW	1
#define DEVCG_DENY	2
#define DEVCG_LIST	3

/* Size of the buffers holding a printed major or minor number */
#define MAJMINLEN	13
/* Size of the buffer holding a printed access string ("rwm" plus NUL) */
#define ACCLEN		4
08ce5f16
SH
243
244static void set_access(char *acc, short access)
245{
246 int idx = 0;
29486df3 247 memset(acc, 0, ACCLEN);
08ce5f16
SH
248 if (access & ACC_READ)
249 acc[idx++] = 'r';
250 if (access & ACC_WRITE)
251 acc[idx++] = 'w';
252 if (access & ACC_MKNOD)
253 acc[idx++] = 'm';
254}
255
256static char type_to_char(short type)
257{
258 if (type == DEV_ALL)
259 return 'a';
260 if (type == DEV_CHAR)
261 return 'c';
262 if (type == DEV_BLOCK)
263 return 'b';
264 return 'X';
265}
266
/*
 * Print a major or minor number into @str: the wildcard value ~0 becomes
 * "*", anything else is printed as an unsigned decimal.  The caller
 * supplies a buffer large enough for the result.
 */
static void set_majmin(char *str, unsigned m)
{
	if (m != ~0U) {
		sprintf(str, "%u", m);
		return;
	}

	strcpy(str, "*");
}
274
2da8ca82 275static int devcgroup_seq_show(struct seq_file *m, void *v)
08ce5f16 276{
2da8ca82 277 struct dev_cgroup *devcgroup = css_to_devcgroup(seq_css(m));
db9aeca9 278 struct dev_exception_item *ex;
29486df3 279 char maj[MAJMINLEN], min[MAJMINLEN], acc[ACCLEN];
08ce5f16 280
4efd1a1b 281 rcu_read_lock();
ad676077
AR
282 /*
283 * To preserve the compatibility:
284 * - Only show the "all devices" when the default policy is to allow
285 * - List the exceptions in case the default policy is to deny
286 * This way, the file remains as a "whitelist of devices"
287 */
5b7aa7d5 288 if (devcgroup->behavior == DEVCG_DEFAULT_ALLOW) {
ad676077
AR
289 set_access(acc, ACC_MASK);
290 set_majmin(maj, ~0);
291 set_majmin(min, ~0);
292 seq_printf(m, "%c %s:%s %s\n", type_to_char(DEV_ALL),
29486df3 293 maj, min, acc);
ad676077 294 } else {
db9aeca9
AR
295 list_for_each_entry_rcu(ex, &devcgroup->exceptions, list) {
296 set_access(acc, ex->access);
297 set_majmin(maj, ex->major);
298 set_majmin(min, ex->minor);
299 seq_printf(m, "%c %s:%s %s\n", type_to_char(ex->type),
ad676077
AR
300 maj, min, acc);
301 }
08ce5f16 302 }
4efd1a1b 303 rcu_read_unlock();
08ce5f16 304
29486df3 305 return 0;
08ce5f16
SH
306}
307
ad676077 308/**
79d71974
AR
309 * match_exception - iterates the exception list trying to match a rule
310 * based on type, major, minor and access type. It is
311 * considered a match if an exception is found that
312 * will contain the entire range of provided parameters.
313 * @exceptions: list of exceptions
314 * @type: device type (DEV_BLOCK or DEV_CHAR)
315 * @major: device file major number, ~0 to match all
316 * @minor: device file minor number, ~0 to match all
317 * @access: permission mask (ACC_READ, ACC_WRITE, ACC_MKNOD)
318 *
319 * returns: true in case it matches an exception completely
08ce5f16 320 */
79d71974
AR
321static bool match_exception(struct list_head *exceptions, short type,
322 u32 major, u32 minor, short access)
08ce5f16 323{
db9aeca9 324 struct dev_exception_item *ex;
08ce5f16 325
79d71974
AR
326 list_for_each_entry_rcu(ex, exceptions, list) {
327 if ((type & DEV_BLOCK) && !(ex->type & DEV_BLOCK))
328 continue;
329 if ((type & DEV_CHAR) && !(ex->type & DEV_CHAR))
330 continue;
331 if (ex->major != ~0 && ex->major != major)
332 continue;
333 if (ex->minor != ~0 && ex->minor != minor)
334 continue;
335 /* provided access cannot have more than the exception rule */
336 if (access & (~ex->access))
337 continue;
338 return true;
339 }
340 return false;
341}
342
343/**
344 * match_exception_partial - iterates the exception list trying to match a rule
345 * based on type, major, minor and access type. It is
346 * considered a match if an exception's range is
347 * found to contain *any* of the devices specified by
348 * provided parameters. This is used to make sure no
349 * extra access is being granted that is forbidden by
350 * any of the exception list.
351 * @exceptions: list of exceptions
352 * @type: device type (DEV_BLOCK or DEV_CHAR)
353 * @major: device file major number, ~0 to match all
354 * @minor: device file minor number, ~0 to match all
355 * @access: permission mask (ACC_READ, ACC_WRITE, ACC_MKNOD)
356 *
357 * returns: true in case the provided range mat matches an exception completely
358 */
359static bool match_exception_partial(struct list_head *exceptions, short type,
360 u32 major, u32 minor, short access)
361{
362 struct dev_exception_item *ex;
4b1c7840 363
79d71974
AR
364 list_for_each_entry_rcu(ex, exceptions, list) {
365 if ((type & DEV_BLOCK) && !(ex->type & DEV_BLOCK))
08ce5f16 366 continue;
79d71974 367 if ((type & DEV_CHAR) && !(ex->type & DEV_CHAR))
08ce5f16 368 continue;
79d71974
AR
369 /*
370 * We must be sure that both the exception and the provided
371 * range aren't masking all devices
372 */
373 if (ex->major != ~0 && major != ~0 && ex->major != major)
08ce5f16 374 continue;
79d71974 375 if (ex->minor != ~0 && minor != ~0 && ex->minor != minor)
08ce5f16 376 continue;
79d71974
AR
377 /*
378 * In order to make sure the provided range isn't matching
379 * an exception, all its access bits shouldn't match the
380 * exception's access bits
381 */
382 if (!(access & ex->access))
08ce5f16 383 continue;
79d71974 384 return true;
08ce5f16 385 }
79d71974
AR
386 return false;
387}
388
389/**
390 * verify_new_ex - verifies if a new exception is part of what is allowed
391 * by a dev cgroup based on the default policy +
392 * exceptions. This is used to make sure a child cgroup
393 * won't have more privileges than its parent
394 * @dev_cgroup: dev cgroup to be tested against
395 * @refex: new exception
396 * @behavior: behavior of the exception's dev_cgroup
397 */
398static bool verify_new_ex(struct dev_cgroup *dev_cgroup,
399 struct dev_exception_item *refex,
400 enum devcg_behavior behavior)
401{
402 bool match = false;
403
404 rcu_lockdep_assert(rcu_read_lock_held() ||
405 lockdep_is_held(&devcgroup_mutex),
406 "device_cgroup:verify_new_ex called without proper synchronization");
ad676077 407
c39a2a30
AR
408 if (dev_cgroup->behavior == DEVCG_DEFAULT_ALLOW) {
409 if (behavior == DEVCG_DEFAULT_ALLOW) {
79d71974
AR
410 /*
411 * new exception in the child doesn't matter, only
412 * adding extra restrictions
413 */
c39a2a30
AR
414 return true;
415 } else {
79d71974
AR
416 /*
417 * new exception in the child will add more devices
418 * that can be acessed, so it can't match any of
419 * parent's exceptions, even slightly
420 */
421 match = match_exception_partial(&dev_cgroup->exceptions,
422 refex->type,
423 refex->major,
424 refex->minor,
425 refex->access);
426
c39a2a30 427 if (match)
c39a2a30 428 return false;
26898fdf 429 return true;
c39a2a30 430 }
26898fdf 431 } else {
79d71974
AR
432 /*
433 * Only behavior == DEVCG_DEFAULT_DENY allowed here, therefore
434 * the new exception will add access to more devices and must
435 * be contained completely in an parent's exception to be
436 * allowed
437 */
438 match = match_exception(&dev_cgroup->exceptions, refex->type,
439 refex->major, refex->minor,
440 refex->access);
441
c39a2a30
AR
442 if (match)
443 /* parent has an exception that matches the proposed */
26898fdf 444 return true;
c39a2a30
AR
445 else
446 return false;
26898fdf
AR
447 }
448 return false;
08ce5f16
SH
449}
450
451/*
452 * parent_has_perm:
db9aeca9 453 * when adding a new allow rule to a device exception list, the rule
08ce5f16
SH
454 * must be allowed in the parent device
455 */
f92523e3 456static int parent_has_perm(struct dev_cgroup *childcg,
db9aeca9 457 struct dev_exception_item *ex)
08ce5f16 458{
63876986 459 struct dev_cgroup *parent = css_to_devcgroup(css_parent(&childcg->css));
08ce5f16 460
63876986 461 if (!parent)
08ce5f16 462 return 1;
79d71974 463 return verify_new_ex(parent, ex, childcg->behavior);
08ce5f16
SH
464}
465
4cef7299
AR
466/**
467 * may_allow_all - checks if it's possible to change the behavior to
468 * allow based on parent's rules.
469 * @parent: device cgroup's parent
470 * returns: != 0 in case it's allowed, 0 otherwise
471 */
472static inline int may_allow_all(struct dev_cgroup *parent)
473{
64e10477
AR
474 if (!parent)
475 return 1;
4cef7299
AR
476 return parent->behavior == DEVCG_DEFAULT_ALLOW;
477}
478
bd2953eb
AR
479/**
480 * revalidate_active_exceptions - walks through the active exception list and
481 * revalidates the exceptions based on parent's
482 * behavior and exceptions. The exceptions that
483 * are no longer valid will be removed.
484 * Called with devcgroup_mutex held.
485 * @devcg: cgroup which exceptions will be checked
486 *
487 * This is one of the three key functions for hierarchy implementation.
488 * This function is responsible for re-evaluating all the cgroup's active
489 * exceptions due to a parent's exception change.
490 * Refer to Documentation/cgroups/devices.txt for more details.
491 */
492static void revalidate_active_exceptions(struct dev_cgroup *devcg)
493{
494 struct dev_exception_item *ex;
495 struct list_head *this, *tmp;
496
497 list_for_each_safe(this, tmp, &devcg->exceptions) {
498 ex = container_of(this, struct dev_exception_item, list);
499 if (!parent_has_perm(devcg, ex))
500 dev_exception_rm(devcg, ex);
501 }
502}
503
bd2953eb
AR
504/**
505 * propagate_exception - propagates a new exception to the children
506 * @devcg_root: device cgroup that added a new exception
507 * @ex: new exception to be propagated
508 *
509 * returns: 0 in case of success, != 0 in case of error
510 */
511static int propagate_exception(struct dev_cgroup *devcg_root,
512 struct dev_exception_item *ex)
513{
492eb21b 514 struct cgroup_subsys_state *pos;
bd2953eb 515 int rc = 0;
bd2953eb 516
d591fb56 517 rcu_read_lock();
bd2953eb 518
492eb21b
TH
519 css_for_each_descendant_pre(pos, &devcg_root->css) {
520 struct dev_cgroup *devcg = css_to_devcgroup(pos);
d591fb56
TH
521
522 /*
523 * Because devcgroup_mutex is held, no devcg will become
524 * online or offline during the tree walk (see on/offline
525 * methods), and online ones are safe to access outside RCU
526 * read lock without bumping refcnt.
527 */
bd8815a6 528 if (pos == &devcg_root->css || !is_devcg_online(devcg))
d591fb56
TH
529 continue;
530
531 rcu_read_unlock();
bd2953eb
AR
532
533 /*
534 * in case both root's behavior and devcg is allow, a new
535 * restriction means adding to the exception list
536 */
537 if (devcg_root->behavior == DEVCG_DEFAULT_ALLOW &&
538 devcg->behavior == DEVCG_DEFAULT_ALLOW) {
539 rc = dev_exception_add(devcg, ex);
540 if (rc)
541 break;
542 } else {
543 /*
544 * in the other possible cases:
545 * root's behavior: allow, devcg's: deny
546 * root's behavior: deny, devcg's: deny
547 * the exception will be removed
548 */
549 dev_exception_rm(devcg, ex);
550 }
551 revalidate_active_exceptions(devcg);
552
d591fb56 553 rcu_read_lock();
bd2953eb 554 }
d591fb56
TH
555
556 rcu_read_unlock();
bd2953eb
AR
557 return rc;
558}
559
560static inline bool has_children(struct dev_cgroup *devcgroup)
561{
562 struct cgroup *cgrp = devcgroup->css.cgroup;
563
564 return !list_empty(&cgrp->children);
565}
566
08ce5f16 567/*
db9aeca9 568 * Modify the exception list using allow/deny rules.
08ce5f16
SH
569 * CAP_SYS_ADMIN is needed for this. It's at least separate from CAP_MKNOD
570 * so we can give a container CAP_MKNOD to let it create devices but not
db9aeca9 571 * modify the exception list.
08ce5f16
SH
572 * It seems likely we'll want to add a CAP_CONTAINER capability to allow
573 * us to also grant CAP_SYS_ADMIN to containers without giving away the
db9aeca9 574 * device exception list controls, but for now we'll stick with CAP_SYS_ADMIN
08ce5f16
SH
575 *
576 * Taking rules away is always allowed (given CAP_SYS_ADMIN). Granting
577 * new access is only allowed if you're in the top-level cgroup, or your
578 * parent cgroup has the access you're asking for.
579 */
f92523e3 580static int devcgroup_update_access(struct dev_cgroup *devcgroup,
4d3bb511 581 int filetype, char *buffer)
08ce5f16 582{
f92523e3 583 const char *b;
26fd8405 584 char temp[12]; /* 11 + 1 characters needed for a u32 */
c39a2a30 585 int count, rc = 0;
db9aeca9 586 struct dev_exception_item ex;
63876986 587 struct dev_cgroup *parent = css_to_devcgroup(css_parent(&devcgroup->css));
08ce5f16
SH
588
589 if (!capable(CAP_SYS_ADMIN))
590 return -EPERM;
591
db9aeca9 592 memset(&ex, 0, sizeof(ex));
08ce5f16
SH
593 b = buffer;
594
595 switch (*b) {
596 case 'a':
ad676077
AR
597 switch (filetype) {
598 case DEVCG_ALLOW:
bd2953eb
AR
599 if (has_children(devcgroup))
600 return -EINVAL;
601
4cef7299 602 if (!may_allow_all(parent))
ad676077 603 return -EPERM;
db9aeca9 604 dev_exception_clean(devcgroup);
64e10477
AR
605 devcgroup->behavior = DEVCG_DEFAULT_ALLOW;
606 if (!parent)
607 break;
608
4cef7299
AR
609 rc = dev_exceptions_copy(&devcgroup->exceptions,
610 &parent->exceptions);
611 if (rc)
612 return rc;
ad676077
AR
613 break;
614 case DEVCG_DENY:
bd2953eb
AR
615 if (has_children(devcgroup))
616 return -EINVAL;
617
db9aeca9 618 dev_exception_clean(devcgroup);
5b7aa7d5 619 devcgroup->behavior = DEVCG_DEFAULT_DENY;
ad676077
AR
620 break;
621 default:
622 return -EINVAL;
623 }
624 return 0;
08ce5f16 625 case 'b':
db9aeca9 626 ex.type = DEV_BLOCK;
08ce5f16
SH
627 break;
628 case 'c':
db9aeca9 629 ex.type = DEV_CHAR;
08ce5f16
SH
630 break;
631 default:
f92523e3 632 return -EINVAL;
08ce5f16
SH
633 }
634 b++;
f92523e3
PM
635 if (!isspace(*b))
636 return -EINVAL;
08ce5f16
SH
637 b++;
638 if (*b == '*') {
db9aeca9 639 ex.major = ~0;
08ce5f16
SH
640 b++;
641 } else if (isdigit(*b)) {
26fd8405
AR
642 memset(temp, 0, sizeof(temp));
643 for (count = 0; count < sizeof(temp) - 1; count++) {
644 temp[count] = *b;
645 b++;
646 if (!isdigit(*b))
647 break;
648 }
649 rc = kstrtou32(temp, 10, &ex.major);
650 if (rc)
651 return -EINVAL;
08ce5f16 652 } else {
f92523e3 653 return -EINVAL;
08ce5f16 654 }
f92523e3
PM
655 if (*b != ':')
656 return -EINVAL;
08ce5f16
SH
657 b++;
658
659 /* read minor */
660 if (*b == '*') {
db9aeca9 661 ex.minor = ~0;
08ce5f16
SH
662 b++;
663 } else if (isdigit(*b)) {
26fd8405
AR
664 memset(temp, 0, sizeof(temp));
665 for (count = 0; count < sizeof(temp) - 1; count++) {
666 temp[count] = *b;
667 b++;
668 if (!isdigit(*b))
669 break;
670 }
671 rc = kstrtou32(temp, 10, &ex.minor);
672 if (rc)
673 return -EINVAL;
08ce5f16 674 } else {
f92523e3 675 return -EINVAL;
08ce5f16 676 }
f92523e3
PM
677 if (!isspace(*b))
678 return -EINVAL;
08ce5f16
SH
679 for (b++, count = 0; count < 3; count++, b++) {
680 switch (*b) {
681 case 'r':
db9aeca9 682 ex.access |= ACC_READ;
08ce5f16
SH
683 break;
684 case 'w':
db9aeca9 685 ex.access |= ACC_WRITE;
08ce5f16
SH
686 break;
687 case 'm':
db9aeca9 688 ex.access |= ACC_MKNOD;
08ce5f16
SH
689 break;
690 case '\n':
691 case '\0':
692 count = 3;
693 break;
694 default:
f92523e3 695 return -EINVAL;
08ce5f16
SH
696 }
697 }
698
08ce5f16
SH
699 switch (filetype) {
700 case DEVCG_ALLOW:
db9aeca9 701 if (!parent_has_perm(devcgroup, &ex))
f92523e3 702 return -EPERM;
ad676077
AR
703 /*
704 * If the default policy is to allow by default, try to remove
705 * an matching exception instead. And be silent about it: we
706 * don't want to break compatibility
707 */
5b7aa7d5 708 if (devcgroup->behavior == DEVCG_DEFAULT_ALLOW) {
db9aeca9 709 dev_exception_rm(devcgroup, &ex);
ad676077
AR
710 return 0;
711 }
bd2953eb
AR
712 rc = dev_exception_add(devcgroup, &ex);
713 break;
08ce5f16 714 case DEVCG_DENY:
ad676077
AR
715 /*
716 * If the default policy is to deny by default, try to remove
717 * an matching exception instead. And be silent about it: we
718 * don't want to break compatibility
719 */
bd2953eb 720 if (devcgroup->behavior == DEVCG_DEFAULT_DENY)
db9aeca9 721 dev_exception_rm(devcgroup, &ex);
bd2953eb
AR
722 else
723 rc = dev_exception_add(devcgroup, &ex);
724
725 if (rc)
726 break;
727 /* we only propagate new restrictions */
728 rc = propagate_exception(devcgroup, &ex);
729 break;
08ce5f16 730 default:
bd2953eb 731 rc = -EINVAL;
08ce5f16 732 }
bd2953eb 733 return rc;
f92523e3 734}
08ce5f16 735
182446d0 736static int devcgroup_access_write(struct cgroup_subsys_state *css,
4d3bb511 737 struct cftype *cft, char *buffer)
f92523e3
PM
738{
739 int retval;
b4046f00
LZ
740
741 mutex_lock(&devcgroup_mutex);
182446d0 742 retval = devcgroup_update_access(css_to_devcgroup(css),
f92523e3 743 cft->private, buffer);
b4046f00 744 mutex_unlock(&devcgroup_mutex);
08ce5f16
SH
745 return retval;
746}
747
748static struct cftype dev_cgroup_files[] = {
749 {
750 .name = "allow",
f92523e3 751 .write_string = devcgroup_access_write,
08ce5f16
SH
752 .private = DEVCG_ALLOW,
753 },
754 {
755 .name = "deny",
f92523e3 756 .write_string = devcgroup_access_write,
08ce5f16
SH
757 .private = DEVCG_DENY,
758 },
29486df3
SH
759 {
760 .name = "list",
2da8ca82 761 .seq_show = devcgroup_seq_show,
29486df3
SH
762 .private = DEVCG_LIST,
763 },
4baf6e33 764 { } /* terminate */
08ce5f16
SH
765};
766
073219e9 767struct cgroup_subsys devices_cgrp_subsys = {
92fb9748
TH
768 .css_alloc = devcgroup_css_alloc,
769 .css_free = devcgroup_css_free,
1909554c
AR
770 .css_online = devcgroup_online,
771 .css_offline = devcgroup_offline,
4baf6e33 772 .base_cftypes = dev_cgroup_files,
08ce5f16
SH
773};
774
ad676077
AR
775/**
776 * __devcgroup_check_permission - checks if an inode operation is permitted
777 * @dev_cgroup: the dev cgroup to be tested against
778 * @type: device type
779 * @major: device major number
780 * @minor: device minor number
781 * @access: combination of ACC_WRITE, ACC_READ and ACC_MKNOD
782 *
783 * returns 0 on success, -EPERM case the operation is not permitted
784 */
8c9506d1 785static int __devcgroup_check_permission(short type, u32 major, u32 minor,
ad676077 786 short access)
08ce5f16 787{
8c9506d1 788 struct dev_cgroup *dev_cgroup;
79d71974 789 bool rc;
36fd71d2 790
ad676077 791 rcu_read_lock();
8c9506d1 792 dev_cgroup = task_devcgroup(current);
79d71974
AR
793 if (dev_cgroup->behavior == DEVCG_DEFAULT_ALLOW)
794 /* Can't match any of the exceptions, even partially */
795 rc = !match_exception_partial(&dev_cgroup->exceptions,
796 type, major, minor, access);
797 else
798 /* Need to match completely one exception to be allowed */
799 rc = match_exception(&dev_cgroup->exceptions, type, major,
800 minor, access);
ad676077 801 rcu_read_unlock();
cd500819 802
ad676077
AR
803 if (!rc)
804 return -EPERM;
36fd71d2 805
ad676077
AR
806 return 0;
807}
08ce5f16 808
ad676077
AR
809int __devcgroup_inode_permission(struct inode *inode, int mask)
810{
ad676077
AR
811 short type, access = 0;
812
813 if (S_ISBLK(inode->i_mode))
814 type = DEV_BLOCK;
815 if (S_ISCHR(inode->i_mode))
816 type = DEV_CHAR;
817 if (mask & MAY_WRITE)
818 access |= ACC_WRITE;
819 if (mask & MAY_READ)
820 access |= ACC_READ;
821
8c9506d1
JS
822 return __devcgroup_check_permission(type, imajor(inode), iminor(inode),
823 access);
08ce5f16
SH
824}
825
826int devcgroup_inode_mknod(int mode, dev_t dev)
827{
ad676077 828 short type;
08ce5f16 829
0b82ac37
SH
830 if (!S_ISBLK(mode) && !S_ISCHR(mode))
831 return 0;
832
ad676077
AR
833 if (S_ISBLK(mode))
834 type = DEV_BLOCK;
835 else
836 type = DEV_CHAR;
36fd71d2 837
8c9506d1
JS
838 return __devcgroup_check_permission(type, MAJOR(dev), MINOR(dev),
839 ACC_MKNOD);
36fd71d2 840
08ce5f16 841}