]> git.ipfire.org Git - thirdparty/kernel/linux.git/blob - fs/xattr.c
Merge tag 'riscv-soc-fixes-for-v6.9-rc3' of https://git.kernel.org/pub/scm/linux...
[thirdparty/kernel/linux.git] / fs / xattr.c
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 File: fs/xattr.c
4
5 Extended attribute handling.
6
7 Copyright (C) 2001 by Andreas Gruenbacher <a.gruenbacher@computer.org>
8 Copyright (C) 2001 SGI - Silicon Graphics, Inc <linux-xfs@oss.sgi.com>
9 Copyright (c) 2004 Red Hat, Inc., James Morris <jmorris@redhat.com>
10 */
11 #include <linux/fs.h>
12 #include <linux/filelock.h>
13 #include <linux/slab.h>
14 #include <linux/file.h>
15 #include <linux/xattr.h>
16 #include <linux/mount.h>
17 #include <linux/namei.h>
18 #include <linux/security.h>
19 #include <linux/syscalls.h>
20 #include <linux/export.h>
21 #include <linux/fsnotify.h>
22 #include <linux/audit.h>
23 #include <linux/vmalloc.h>
24 #include <linux/posix_acl_xattr.h>
25
26 #include <linux/uaccess.h>
27
28 #include "internal.h"
29
30 static const char *
31 strcmp_prefix(const char *a, const char *a_prefix)
32 {
33 while (*a_prefix && *a == *a_prefix) {
34 a++;
35 a_prefix++;
36 }
37 return *a_prefix ? NULL : a;
38 }
39
40 /*
41 * In order to implement different sets of xattr operations for each xattr
42 * prefix, a filesystem should create a null-terminated array of struct
43 * xattr_handler (one for each prefix) and hang a pointer to it off of the
44 * s_xattr field of the superblock.
45 */
46 #define for_each_xattr_handler(handlers, handler) \
47 if (handlers) \
48 for ((handler) = *(handlers)++; \
49 (handler) != NULL; \
50 (handler) = *(handlers)++)
51
52 /*
53 * Find the xattr_handler with the matching prefix.
54 */
55 static const struct xattr_handler *
56 xattr_resolve_name(struct inode *inode, const char **name)
57 {
58 const struct xattr_handler * const *handlers = inode->i_sb->s_xattr;
59 const struct xattr_handler *handler;
60
61 if (!(inode->i_opflags & IOP_XATTR)) {
62 if (unlikely(is_bad_inode(inode)))
63 return ERR_PTR(-EIO);
64 return ERR_PTR(-EOPNOTSUPP);
65 }
66 for_each_xattr_handler(handlers, handler) {
67 const char *n;
68
69 n = strcmp_prefix(*name, xattr_prefix(handler));
70 if (n) {
71 if (!handler->prefix ^ !*n) {
72 if (*n)
73 continue;
74 return ERR_PTR(-EINVAL);
75 }
76 *name = n;
77 return handler;
78 }
79 }
80 return ERR_PTR(-EOPNOTSUPP);
81 }
82
83 /**
84 * may_write_xattr - check whether inode allows writing xattr
85 * @idmap: idmap of the mount the inode was found from
86 * @inode: the inode on which to set an xattr
87 *
88 * Check whether the inode allows writing xattrs. Specifically, we can never
89 * set or remove an extended attribute on a read-only filesystem or on an
90 * immutable / append-only inode.
91 *
92 * We also need to ensure that the inode has a mapping in the mount to
93 * not risk writing back invalid i_{g,u}id values.
94 *
95 * Return: On success zero is returned. On error a negative errno is returned.
96 */
97 int may_write_xattr(struct mnt_idmap *idmap, struct inode *inode)
98 {
99 if (IS_IMMUTABLE(inode))
100 return -EPERM;
101 if (IS_APPEND(inode))
102 return -EPERM;
103 if (HAS_UNMAPPED_ID(idmap, inode))
104 return -EPERM;
105 return 0;
106 }
107
108 /*
109 * Check permissions for extended attribute access. This is a bit complicated
110 * because different namespaces have very different rules.
111 */
112 static int
113 xattr_permission(struct mnt_idmap *idmap, struct inode *inode,
114 const char *name, int mask)
115 {
116 if (mask & MAY_WRITE) {
117 int ret;
118
119 ret = may_write_xattr(idmap, inode);
120 if (ret)
121 return ret;
122 }
123
124 /*
125 * No restriction for security.* and system.* from the VFS. Decision
126 * on these is left to the underlying filesystem / security module.
127 */
128 if (!strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) ||
129 !strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
130 return 0;
131
132 /*
133 * The trusted.* namespace can only be accessed by privileged users.
134 */
135 if (!strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN)) {
136 if (!capable(CAP_SYS_ADMIN))
137 return (mask & MAY_WRITE) ? -EPERM : -ENODATA;
138 return 0;
139 }
140
141 /*
142 * In the user.* namespace, only regular files and directories can have
143 * extended attributes. For sticky directories, only the owner and
144 * privileged users can write attributes.
145 */
146 if (!strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN)) {
147 if (!S_ISREG(inode->i_mode) && !S_ISDIR(inode->i_mode))
148 return (mask & MAY_WRITE) ? -EPERM : -ENODATA;
149 if (S_ISDIR(inode->i_mode) && (inode->i_mode & S_ISVTX) &&
150 (mask & MAY_WRITE) &&
151 !inode_owner_or_capable(idmap, inode))
152 return -EPERM;
153 }
154
155 return inode_permission(idmap, inode, mask);
156 }
157
158 /*
159 * Look for any handler that deals with the specified namespace.
160 */
161 int
162 xattr_supports_user_prefix(struct inode *inode)
163 {
164 const struct xattr_handler * const *handlers = inode->i_sb->s_xattr;
165 const struct xattr_handler *handler;
166
167 if (!(inode->i_opflags & IOP_XATTR)) {
168 if (unlikely(is_bad_inode(inode)))
169 return -EIO;
170 return -EOPNOTSUPP;
171 }
172
173 for_each_xattr_handler(handlers, handler) {
174 if (!strncmp(xattr_prefix(handler), XATTR_USER_PREFIX,
175 XATTR_USER_PREFIX_LEN))
176 return 0;
177 }
178
179 return -EOPNOTSUPP;
180 }
181 EXPORT_SYMBOL(xattr_supports_user_prefix);
182
183 int
184 __vfs_setxattr(struct mnt_idmap *idmap, struct dentry *dentry,
185 struct inode *inode, const char *name, const void *value,
186 size_t size, int flags)
187 {
188 const struct xattr_handler *handler;
189
190 if (is_posix_acl_xattr(name))
191 return -EOPNOTSUPP;
192
193 handler = xattr_resolve_name(inode, &name);
194 if (IS_ERR(handler))
195 return PTR_ERR(handler);
196 if (!handler->set)
197 return -EOPNOTSUPP;
198 if (size == 0)
199 value = ""; /* empty EA, do not remove */
200 return handler->set(handler, idmap, dentry, inode, name, value,
201 size, flags);
202 }
203 EXPORT_SYMBOL(__vfs_setxattr);
204
205 /**
206 * __vfs_setxattr_noperm - perform setxattr operation without performing
207 * permission checks.
208 *
209 * @idmap: idmap of the mount the inode was found from
210 * @dentry: object to perform setxattr on
211 * @name: xattr name to set
212 * @value: value to set @name to
213 * @size: size of @value
214 * @flags: flags to pass into filesystem operations
215 *
216 * returns the result of the internal setxattr or setsecurity operations.
217 *
218 * This function requires the caller to lock the inode's i_mutex before it
219 * is executed. It also assumes that the caller will make the appropriate
220 * permission checks.
221 */
222 int __vfs_setxattr_noperm(struct mnt_idmap *idmap,
223 struct dentry *dentry, const char *name,
224 const void *value, size_t size, int flags)
225 {
226 struct inode *inode = dentry->d_inode;
227 int error = -EAGAIN;
228 int issec = !strncmp(name, XATTR_SECURITY_PREFIX,
229 XATTR_SECURITY_PREFIX_LEN);
230
231 if (issec)
232 inode->i_flags &= ~S_NOSEC;
233 if (inode->i_opflags & IOP_XATTR) {
234 error = __vfs_setxattr(idmap, dentry, inode, name, value,
235 size, flags);
236 if (!error) {
237 fsnotify_xattr(dentry);
238 security_inode_post_setxattr(dentry, name, value,
239 size, flags);
240 }
241 } else {
242 if (unlikely(is_bad_inode(inode)))
243 return -EIO;
244 }
245 if (error == -EAGAIN) {
246 error = -EOPNOTSUPP;
247
248 if (issec) {
249 const char *suffix = name + XATTR_SECURITY_PREFIX_LEN;
250
251 error = security_inode_setsecurity(inode, suffix, value,
252 size, flags);
253 if (!error)
254 fsnotify_xattr(dentry);
255 }
256 }
257
258 return error;
259 }
260
261 /**
262 * __vfs_setxattr_locked - set an extended attribute while holding the inode
263 * lock
264 *
265 * @idmap: idmap of the mount of the target inode
266 * @dentry: object to perform setxattr on
267 * @name: xattr name to set
268 * @value: value to set @name to
269 * @size: size of @value
270 * @flags: flags to pass into filesystem operations
271 * @delegated_inode: on return, will contain an inode pointer that
272 * a delegation was broken on, NULL if none.
273 */
274 int
275 __vfs_setxattr_locked(struct mnt_idmap *idmap, struct dentry *dentry,
276 const char *name, const void *value, size_t size,
277 int flags, struct inode **delegated_inode)
278 {
279 struct inode *inode = dentry->d_inode;
280 int error;
281
282 error = xattr_permission(idmap, inode, name, MAY_WRITE);
283 if (error)
284 return error;
285
286 error = security_inode_setxattr(idmap, dentry, name, value, size,
287 flags);
288 if (error)
289 goto out;
290
291 error = try_break_deleg(inode, delegated_inode);
292 if (error)
293 goto out;
294
295 error = __vfs_setxattr_noperm(idmap, dentry, name, value,
296 size, flags);
297
298 out:
299 return error;
300 }
301 EXPORT_SYMBOL_GPL(__vfs_setxattr_locked);
302
303 int
304 vfs_setxattr(struct mnt_idmap *idmap, struct dentry *dentry,
305 const char *name, const void *value, size_t size, int flags)
306 {
307 struct inode *inode = dentry->d_inode;
308 struct inode *delegated_inode = NULL;
309 const void *orig_value = value;
310 int error;
311
312 if (size && strcmp(name, XATTR_NAME_CAPS) == 0) {
313 error = cap_convert_nscap(idmap, dentry, &value, size);
314 if (error < 0)
315 return error;
316 size = error;
317 }
318
319 retry_deleg:
320 inode_lock(inode);
321 error = __vfs_setxattr_locked(idmap, dentry, name, value, size,
322 flags, &delegated_inode);
323 inode_unlock(inode);
324
325 if (delegated_inode) {
326 error = break_deleg_wait(&delegated_inode);
327 if (!error)
328 goto retry_deleg;
329 }
330 if (value != orig_value)
331 kfree(value);
332
333 return error;
334 }
335 EXPORT_SYMBOL_GPL(vfs_setxattr);
336
337 static ssize_t
338 xattr_getsecurity(struct mnt_idmap *idmap, struct inode *inode,
339 const char *name, void *value, size_t size)
340 {
341 void *buffer = NULL;
342 ssize_t len;
343
344 if (!value || !size) {
345 len = security_inode_getsecurity(idmap, inode, name,
346 &buffer, false);
347 goto out_noalloc;
348 }
349
350 len = security_inode_getsecurity(idmap, inode, name, &buffer,
351 true);
352 if (len < 0)
353 return len;
354 if (size < len) {
355 len = -ERANGE;
356 goto out;
357 }
358 memcpy(value, buffer, len);
359 out:
360 kfree(buffer);
361 out_noalloc:
362 return len;
363 }
364
365 /*
366 * vfs_getxattr_alloc - allocate memory, if necessary, before calling getxattr
367 *
368 * Allocate memory, if not already allocated, or re-allocate correct size,
369 * before retrieving the extended attribute. The xattr value buffer should
370 * always be freed by the caller, even on error.
371 *
372 * Returns the result of alloc, if failed, or the getxattr operation.
373 */
374 int
375 vfs_getxattr_alloc(struct mnt_idmap *idmap, struct dentry *dentry,
376 const char *name, char **xattr_value, size_t xattr_size,
377 gfp_t flags)
378 {
379 const struct xattr_handler *handler;
380 struct inode *inode = dentry->d_inode;
381 char *value = *xattr_value;
382 int error;
383
384 error = xattr_permission(idmap, inode, name, MAY_READ);
385 if (error)
386 return error;
387
388 handler = xattr_resolve_name(inode, &name);
389 if (IS_ERR(handler))
390 return PTR_ERR(handler);
391 if (!handler->get)
392 return -EOPNOTSUPP;
393 error = handler->get(handler, dentry, inode, name, NULL, 0);
394 if (error < 0)
395 return error;
396
397 if (!value || (error > xattr_size)) {
398 value = krealloc(*xattr_value, error + 1, flags);
399 if (!value)
400 return -ENOMEM;
401 memset(value, 0, error + 1);
402 }
403
404 error = handler->get(handler, dentry, inode, name, value, error);
405 *xattr_value = value;
406 return error;
407 }
408
409 ssize_t
410 __vfs_getxattr(struct dentry *dentry, struct inode *inode, const char *name,
411 void *value, size_t size)
412 {
413 const struct xattr_handler *handler;
414
415 if (is_posix_acl_xattr(name))
416 return -EOPNOTSUPP;
417
418 handler = xattr_resolve_name(inode, &name);
419 if (IS_ERR(handler))
420 return PTR_ERR(handler);
421 if (!handler->get)
422 return -EOPNOTSUPP;
423 return handler->get(handler, dentry, inode, name, value, size);
424 }
425 EXPORT_SYMBOL(__vfs_getxattr);
426
427 ssize_t
428 vfs_getxattr(struct mnt_idmap *idmap, struct dentry *dentry,
429 const char *name, void *value, size_t size)
430 {
431 struct inode *inode = dentry->d_inode;
432 int error;
433
434 error = xattr_permission(idmap, inode, name, MAY_READ);
435 if (error)
436 return error;
437
438 error = security_inode_getxattr(dentry, name);
439 if (error)
440 return error;
441
442 if (!strncmp(name, XATTR_SECURITY_PREFIX,
443 XATTR_SECURITY_PREFIX_LEN)) {
444 const char *suffix = name + XATTR_SECURITY_PREFIX_LEN;
445 int ret = xattr_getsecurity(idmap, inode, suffix, value,
446 size);
447 /*
448 * Only overwrite the return value if a security module
449 * is actually active.
450 */
451 if (ret == -EOPNOTSUPP)
452 goto nolsm;
453 return ret;
454 }
455 nolsm:
456 return __vfs_getxattr(dentry, inode, name, value, size);
457 }
458 EXPORT_SYMBOL_GPL(vfs_getxattr);
459
460 /**
461 * vfs_listxattr - retrieve \0 separated list of xattr names
462 * @dentry: the dentry from whose inode the xattr names are retrieved
463 * @list: buffer to store xattr names into
464 * @size: size of the buffer
465 *
466 * This function returns the names of all xattrs associated with the
467 * inode of @dentry.
468 *
469 * Note, for legacy reasons the vfs_listxattr() function lists POSIX
470 * ACLs as well. Since POSIX ACLs are decoupled from IOP_XATTR the
471 * vfs_listxattr() function doesn't check for this flag since a
472 * filesystem could implement POSIX ACLs without implementing any other
473 * xattrs.
474 *
475 * However, since all codepaths that remove IOP_XATTR also assign of
476 * inode operations that either don't implement or implement a stub
477 * ->listxattr() operation.
478 *
479 * Return: On success, the size of the buffer that was used. On error a
480 * negative error code.
481 */
482 ssize_t
483 vfs_listxattr(struct dentry *dentry, char *list, size_t size)
484 {
485 struct inode *inode = d_inode(dentry);
486 ssize_t error;
487
488 error = security_inode_listxattr(dentry);
489 if (error)
490 return error;
491
492 if (inode->i_op->listxattr) {
493 error = inode->i_op->listxattr(dentry, list, size);
494 } else {
495 error = security_inode_listsecurity(inode, list, size);
496 if (size && error > size)
497 error = -ERANGE;
498 }
499 return error;
500 }
501 EXPORT_SYMBOL_GPL(vfs_listxattr);
502
503 int
504 __vfs_removexattr(struct mnt_idmap *idmap, struct dentry *dentry,
505 const char *name)
506 {
507 struct inode *inode = d_inode(dentry);
508 const struct xattr_handler *handler;
509
510 if (is_posix_acl_xattr(name))
511 return -EOPNOTSUPP;
512
513 handler = xattr_resolve_name(inode, &name);
514 if (IS_ERR(handler))
515 return PTR_ERR(handler);
516 if (!handler->set)
517 return -EOPNOTSUPP;
518 return handler->set(handler, idmap, dentry, inode, name, NULL, 0,
519 XATTR_REPLACE);
520 }
521 EXPORT_SYMBOL(__vfs_removexattr);
522
523 /**
524 * __vfs_removexattr_locked - set an extended attribute while holding the inode
525 * lock
526 *
527 * @idmap: idmap of the mount of the target inode
528 * @dentry: object to perform setxattr on
529 * @name: name of xattr to remove
530 * @delegated_inode: on return, will contain an inode pointer that
531 * a delegation was broken on, NULL if none.
532 */
533 int
534 __vfs_removexattr_locked(struct mnt_idmap *idmap,
535 struct dentry *dentry, const char *name,
536 struct inode **delegated_inode)
537 {
538 struct inode *inode = dentry->d_inode;
539 int error;
540
541 error = xattr_permission(idmap, inode, name, MAY_WRITE);
542 if (error)
543 return error;
544
545 error = security_inode_removexattr(idmap, dentry, name);
546 if (error)
547 goto out;
548
549 error = try_break_deleg(inode, delegated_inode);
550 if (error)
551 goto out;
552
553 error = __vfs_removexattr(idmap, dentry, name);
554 if (error)
555 return error;
556
557 fsnotify_xattr(dentry);
558 security_inode_post_removexattr(dentry, name);
559
560 out:
561 return error;
562 }
563 EXPORT_SYMBOL_GPL(__vfs_removexattr_locked);
564
565 int
566 vfs_removexattr(struct mnt_idmap *idmap, struct dentry *dentry,
567 const char *name)
568 {
569 struct inode *inode = dentry->d_inode;
570 struct inode *delegated_inode = NULL;
571 int error;
572
573 retry_deleg:
574 inode_lock(inode);
575 error = __vfs_removexattr_locked(idmap, dentry,
576 name, &delegated_inode);
577 inode_unlock(inode);
578
579 if (delegated_inode) {
580 error = break_deleg_wait(&delegated_inode);
581 if (!error)
582 goto retry_deleg;
583 }
584
585 return error;
586 }
587 EXPORT_SYMBOL_GPL(vfs_removexattr);
588
589 /*
590 * Extended attribute SET operations
591 */
592
593 int setxattr_copy(const char __user *name, struct xattr_ctx *ctx)
594 {
595 int error;
596
597 if (ctx->flags & ~(XATTR_CREATE|XATTR_REPLACE))
598 return -EINVAL;
599
600 error = strncpy_from_user(ctx->kname->name, name,
601 sizeof(ctx->kname->name));
602 if (error == 0 || error == sizeof(ctx->kname->name))
603 return -ERANGE;
604 if (error < 0)
605 return error;
606
607 error = 0;
608 if (ctx->size) {
609 if (ctx->size > XATTR_SIZE_MAX)
610 return -E2BIG;
611
612 ctx->kvalue = vmemdup_user(ctx->cvalue, ctx->size);
613 if (IS_ERR(ctx->kvalue)) {
614 error = PTR_ERR(ctx->kvalue);
615 ctx->kvalue = NULL;
616 }
617 }
618
619 return error;
620 }
621
622 int do_setxattr(struct mnt_idmap *idmap, struct dentry *dentry,
623 struct xattr_ctx *ctx)
624 {
625 if (is_posix_acl_xattr(ctx->kname->name))
626 return do_set_acl(idmap, dentry, ctx->kname->name,
627 ctx->kvalue, ctx->size);
628
629 return vfs_setxattr(idmap, dentry, ctx->kname->name,
630 ctx->kvalue, ctx->size, ctx->flags);
631 }
632
633 static long
634 setxattr(struct mnt_idmap *idmap, struct dentry *d,
635 const char __user *name, const void __user *value, size_t size,
636 int flags)
637 {
638 struct xattr_name kname;
639 struct xattr_ctx ctx = {
640 .cvalue = value,
641 .kvalue = NULL,
642 .size = size,
643 .kname = &kname,
644 .flags = flags,
645 };
646 int error;
647
648 error = setxattr_copy(name, &ctx);
649 if (error)
650 return error;
651
652 error = do_setxattr(idmap, d, &ctx);
653
654 kvfree(ctx.kvalue);
655 return error;
656 }
657
658 static int path_setxattr(const char __user *pathname,
659 const char __user *name, const void __user *value,
660 size_t size, int flags, unsigned int lookup_flags)
661 {
662 struct path path;
663 int error;
664
665 retry:
666 error = user_path_at(AT_FDCWD, pathname, lookup_flags, &path);
667 if (error)
668 return error;
669 error = mnt_want_write(path.mnt);
670 if (!error) {
671 error = setxattr(mnt_idmap(path.mnt), path.dentry, name,
672 value, size, flags);
673 mnt_drop_write(path.mnt);
674 }
675 path_put(&path);
676 if (retry_estale(error, lookup_flags)) {
677 lookup_flags |= LOOKUP_REVAL;
678 goto retry;
679 }
680 return error;
681 }
682
683 SYSCALL_DEFINE5(setxattr, const char __user *, pathname,
684 const char __user *, name, const void __user *, value,
685 size_t, size, int, flags)
686 {
687 return path_setxattr(pathname, name, value, size, flags, LOOKUP_FOLLOW);
688 }
689
690 SYSCALL_DEFINE5(lsetxattr, const char __user *, pathname,
691 const char __user *, name, const void __user *, value,
692 size_t, size, int, flags)
693 {
694 return path_setxattr(pathname, name, value, size, flags, 0);
695 }
696
697 SYSCALL_DEFINE5(fsetxattr, int, fd, const char __user *, name,
698 const void __user *,value, size_t, size, int, flags)
699 {
700 struct fd f = fdget(fd);
701 int error = -EBADF;
702
703 if (!f.file)
704 return error;
705 audit_file(f.file);
706 error = mnt_want_write_file(f.file);
707 if (!error) {
708 error = setxattr(file_mnt_idmap(f.file),
709 f.file->f_path.dentry, name,
710 value, size, flags);
711 mnt_drop_write_file(f.file);
712 }
713 fdput(f);
714 return error;
715 }
716
717 /*
718 * Extended attribute GET operations
719 */
720 ssize_t
721 do_getxattr(struct mnt_idmap *idmap, struct dentry *d,
722 struct xattr_ctx *ctx)
723 {
724 ssize_t error;
725 char *kname = ctx->kname->name;
726
727 if (ctx->size) {
728 if (ctx->size > XATTR_SIZE_MAX)
729 ctx->size = XATTR_SIZE_MAX;
730 ctx->kvalue = kvzalloc(ctx->size, GFP_KERNEL);
731 if (!ctx->kvalue)
732 return -ENOMEM;
733 }
734
735 if (is_posix_acl_xattr(ctx->kname->name))
736 error = do_get_acl(idmap, d, kname, ctx->kvalue, ctx->size);
737 else
738 error = vfs_getxattr(idmap, d, kname, ctx->kvalue, ctx->size);
739 if (error > 0) {
740 if (ctx->size && copy_to_user(ctx->value, ctx->kvalue, error))
741 error = -EFAULT;
742 } else if (error == -ERANGE && ctx->size >= XATTR_SIZE_MAX) {
743 /* The file system tried to returned a value bigger
744 than XATTR_SIZE_MAX bytes. Not possible. */
745 error = -E2BIG;
746 }
747
748 return error;
749 }
750
751 static ssize_t
752 getxattr(struct mnt_idmap *idmap, struct dentry *d,
753 const char __user *name, void __user *value, size_t size)
754 {
755 ssize_t error;
756 struct xattr_name kname;
757 struct xattr_ctx ctx = {
758 .value = value,
759 .kvalue = NULL,
760 .size = size,
761 .kname = &kname,
762 .flags = 0,
763 };
764
765 error = strncpy_from_user(kname.name, name, sizeof(kname.name));
766 if (error == 0 || error == sizeof(kname.name))
767 error = -ERANGE;
768 if (error < 0)
769 return error;
770
771 error = do_getxattr(idmap, d, &ctx);
772
773 kvfree(ctx.kvalue);
774 return error;
775 }
776
777 static ssize_t path_getxattr(const char __user *pathname,
778 const char __user *name, void __user *value,
779 size_t size, unsigned int lookup_flags)
780 {
781 struct path path;
782 ssize_t error;
783 retry:
784 error = user_path_at(AT_FDCWD, pathname, lookup_flags, &path);
785 if (error)
786 return error;
787 error = getxattr(mnt_idmap(path.mnt), path.dentry, name, value, size);
788 path_put(&path);
789 if (retry_estale(error, lookup_flags)) {
790 lookup_flags |= LOOKUP_REVAL;
791 goto retry;
792 }
793 return error;
794 }
795
796 SYSCALL_DEFINE4(getxattr, const char __user *, pathname,
797 const char __user *, name, void __user *, value, size_t, size)
798 {
799 return path_getxattr(pathname, name, value, size, LOOKUP_FOLLOW);
800 }
801
802 SYSCALL_DEFINE4(lgetxattr, const char __user *, pathname,
803 const char __user *, name, void __user *, value, size_t, size)
804 {
805 return path_getxattr(pathname, name, value, size, 0);
806 }
807
808 SYSCALL_DEFINE4(fgetxattr, int, fd, const char __user *, name,
809 void __user *, value, size_t, size)
810 {
811 struct fd f = fdget(fd);
812 ssize_t error = -EBADF;
813
814 if (!f.file)
815 return error;
816 audit_file(f.file);
817 error = getxattr(file_mnt_idmap(f.file), f.file->f_path.dentry,
818 name, value, size);
819 fdput(f);
820 return error;
821 }
822
823 /*
824 * Extended attribute LIST operations
825 */
826 static ssize_t
827 listxattr(struct dentry *d, char __user *list, size_t size)
828 {
829 ssize_t error;
830 char *klist = NULL;
831
832 if (size) {
833 if (size > XATTR_LIST_MAX)
834 size = XATTR_LIST_MAX;
835 klist = kvmalloc(size, GFP_KERNEL);
836 if (!klist)
837 return -ENOMEM;
838 }
839
840 error = vfs_listxattr(d, klist, size);
841 if (error > 0) {
842 if (size && copy_to_user(list, klist, error))
843 error = -EFAULT;
844 } else if (error == -ERANGE && size >= XATTR_LIST_MAX) {
845 /* The file system tried to returned a list bigger
846 than XATTR_LIST_MAX bytes. Not possible. */
847 error = -E2BIG;
848 }
849
850 kvfree(klist);
851
852 return error;
853 }
854
855 static ssize_t path_listxattr(const char __user *pathname, char __user *list,
856 size_t size, unsigned int lookup_flags)
857 {
858 struct path path;
859 ssize_t error;
860 retry:
861 error = user_path_at(AT_FDCWD, pathname, lookup_flags, &path);
862 if (error)
863 return error;
864 error = listxattr(path.dentry, list, size);
865 path_put(&path);
866 if (retry_estale(error, lookup_flags)) {
867 lookup_flags |= LOOKUP_REVAL;
868 goto retry;
869 }
870 return error;
871 }
872
873 SYSCALL_DEFINE3(listxattr, const char __user *, pathname, char __user *, list,
874 size_t, size)
875 {
876 return path_listxattr(pathname, list, size, LOOKUP_FOLLOW);
877 }
878
879 SYSCALL_DEFINE3(llistxattr, const char __user *, pathname, char __user *, list,
880 size_t, size)
881 {
882 return path_listxattr(pathname, list, size, 0);
883 }
884
885 SYSCALL_DEFINE3(flistxattr, int, fd, char __user *, list, size_t, size)
886 {
887 struct fd f = fdget(fd);
888 ssize_t error = -EBADF;
889
890 if (!f.file)
891 return error;
892 audit_file(f.file);
893 error = listxattr(f.file->f_path.dentry, list, size);
894 fdput(f);
895 return error;
896 }
897
898 /*
899 * Extended attribute REMOVE operations
900 */
901 static long
902 removexattr(struct mnt_idmap *idmap, struct dentry *d,
903 const char __user *name)
904 {
905 int error;
906 char kname[XATTR_NAME_MAX + 1];
907
908 error = strncpy_from_user(kname, name, sizeof(kname));
909 if (error == 0 || error == sizeof(kname))
910 error = -ERANGE;
911 if (error < 0)
912 return error;
913
914 if (is_posix_acl_xattr(kname))
915 return vfs_remove_acl(idmap, d, kname);
916
917 return vfs_removexattr(idmap, d, kname);
918 }
919
920 static int path_removexattr(const char __user *pathname,
921 const char __user *name, unsigned int lookup_flags)
922 {
923 struct path path;
924 int error;
925 retry:
926 error = user_path_at(AT_FDCWD, pathname, lookup_flags, &path);
927 if (error)
928 return error;
929 error = mnt_want_write(path.mnt);
930 if (!error) {
931 error = removexattr(mnt_idmap(path.mnt), path.dentry, name);
932 mnt_drop_write(path.mnt);
933 }
934 path_put(&path);
935 if (retry_estale(error, lookup_flags)) {
936 lookup_flags |= LOOKUP_REVAL;
937 goto retry;
938 }
939 return error;
940 }
941
942 SYSCALL_DEFINE2(removexattr, const char __user *, pathname,
943 const char __user *, name)
944 {
945 return path_removexattr(pathname, name, LOOKUP_FOLLOW);
946 }
947
948 SYSCALL_DEFINE2(lremovexattr, const char __user *, pathname,
949 const char __user *, name)
950 {
951 return path_removexattr(pathname, name, 0);
952 }
953
954 SYSCALL_DEFINE2(fremovexattr, int, fd, const char __user *, name)
955 {
956 struct fd f = fdget(fd);
957 int error = -EBADF;
958
959 if (!f.file)
960 return error;
961 audit_file(f.file);
962 error = mnt_want_write_file(f.file);
963 if (!error) {
964 error = removexattr(file_mnt_idmap(f.file),
965 f.file->f_path.dentry, name);
966 mnt_drop_write_file(f.file);
967 }
968 fdput(f);
969 return error;
970 }
971
972 int xattr_list_one(char **buffer, ssize_t *remaining_size, const char *name)
973 {
974 size_t len;
975
976 len = strlen(name) + 1;
977 if (*buffer) {
978 if (*remaining_size < len)
979 return -ERANGE;
980 memcpy(*buffer, name, len);
981 *buffer += len;
982 }
983 *remaining_size -= len;
984 return 0;
985 }
986
987 /**
988 * generic_listxattr - run through a dentry's xattr list() operations
989 * @dentry: dentry to list the xattrs
990 * @buffer: result buffer
991 * @buffer_size: size of @buffer
992 *
993 * Combine the results of the list() operation from every xattr_handler in the
994 * xattr_handler stack.
995 *
996 * Note that this will not include the entries for POSIX ACLs.
997 */
998 ssize_t
999 generic_listxattr(struct dentry *dentry, char *buffer, size_t buffer_size)
1000 {
1001 const struct xattr_handler *handler, * const *handlers = dentry->d_sb->s_xattr;
1002 ssize_t remaining_size = buffer_size;
1003 int err = 0;
1004
1005 for_each_xattr_handler(handlers, handler) {
1006 if (!handler->name || (handler->list && !handler->list(dentry)))
1007 continue;
1008 err = xattr_list_one(&buffer, &remaining_size, handler->name);
1009 if (err)
1010 return err;
1011 }
1012
1013 return err ? err : buffer_size - remaining_size;
1014 }
1015 EXPORT_SYMBOL(generic_listxattr);
1016
1017 /**
1018 * xattr_full_name - Compute full attribute name from suffix
1019 *
1020 * @handler: handler of the xattr_handler operation
1021 * @name: name passed to the xattr_handler operation
1022 *
1023 * The get and set xattr handler operations are called with the remainder of
1024 * the attribute name after skipping the handler's prefix: for example, "foo"
1025 * is passed to the get operation of a handler with prefix "user." to get
1026 * attribute "user.foo". The full name is still "there" in the name though.
1027 *
1028 * Note: the list xattr handler operation when called from the vfs is passed a
1029 * NULL name; some file systems use this operation internally, with varying
1030 * semantics.
1031 */
1032 const char *xattr_full_name(const struct xattr_handler *handler,
1033 const char *name)
1034 {
1035 size_t prefix_len = strlen(xattr_prefix(handler));
1036
1037 return name - prefix_len;
1038 }
1039 EXPORT_SYMBOL(xattr_full_name);
1040
1041 /**
1042 * simple_xattr_space - estimate the memory used by a simple xattr
1043 * @name: the full name of the xattr
1044 * @size: the size of its value
1045 *
1046 * This takes no account of how much larger the two slab objects actually are:
1047 * that would depend on the slab implementation, when what is required is a
1048 * deterministic number, which grows with name length and size and quantity.
1049 *
1050 * Return: The approximate number of bytes of memory used by such an xattr.
1051 */
1052 size_t simple_xattr_space(const char *name, size_t size)
1053 {
1054 /*
1055 * Use "40" instead of sizeof(struct simple_xattr), to return the
1056 * same result on 32-bit and 64-bit, and even if simple_xattr grows.
1057 */
1058 return 40 + size + strlen(name);
1059 }
1060
1061 /**
1062 * simple_xattr_free - free an xattr object
1063 * @xattr: the xattr object
1064 *
1065 * Free the xattr object. Can handle @xattr being NULL.
1066 */
1067 void simple_xattr_free(struct simple_xattr *xattr)
1068 {
1069 if (xattr)
1070 kfree(xattr->name);
1071 kvfree(xattr);
1072 }
1073
1074 /**
1075 * simple_xattr_alloc - allocate new xattr object
1076 * @value: value of the xattr object
1077 * @size: size of @value
1078 *
1079 * Allocate a new xattr object and initialize respective members. The caller is
1080 * responsible for handling the name of the xattr.
1081 *
1082 * Return: On success a new xattr object is returned. On failure NULL is
1083 * returned.
1084 */
1085 struct simple_xattr *simple_xattr_alloc(const void *value, size_t size)
1086 {
1087 struct simple_xattr *new_xattr;
1088 size_t len;
1089
1090 /* wrap around? */
1091 len = sizeof(*new_xattr) + size;
1092 if (len < sizeof(*new_xattr))
1093 return NULL;
1094
1095 new_xattr = kvmalloc(len, GFP_KERNEL_ACCOUNT);
1096 if (!new_xattr)
1097 return NULL;
1098
1099 new_xattr->size = size;
1100 memcpy(new_xattr->value, value, size);
1101 return new_xattr;
1102 }
1103
1104 /**
1105 * rbtree_simple_xattr_cmp - compare xattr name with current rbtree xattr entry
1106 * @key: xattr name
1107 * @node: current node
1108 *
1109 * Compare the xattr name with the xattr name attached to @node in the rbtree.
1110 *
1111 * Return: Negative value if continuing left, positive if continuing right, 0
1112 * if the xattr attached to @node matches @key.
1113 */
1114 static int rbtree_simple_xattr_cmp(const void *key, const struct rb_node *node)
1115 {
1116 const char *xattr_name = key;
1117 const struct simple_xattr *xattr;
1118
1119 xattr = rb_entry(node, struct simple_xattr, rb_node);
1120 return strcmp(xattr->name, xattr_name);
1121 }
1122
1123 /**
1124 * rbtree_simple_xattr_node_cmp - compare two xattr rbtree nodes
1125 * @new_node: new node
1126 * @node: current node
1127 *
1128 * Compare the xattr attached to @new_node with the xattr attached to @node.
1129 *
1130 * Return: Negative value if continuing left, positive if continuing right, 0
1131 * if the xattr attached to @new_node matches the xattr attached to @node.
1132 */
1133 static int rbtree_simple_xattr_node_cmp(struct rb_node *new_node,
1134 const struct rb_node *node)
1135 {
1136 struct simple_xattr *xattr;
1137 xattr = rb_entry(new_node, struct simple_xattr, rb_node);
1138 return rbtree_simple_xattr_cmp(xattr->name, node);
1139 }
1140
1141 /**
1142 * simple_xattr_get - get an xattr object
1143 * @xattrs: the header of the xattr object
1144 * @name: the name of the xattr to retrieve
1145 * @buffer: the buffer to store the value into
1146 * @size: the size of @buffer
1147 *
1148 * Try to find and retrieve the xattr object associated with @name.
1149 * If @buffer is provided store the value of @xattr in @buffer
1150 * otherwise just return the length. The size of @buffer is limited
1151 * to XATTR_SIZE_MAX which currently is 65536.
1152 *
1153 * Return: On success the length of the xattr value is returned. On error a
1154 * negative error code is returned.
1155 */
1156 int simple_xattr_get(struct simple_xattrs *xattrs, const char *name,
1157 void *buffer, size_t size)
1158 {
1159 struct simple_xattr *xattr = NULL;
1160 struct rb_node *rbp;
1161 int ret = -ENODATA;
1162
1163 read_lock(&xattrs->lock);
1164 rbp = rb_find(name, &xattrs->rb_root, rbtree_simple_xattr_cmp);
1165 if (rbp) {
1166 xattr = rb_entry(rbp, struct simple_xattr, rb_node);
1167 ret = xattr->size;
1168 if (buffer) {
1169 if (size < xattr->size)
1170 ret = -ERANGE;
1171 else
1172 memcpy(buffer, xattr->value, xattr->size);
1173 }
1174 }
1175 read_unlock(&xattrs->lock);
1176 return ret;
1177 }
1178
1179 /**
1180 * simple_xattr_set - set an xattr object
1181 * @xattrs: the header of the xattr object
1182 * @name: the name of the xattr to retrieve
1183 * @value: the value to store along the xattr
1184 * @size: the size of @value
1185 * @flags: the flags determining how to set the xattr
1186 *
1187 * Set a new xattr object.
1188 * If @value is passed a new xattr object will be allocated. If XATTR_REPLACE
1189 * is specified in @flags a matching xattr object for @name must already exist.
1190 * If it does it will be replaced with the new xattr object. If it doesn't we
1191 * fail. If XATTR_CREATE is specified and a matching xattr does already exist
1192 * we fail. If it doesn't we create a new xattr. If @flags is zero we simply
1193 * insert the new xattr replacing any existing one.
1194 *
1195 * If @value is empty and a matching xattr object is found we delete it if
1196 * XATTR_REPLACE is specified in @flags or @flags is zero.
1197 *
1198 * If @value is empty and no matching xattr object for @name is found we do
1199 * nothing if XATTR_CREATE is specified in @flags or @flags is zero. For
1200 * XATTR_REPLACE we fail as mentioned above.
1201 *
1202 * Return: On success, the removed or replaced xattr is returned, to be freed
1203 * by the caller; or NULL if none. On failure a negative error code is returned.
1204 */
1205 struct simple_xattr *simple_xattr_set(struct simple_xattrs *xattrs,
1206 const char *name, const void *value,
1207 size_t size, int flags)
1208 {
1209 struct simple_xattr *old_xattr = NULL, *new_xattr = NULL;
1210 struct rb_node *parent = NULL, **rbp;
1211 int err = 0, ret;
1212
1213 /* value == NULL means remove */
1214 if (value) {
1215 new_xattr = simple_xattr_alloc(value, size);
1216 if (!new_xattr)
1217 return ERR_PTR(-ENOMEM);
1218
1219 new_xattr->name = kstrdup(name, GFP_KERNEL_ACCOUNT);
1220 if (!new_xattr->name) {
1221 simple_xattr_free(new_xattr);
1222 return ERR_PTR(-ENOMEM);
1223 }
1224 }
1225
1226 write_lock(&xattrs->lock);
1227 rbp = &xattrs->rb_root.rb_node;
1228 while (*rbp) {
1229 parent = *rbp;
1230 ret = rbtree_simple_xattr_cmp(name, *rbp);
1231 if (ret < 0)
1232 rbp = &(*rbp)->rb_left;
1233 else if (ret > 0)
1234 rbp = &(*rbp)->rb_right;
1235 else
1236 old_xattr = rb_entry(*rbp, struct simple_xattr, rb_node);
1237 if (old_xattr)
1238 break;
1239 }
1240
1241 if (old_xattr) {
1242 /* Fail if XATTR_CREATE is requested and the xattr exists. */
1243 if (flags & XATTR_CREATE) {
1244 err = -EEXIST;
1245 goto out_unlock;
1246 }
1247
1248 if (new_xattr)
1249 rb_replace_node(&old_xattr->rb_node,
1250 &new_xattr->rb_node, &xattrs->rb_root);
1251 else
1252 rb_erase(&old_xattr->rb_node, &xattrs->rb_root);
1253 } else {
1254 /* Fail if XATTR_REPLACE is requested but no xattr is found. */
1255 if (flags & XATTR_REPLACE) {
1256 err = -ENODATA;
1257 goto out_unlock;
1258 }
1259
1260 /*
1261 * If XATTR_CREATE or no flags are specified together with a
1262 * new value simply insert it.
1263 */
1264 if (new_xattr) {
1265 rb_link_node(&new_xattr->rb_node, parent, rbp);
1266 rb_insert_color(&new_xattr->rb_node, &xattrs->rb_root);
1267 }
1268
1269 /*
1270 * If XATTR_CREATE or no flags are specified and neither an
1271 * old or new xattr exist then we don't need to do anything.
1272 */
1273 }
1274
1275 out_unlock:
1276 write_unlock(&xattrs->lock);
1277 if (!err)
1278 return old_xattr;
1279 simple_xattr_free(new_xattr);
1280 return ERR_PTR(err);
1281 }
1282
1283 static bool xattr_is_trusted(const char *name)
1284 {
1285 return !strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN);
1286 }
1287
1288 /**
1289 * simple_xattr_list - list all xattr objects
1290 * @inode: inode from which to get the xattrs
1291 * @xattrs: the header of the xattr object
1292 * @buffer: the buffer to store all xattrs into
1293 * @size: the size of @buffer
1294 *
1295 * List all xattrs associated with @inode. If @buffer is NULL we returned
1296 * the required size of the buffer. If @buffer is provided we store the
1297 * xattrs value into it provided it is big enough.
1298 *
1299 * Note, the number of xattr names that can be listed with listxattr(2) is
1300 * limited to XATTR_LIST_MAX aka 65536 bytes. If a larger buffer is passed
1301 * then vfs_listxattr() caps it to XATTR_LIST_MAX and if more xattr names
1302 * are found it will return -E2BIG.
1303 *
1304 * Return: On success the required size or the size of the copied xattrs is
1305 * returned. On error a negative error code is returned.
1306 */
1307 ssize_t simple_xattr_list(struct inode *inode, struct simple_xattrs *xattrs,
1308 char *buffer, size_t size)
1309 {
1310 bool trusted = ns_capable_noaudit(&init_user_ns, CAP_SYS_ADMIN);
1311 struct simple_xattr *xattr;
1312 struct rb_node *rbp;
1313 ssize_t remaining_size = size;
1314 int err = 0;
1315
1316 err = posix_acl_listxattr(inode, &buffer, &remaining_size);
1317 if (err)
1318 return err;
1319
1320 read_lock(&xattrs->lock);
1321 for (rbp = rb_first(&xattrs->rb_root); rbp; rbp = rb_next(rbp)) {
1322 xattr = rb_entry(rbp, struct simple_xattr, rb_node);
1323
1324 /* skip "trusted." attributes for unprivileged callers */
1325 if (!trusted && xattr_is_trusted(xattr->name))
1326 continue;
1327
1328 err = xattr_list_one(&buffer, &remaining_size, xattr->name);
1329 if (err)
1330 break;
1331 }
1332 read_unlock(&xattrs->lock);
1333
1334 return err ? err : size - remaining_size;
1335 }
1336
1337 /**
1338 * rbtree_simple_xattr_less - compare two xattr rbtree nodes
1339 * @new_node: new node
1340 * @node: current node
1341 *
1342 * Compare the xattr attached to @new_node with the xattr attached to @node.
1343 * Note that this function technically tolerates duplicate entries.
1344 *
1345 * Return: True if insertion point in the rbtree is found.
1346 */
1347 static bool rbtree_simple_xattr_less(struct rb_node *new_node,
1348 const struct rb_node *node)
1349 {
1350 return rbtree_simple_xattr_node_cmp(new_node, node) < 0;
1351 }
1352
1353 /**
1354 * simple_xattr_add - add xattr objects
1355 * @xattrs: the header of the xattr object
1356 * @new_xattr: the xattr object to add
1357 *
1358 * Add an xattr object to @xattrs. This assumes no replacement or removal
1359 * of matching xattrs is wanted. Should only be called during inode
1360 * initialization when a few distinct initial xattrs are supposed to be set.
1361 */
1362 void simple_xattr_add(struct simple_xattrs *xattrs,
1363 struct simple_xattr *new_xattr)
1364 {
1365 write_lock(&xattrs->lock);
1366 rb_add(&new_xattr->rb_node, &xattrs->rb_root, rbtree_simple_xattr_less);
1367 write_unlock(&xattrs->lock);
1368 }
1369
1370 /**
1371 * simple_xattrs_init - initialize new xattr header
1372 * @xattrs: header to initialize
1373 *
1374 * Initialize relevant fields of a an xattr header.
1375 */
1376 void simple_xattrs_init(struct simple_xattrs *xattrs)
1377 {
1378 xattrs->rb_root = RB_ROOT;
1379 rwlock_init(&xattrs->lock);
1380 }
1381
1382 /**
1383 * simple_xattrs_free - free xattrs
1384 * @xattrs: xattr header whose xattrs to destroy
1385 * @freed_space: approximate number of bytes of memory freed from @xattrs
1386 *
1387 * Destroy all xattrs in @xattr. When this is called no one can hold a
1388 * reference to any of the xattrs anymore.
1389 */
1390 void simple_xattrs_free(struct simple_xattrs *xattrs, size_t *freed_space)
1391 {
1392 struct rb_node *rbp;
1393
1394 if (freed_space)
1395 *freed_space = 0;
1396 rbp = rb_first(&xattrs->rb_root);
1397 while (rbp) {
1398 struct simple_xattr *xattr;
1399 struct rb_node *rbp_next;
1400
1401 rbp_next = rb_next(rbp);
1402 xattr = rb_entry(rbp, struct simple_xattr, rb_node);
1403 rb_erase(&xattr->rb_node, &xattrs->rb_root);
1404 if (freed_space)
1405 *freed_space += simple_xattr_space(xattr->name,
1406 xattr->size);
1407 simple_xattr_free(xattr);
1408 rbp = rbp_next;
1409 }
1410 }