xref: /openbmc/linux/fs/posix_acl.c (revision 138060ba)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Copyright (C) 2002,2003 by Andreas Gruenbacher <a.gruenbacher@computer.org>
4  *
5  * Fixes from William Schumacher incorporated on 15 March 2001.
6  *    (Reported by Charles Bertsch, <CBertsch@microtest.com>).
7  */
8 
9 /*
10  *  This file contains generic functions for manipulating
11  *  POSIX 1003.1e draft standard 17 ACLs.
12  */
13 
14 #include <linux/kernel.h>
15 #include <linux/slab.h>
16 #include <linux/atomic.h>
17 #include <linux/fs.h>
18 #include <linux/sched.h>
19 #include <linux/cred.h>
20 #include <linux/posix_acl.h>
21 #include <linux/posix_acl_xattr.h>
22 #include <linux/xattr.h>
23 #include <linux/export.h>
24 #include <linux/user_namespace.h>
25 #include <linux/namei.h>
26 #include <linux/mnt_idmapping.h>
27 #include <linux/iversion.h>
28 
29 static struct posix_acl **acl_by_type(struct inode *inode, int type)
30 {
31 	switch (type) {
32 	case ACL_TYPE_ACCESS:
33 		return &inode->i_acl;
34 	case ACL_TYPE_DEFAULT:
35 		return &inode->i_default_acl;
36 	default:
37 		BUG();
38 	}
39 }
40 
41 struct posix_acl *get_cached_acl(struct inode *inode, int type)
42 {
43 	struct posix_acl **p = acl_by_type(inode, type);
44 	struct posix_acl *acl;
45 
46 	for (;;) {
47 		rcu_read_lock();
48 		acl = rcu_dereference(*p);
49 		if (!acl || is_uncached_acl(acl) ||
50 		    refcount_inc_not_zero(&acl->a_refcount))
51 			break;
52 		rcu_read_unlock();
53 		cpu_relax();
54 	}
55 	rcu_read_unlock();
56 	return acl;
57 }
58 EXPORT_SYMBOL(get_cached_acl);
59 
60 struct posix_acl *get_cached_acl_rcu(struct inode *inode, int type)
61 {
62 	struct posix_acl *acl = rcu_dereference(*acl_by_type(inode, type));
63 
64 	if (acl == ACL_DONT_CACHE) {
65 		struct posix_acl *ret;
66 
67 		ret = inode->i_op->get_acl(inode, type, LOOKUP_RCU);
68 		if (!IS_ERR(ret))
69 			acl = ret;
70 	}
71 
72 	return acl;
73 }
74 EXPORT_SYMBOL(get_cached_acl_rcu);
75 
76 void set_cached_acl(struct inode *inode, int type, struct posix_acl *acl)
77 {
78 	struct posix_acl **p = acl_by_type(inode, type);
79 	struct posix_acl *old;
80 
81 	old = xchg(p, posix_acl_dup(acl));
82 	if (!is_uncached_acl(old))
83 		posix_acl_release(old);
84 }
85 EXPORT_SYMBOL(set_cached_acl);
86 
87 static void __forget_cached_acl(struct posix_acl **p)
88 {
89 	struct posix_acl *old;
90 
91 	old = xchg(p, ACL_NOT_CACHED);
92 	if (!is_uncached_acl(old))
93 		posix_acl_release(old);
94 }
95 
96 void forget_cached_acl(struct inode *inode, int type)
97 {
98 	__forget_cached_acl(acl_by_type(inode, type));
99 }
100 EXPORT_SYMBOL(forget_cached_acl);
101 
102 void forget_all_cached_acls(struct inode *inode)
103 {
104 	__forget_cached_acl(&inode->i_acl);
105 	__forget_cached_acl(&inode->i_default_acl);
106 }
107 EXPORT_SYMBOL(forget_all_cached_acls);
108 
109 struct posix_acl *get_acl(struct inode *inode, int type)
110 {
111 	void *sentinel;
112 	struct posix_acl **p;
113 	struct posix_acl *acl;
114 
115 	/*
116 	 * The sentinel is used to detect when another operation like
117 	 * set_cached_acl() or forget_cached_acl() races with get_acl().
118 	 * It is guaranteed that is_uncached_acl(sentinel) is true.
119 	 */
120 
121 	acl = get_cached_acl(inode, type);
122 	if (!is_uncached_acl(acl))
123 		return acl;
124 
125 	if (!IS_POSIXACL(inode))
126 		return NULL;
127 
128 	sentinel = uncached_acl_sentinel(current);
129 	p = acl_by_type(inode, type);
130 
131 	/*
132 	 * If the ACL isn't being read yet, set our sentinel.  Otherwise, the
133 	 * current value of the ACL will not be ACL_NOT_CACHED and so our own
134 	 * sentinel will not be set; another task will update the cache.  We
135 	 * could wait for that other task to complete its job, but it's easier
136 	 * to just call ->get_acl to fetch the ACL ourself.  (This is going to
137 	 * be an unlikely race.)
138 	 */
139 	cmpxchg(p, ACL_NOT_CACHED, sentinel);
140 
141 	/*
142 	 * Normally, the ACL returned by ->get_acl will be cached.
143 	 * A filesystem can prevent that by calling
144 	 * forget_cached_acl(inode, type) in ->get_acl.
145 	 *
146 	 * If the filesystem doesn't have a get_acl() function at all, we'll
147 	 * just create the negative cache entry.
148 	 */
149 	if (!inode->i_op->get_acl) {
150 		set_cached_acl(inode, type, NULL);
151 		return NULL;
152 	}
153 	acl = inode->i_op->get_acl(inode, type, false);
154 
155 	if (IS_ERR(acl)) {
156 		/*
157 		 * Remove our sentinel so that we don't block future attempts
158 		 * to cache the ACL.
159 		 */
160 		cmpxchg(p, sentinel, ACL_NOT_CACHED);
161 		return acl;
162 	}
163 
164 	/*
165 	 * Cache the result, but only if our sentinel is still in place.
166 	 */
167 	posix_acl_dup(acl);
168 	if (unlikely(cmpxchg(p, sentinel, acl) != sentinel))
169 		posix_acl_release(acl);
170 	return acl;
171 }
172 EXPORT_SYMBOL(get_acl);
173 
174 /*
175  * Init a fresh posix_acl
176  */
177 void
178 posix_acl_init(struct posix_acl *acl, int count)
179 {
180 	refcount_set(&acl->a_refcount, 1);
181 	acl->a_count = count;
182 }
183 EXPORT_SYMBOL(posix_acl_init);
184 
185 /*
186  * Allocate a new ACL with the specified number of entries.
187  */
188 struct posix_acl *
189 posix_acl_alloc(int count, gfp_t flags)
190 {
191 	const size_t size = sizeof(struct posix_acl) +
192 	                    count * sizeof(struct posix_acl_entry);
193 	struct posix_acl *acl = kmalloc(size, flags);
194 	if (acl)
195 		posix_acl_init(acl, count);
196 	return acl;
197 }
198 EXPORT_SYMBOL(posix_acl_alloc);
199 
200 /*
201  * Clone an ACL.
202  */
203 struct posix_acl *
204 posix_acl_clone(const struct posix_acl *acl, gfp_t flags)
205 {
206 	struct posix_acl *clone = NULL;
207 
208 	if (acl) {
209 		int size = sizeof(struct posix_acl) + acl->a_count *
210 		           sizeof(struct posix_acl_entry);
211 		clone = kmemdup(acl, size, flags);
212 		if (clone)
213 			refcount_set(&clone->a_refcount, 1);
214 	}
215 	return clone;
216 }
217 EXPORT_SYMBOL_GPL(posix_acl_clone);
218 
219 /*
220  * Check if an acl is valid. Returns 0 if it is, or -E... otherwise.
221  */
222 int
223 posix_acl_valid(struct user_namespace *user_ns, const struct posix_acl *acl)
224 {
225 	const struct posix_acl_entry *pa, *pe;
226 	int state = ACL_USER_OBJ;
227 	int needs_mask = 0;
228 
229 	FOREACH_ACL_ENTRY(pa, acl, pe) {
230 		if (pa->e_perm & ~(ACL_READ|ACL_WRITE|ACL_EXECUTE))
231 			return -EINVAL;
232 		switch (pa->e_tag) {
233 			case ACL_USER_OBJ:
234 				if (state == ACL_USER_OBJ) {
235 					state = ACL_USER;
236 					break;
237 				}
238 				return -EINVAL;
239 
240 			case ACL_USER:
241 				if (state != ACL_USER)
242 					return -EINVAL;
243 				if (!kuid_has_mapping(user_ns, pa->e_uid))
244 					return -EINVAL;
245 				needs_mask = 1;
246 				break;
247 
248 			case ACL_GROUP_OBJ:
249 				if (state == ACL_USER) {
250 					state = ACL_GROUP;
251 					break;
252 				}
253 				return -EINVAL;
254 
255 			case ACL_GROUP:
256 				if (state != ACL_GROUP)
257 					return -EINVAL;
258 				if (!kgid_has_mapping(user_ns, pa->e_gid))
259 					return -EINVAL;
260 				needs_mask = 1;
261 				break;
262 
263 			case ACL_MASK:
264 				if (state != ACL_GROUP)
265 					return -EINVAL;
266 				state = ACL_OTHER;
267 				break;
268 
269 			case ACL_OTHER:
270 				if (state == ACL_OTHER ||
271 				    (state == ACL_GROUP && !needs_mask)) {
272 					state = 0;
273 					break;
274 				}
275 				return -EINVAL;
276 
277 			default:
278 				return -EINVAL;
279 		}
280 	}
281 	if (state == 0)
282 		return 0;
283 	return -EINVAL;
284 }
285 EXPORT_SYMBOL(posix_acl_valid);
286 
287 /*
288  * Returns 0 if the acl can be exactly represented in the traditional
289  * file mode permission bits, or else 1. Returns -E... on error.
290  */
291 int
292 posix_acl_equiv_mode(const struct posix_acl *acl, umode_t *mode_p)
293 {
294 	const struct posix_acl_entry *pa, *pe;
295 	umode_t mode = 0;
296 	int not_equiv = 0;
297 
298 	/*
299 	 * A null ACL can always be presented as mode bits.
300 	 */
301 	if (!acl)
302 		return 0;
303 
304 	FOREACH_ACL_ENTRY(pa, acl, pe) {
305 		switch (pa->e_tag) {
306 			case ACL_USER_OBJ:
307 				mode |= (pa->e_perm & S_IRWXO) << 6;
308 				break;
309 			case ACL_GROUP_OBJ:
310 				mode |= (pa->e_perm & S_IRWXO) << 3;
311 				break;
312 			case ACL_OTHER:
313 				mode |= pa->e_perm & S_IRWXO;
314 				break;
315 			case ACL_MASK:
316 				mode = (mode & ~S_IRWXG) |
317 				       ((pa->e_perm & S_IRWXO) << 3);
318 				not_equiv = 1;
319 				break;
320 			case ACL_USER:
321 			case ACL_GROUP:
322 				not_equiv = 1;
323 				break;
324 			default:
325 				return -EINVAL;
326 		}
327 	}
328         if (mode_p)
329                 *mode_p = (*mode_p & ~S_IRWXUGO) | mode;
330         return not_equiv;
331 }
332 EXPORT_SYMBOL(posix_acl_equiv_mode);
333 
334 /*
335  * Create an ACL representing the file mode permission bits of an inode.
336  */
337 struct posix_acl *
338 posix_acl_from_mode(umode_t mode, gfp_t flags)
339 {
340 	struct posix_acl *acl = posix_acl_alloc(3, flags);
341 	if (!acl)
342 		return ERR_PTR(-ENOMEM);
343 
344 	acl->a_entries[0].e_tag  = ACL_USER_OBJ;
345 	acl->a_entries[0].e_perm = (mode & S_IRWXU) >> 6;
346 
347 	acl->a_entries[1].e_tag  = ACL_GROUP_OBJ;
348 	acl->a_entries[1].e_perm = (mode & S_IRWXG) >> 3;
349 
350 	acl->a_entries[2].e_tag  = ACL_OTHER;
351 	acl->a_entries[2].e_perm = (mode & S_IRWXO);
352 	return acl;
353 }
354 EXPORT_SYMBOL(posix_acl_from_mode);
355 
356 /*
357  * Return 0 if current is granted want access to the inode
358  * by the acl. Returns -E... otherwise.
359  */
360 int
361 posix_acl_permission(struct user_namespace *mnt_userns, struct inode *inode,
362 		     const struct posix_acl *acl, int want)
363 {
364 	const struct posix_acl_entry *pa, *pe, *mask_obj;
365 	struct user_namespace *fs_userns = i_user_ns(inode);
366 	int found = 0;
367 	vfsuid_t vfsuid;
368 	vfsgid_t vfsgid;
369 
370 	want &= MAY_READ | MAY_WRITE | MAY_EXEC;
371 
372 	FOREACH_ACL_ENTRY(pa, acl, pe) {
373                 switch(pa->e_tag) {
374                         case ACL_USER_OBJ:
375 				/* (May have been checked already) */
376 				vfsuid = i_uid_into_vfsuid(mnt_userns, inode);
377 				if (vfsuid_eq_kuid(vfsuid, current_fsuid()))
378                                         goto check_perm;
379                                 break;
380                         case ACL_USER:
381 				vfsuid = make_vfsuid(mnt_userns, fs_userns,
382 						     pa->e_uid);
383 				if (vfsuid_eq_kuid(vfsuid, current_fsuid()))
384                                         goto mask;
385 				break;
386                         case ACL_GROUP_OBJ:
387 				vfsgid = i_gid_into_vfsgid(mnt_userns, inode);
388 				if (vfsgid_in_group_p(vfsgid)) {
389 					found = 1;
390 					if ((pa->e_perm & want) == want)
391 						goto mask;
392                                 }
393 				break;
394                         case ACL_GROUP:
395 				vfsgid = make_vfsgid(mnt_userns, fs_userns,
396 						     pa->e_gid);
397 				if (vfsgid_in_group_p(vfsgid)) {
398 					found = 1;
399 					if ((pa->e_perm & want) == want)
400 						goto mask;
401                                 }
402                                 break;
403                         case ACL_MASK:
404                                 break;
405                         case ACL_OTHER:
406 				if (found)
407 					return -EACCES;
408 				else
409 					goto check_perm;
410 			default:
411 				return -EIO;
412                 }
413         }
414 	return -EIO;
415 
416 mask:
417 	for (mask_obj = pa+1; mask_obj != pe; mask_obj++) {
418 		if (mask_obj->e_tag == ACL_MASK) {
419 			if ((pa->e_perm & mask_obj->e_perm & want) == want)
420 				return 0;
421 			return -EACCES;
422 		}
423 	}
424 
425 check_perm:
426 	if ((pa->e_perm & want) == want)
427 		return 0;
428 	return -EACCES;
429 }
430 
431 /*
432  * Modify acl when creating a new inode. The caller must ensure the acl is
433  * only referenced once.
434  *
435  * mode_p initially must contain the mode parameter to the open() / creat()
436  * system calls. All permissions that are not granted by the acl are removed.
437  * The permissions in the acl are changed to reflect the mode_p parameter.
438  */
439 static int posix_acl_create_masq(struct posix_acl *acl, umode_t *mode_p)
440 {
441 	struct posix_acl_entry *pa, *pe;
442 	struct posix_acl_entry *group_obj = NULL, *mask_obj = NULL;
443 	umode_t mode = *mode_p;
444 	int not_equiv = 0;
445 
446 	/* assert(atomic_read(acl->a_refcount) == 1); */
447 
448 	FOREACH_ACL_ENTRY(pa, acl, pe) {
449                 switch(pa->e_tag) {
450                         case ACL_USER_OBJ:
451 				pa->e_perm &= (mode >> 6) | ~S_IRWXO;
452 				mode &= (pa->e_perm << 6) | ~S_IRWXU;
453 				break;
454 
455 			case ACL_USER:
456 			case ACL_GROUP:
457 				not_equiv = 1;
458 				break;
459 
460                         case ACL_GROUP_OBJ:
461 				group_obj = pa;
462                                 break;
463 
464                         case ACL_OTHER:
465 				pa->e_perm &= mode | ~S_IRWXO;
466 				mode &= pa->e_perm | ~S_IRWXO;
467                                 break;
468 
469                         case ACL_MASK:
470 				mask_obj = pa;
471 				not_equiv = 1;
472                                 break;
473 
474 			default:
475 				return -EIO;
476                 }
477         }
478 
479 	if (mask_obj) {
480 		mask_obj->e_perm &= (mode >> 3) | ~S_IRWXO;
481 		mode &= (mask_obj->e_perm << 3) | ~S_IRWXG;
482 	} else {
483 		if (!group_obj)
484 			return -EIO;
485 		group_obj->e_perm &= (mode >> 3) | ~S_IRWXO;
486 		mode &= (group_obj->e_perm << 3) | ~S_IRWXG;
487 	}
488 
489 	*mode_p = (*mode_p & ~S_IRWXUGO) | mode;
490         return not_equiv;
491 }
492 
493 /*
494  * Modify the ACL for the chmod syscall.
495  */
496 static int __posix_acl_chmod_masq(struct posix_acl *acl, umode_t mode)
497 {
498 	struct posix_acl_entry *group_obj = NULL, *mask_obj = NULL;
499 	struct posix_acl_entry *pa, *pe;
500 
501 	/* assert(atomic_read(acl->a_refcount) == 1); */
502 
503 	FOREACH_ACL_ENTRY(pa, acl, pe) {
504 		switch(pa->e_tag) {
505 			case ACL_USER_OBJ:
506 				pa->e_perm = (mode & S_IRWXU) >> 6;
507 				break;
508 
509 			case ACL_USER:
510 			case ACL_GROUP:
511 				break;
512 
513 			case ACL_GROUP_OBJ:
514 				group_obj = pa;
515 				break;
516 
517 			case ACL_MASK:
518 				mask_obj = pa;
519 				break;
520 
521 			case ACL_OTHER:
522 				pa->e_perm = (mode & S_IRWXO);
523 				break;
524 
525 			default:
526 				return -EIO;
527 		}
528 	}
529 
530 	if (mask_obj) {
531 		mask_obj->e_perm = (mode & S_IRWXG) >> 3;
532 	} else {
533 		if (!group_obj)
534 			return -EIO;
535 		group_obj->e_perm = (mode & S_IRWXG) >> 3;
536 	}
537 
538 	return 0;
539 }
540 
541 int
542 __posix_acl_create(struct posix_acl **acl, gfp_t gfp, umode_t *mode_p)
543 {
544 	struct posix_acl *clone = posix_acl_clone(*acl, gfp);
545 	int err = -ENOMEM;
546 	if (clone) {
547 		err = posix_acl_create_masq(clone, mode_p);
548 		if (err < 0) {
549 			posix_acl_release(clone);
550 			clone = NULL;
551 		}
552 	}
553 	posix_acl_release(*acl);
554 	*acl = clone;
555 	return err;
556 }
557 EXPORT_SYMBOL(__posix_acl_create);
558 
559 int
560 __posix_acl_chmod(struct posix_acl **acl, gfp_t gfp, umode_t mode)
561 {
562 	struct posix_acl *clone = posix_acl_clone(*acl, gfp);
563 	int err = -ENOMEM;
564 	if (clone) {
565 		err = __posix_acl_chmod_masq(clone, mode);
566 		if (err) {
567 			posix_acl_release(clone);
568 			clone = NULL;
569 		}
570 	}
571 	posix_acl_release(*acl);
572 	*acl = clone;
573 	return err;
574 }
575 EXPORT_SYMBOL(__posix_acl_chmod);
576 
577 /**
578  * posix_acl_chmod - chmod a posix acl
579  *
580  * @mnt_userns:	user namespace of the mount @inode was found from
581  * @dentry:	dentry to check permissions on
582  * @mode:	the new mode of @inode
583  *
584  * If the dentry has been found through an idmapped mount the user namespace of
585  * the vfsmount must be passed through @mnt_userns. This function will then
586  * take care to map the inode according to @mnt_userns before checking
587  * permissions. On non-idmapped mounts or if permission checking is to be
588  * performed on the raw inode simply passs init_user_ns.
589  */
590 int
591  posix_acl_chmod(struct user_namespace *mnt_userns, struct dentry *dentry,
592 		    umode_t mode)
593 {
594 	struct inode *inode = d_inode(dentry);
595 	struct posix_acl *acl;
596 	int ret = 0;
597 
598 	if (!IS_POSIXACL(inode))
599 		return 0;
600 	if (!inode->i_op->set_acl)
601 		return -EOPNOTSUPP;
602 
603 	acl = get_acl(inode, ACL_TYPE_ACCESS);
604 	if (IS_ERR_OR_NULL(acl)) {
605 		if (acl == ERR_PTR(-EOPNOTSUPP))
606 			return 0;
607 		return PTR_ERR(acl);
608 	}
609 
610 	ret = __posix_acl_chmod(&acl, GFP_KERNEL, mode);
611 	if (ret)
612 		return ret;
613 	ret = inode->i_op->set_acl(mnt_userns, dentry, acl, ACL_TYPE_ACCESS);
614 	posix_acl_release(acl);
615 	return ret;
616 }
617 EXPORT_SYMBOL(posix_acl_chmod);
618 
619 int
620 posix_acl_create(struct inode *dir, umode_t *mode,
621 		struct posix_acl **default_acl, struct posix_acl **acl)
622 {
623 	struct posix_acl *p;
624 	struct posix_acl *clone;
625 	int ret;
626 
627 	*acl = NULL;
628 	*default_acl = NULL;
629 
630 	if (S_ISLNK(*mode) || !IS_POSIXACL(dir))
631 		return 0;
632 
633 	p = get_acl(dir, ACL_TYPE_DEFAULT);
634 	if (!p || p == ERR_PTR(-EOPNOTSUPP)) {
635 		*mode &= ~current_umask();
636 		return 0;
637 	}
638 	if (IS_ERR(p))
639 		return PTR_ERR(p);
640 
641 	ret = -ENOMEM;
642 	clone = posix_acl_clone(p, GFP_NOFS);
643 	if (!clone)
644 		goto err_release;
645 
646 	ret = posix_acl_create_masq(clone, mode);
647 	if (ret < 0)
648 		goto err_release_clone;
649 
650 	if (ret == 0)
651 		posix_acl_release(clone);
652 	else
653 		*acl = clone;
654 
655 	if (!S_ISDIR(*mode))
656 		posix_acl_release(p);
657 	else
658 		*default_acl = p;
659 
660 	return 0;
661 
662 err_release_clone:
663 	posix_acl_release(clone);
664 err_release:
665 	posix_acl_release(p);
666 	return ret;
667 }
668 EXPORT_SYMBOL_GPL(posix_acl_create);
669 
670 /**
671  * posix_acl_update_mode  -  update mode in set_acl
672  * @mnt_userns:	user namespace of the mount @inode was found from
673  * @inode:	target inode
674  * @mode_p:	mode (pointer) for update
675  * @acl:	acl pointer
676  *
677  * Update the file mode when setting an ACL: compute the new file permission
678  * bits based on the ACL.  In addition, if the ACL is equivalent to the new
679  * file mode, set *@acl to NULL to indicate that no ACL should be set.
680  *
681  * As with chmod, clear the setgid bit if the caller is not in the owning group
682  * or capable of CAP_FSETID (see inode_change_ok).
683  *
684  * If the inode has been found through an idmapped mount the user namespace of
685  * the vfsmount must be passed through @mnt_userns. This function will then
686  * take care to map the inode according to @mnt_userns before checking
687  * permissions. On non-idmapped mounts or if permission checking is to be
688  * performed on the raw inode simply passs init_user_ns.
689  *
690  * Called from set_acl inode operations.
691  */
692 int posix_acl_update_mode(struct user_namespace *mnt_userns,
693 			  struct inode *inode, umode_t *mode_p,
694 			  struct posix_acl **acl)
695 {
696 	umode_t mode = inode->i_mode;
697 	int error;
698 
699 	error = posix_acl_equiv_mode(*acl, &mode);
700 	if (error < 0)
701 		return error;
702 	if (error == 0)
703 		*acl = NULL;
704 	if (!vfsgid_in_group_p(i_gid_into_vfsgid(mnt_userns, inode)) &&
705 	    !capable_wrt_inode_uidgid(mnt_userns, inode, CAP_FSETID))
706 		mode &= ~S_ISGID;
707 	*mode_p = mode;
708 	return 0;
709 }
710 EXPORT_SYMBOL(posix_acl_update_mode);
711 
712 /*
713  * Fix up the uids and gids in posix acl extended attributes in place.
714  */
715 static int posix_acl_fix_xattr_common(const void *value, size_t size)
716 {
717 	const struct posix_acl_xattr_header *header = value;
718 	int count;
719 
720 	if (!header)
721 		return -EINVAL;
722 	if (size < sizeof(struct posix_acl_xattr_header))
723 		return -EINVAL;
724 	if (header->a_version != cpu_to_le32(POSIX_ACL_XATTR_VERSION))
725 		return -EOPNOTSUPP;
726 
727 	count = posix_acl_xattr_count(size);
728 	if (count < 0)
729 		return -EINVAL;
730 	if (count == 0)
731 		return 0;
732 
733 	return count;
734 }
735 
736 void posix_acl_getxattr_idmapped_mnt(struct user_namespace *mnt_userns,
737 				     const struct inode *inode,
738 				     void *value, size_t size)
739 {
740 	struct posix_acl_xattr_header *header = value;
741 	struct posix_acl_xattr_entry *entry = (void *)(header + 1), *end;
742 	struct user_namespace *fs_userns = i_user_ns(inode);
743 	int count;
744 	vfsuid_t vfsuid;
745 	vfsgid_t vfsgid;
746 	kuid_t uid;
747 	kgid_t gid;
748 
749 	if (no_idmapping(mnt_userns, i_user_ns(inode)))
750 		return;
751 
752 	count = posix_acl_fix_xattr_common(value, size);
753 	if (count <= 0)
754 		return;
755 
756 	for (end = entry + count; entry != end; entry++) {
757 		switch (le16_to_cpu(entry->e_tag)) {
758 		case ACL_USER:
759 			uid = make_kuid(&init_user_ns, le32_to_cpu(entry->e_id));
760 			vfsuid = make_vfsuid(mnt_userns, fs_userns, uid);
761 			entry->e_id = cpu_to_le32(from_kuid(&init_user_ns,
762 						vfsuid_into_kuid(vfsuid)));
763 			break;
764 		case ACL_GROUP:
765 			gid = make_kgid(&init_user_ns, le32_to_cpu(entry->e_id));
766 			vfsgid = make_vfsgid(mnt_userns, fs_userns, gid);
767 			entry->e_id = cpu_to_le32(from_kgid(&init_user_ns,
768 						vfsgid_into_kgid(vfsgid)));
769 			break;
770 		default:
771 			break;
772 		}
773 	}
774 }
775 
776 static void posix_acl_fix_xattr_userns(
777 	struct user_namespace *to, struct user_namespace *from,
778 	void *value, size_t size)
779 {
780 	struct posix_acl_xattr_header *header = value;
781 	struct posix_acl_xattr_entry *entry = (void *)(header + 1), *end;
782 	int count;
783 	kuid_t uid;
784 	kgid_t gid;
785 
786 	count = posix_acl_fix_xattr_common(value, size);
787 	if (count <= 0)
788 		return;
789 
790 	for (end = entry + count; entry != end; entry++) {
791 		switch(le16_to_cpu(entry->e_tag)) {
792 		case ACL_USER:
793 			uid = make_kuid(from, le32_to_cpu(entry->e_id));
794 			entry->e_id = cpu_to_le32(from_kuid(to, uid));
795 			break;
796 		case ACL_GROUP:
797 			gid = make_kgid(from, le32_to_cpu(entry->e_id));
798 			entry->e_id = cpu_to_le32(from_kgid(to, gid));
799 			break;
800 		default:
801 			break;
802 		}
803 	}
804 }
805 
806 void posix_acl_fix_xattr_from_user(void *value, size_t size)
807 {
808 	struct user_namespace *user_ns = current_user_ns();
809 	if (user_ns == &init_user_ns)
810 		return;
811 	posix_acl_fix_xattr_userns(&init_user_ns, user_ns, value, size);
812 }
813 
814 void posix_acl_fix_xattr_to_user(void *value, size_t size)
815 {
816 	struct user_namespace *user_ns = current_user_ns();
817 	if (user_ns == &init_user_ns)
818 		return;
819 	posix_acl_fix_xattr_userns(user_ns, &init_user_ns, value, size);
820 }
821 
822 /**
823  * make_posix_acl - convert POSIX ACLs from uapi to VFS format using the
824  *                  provided callbacks to map ACL_{GROUP,USER} entries into the
825  *                  appropriate format
826  * @mnt_userns: the mount's idmapping
827  * @fs_userns: the filesystem's idmapping
828  * @value: the uapi representation of POSIX ACLs
829  * @size: the size of @void
830  * @uid_cb: callback to use for mapping the uid stored in ACL_USER entries
831  * @gid_cb: callback to use for mapping the gid stored in ACL_GROUP entries
832  *
833  * The make_posix_acl() helper is an abstraction to translate from uapi format
834  * into the VFS format allowing the caller to specific callbacks to map
835  * ACL_{GROUP,USER} entries into the expected format. This is used in
836  * posix_acl_from_xattr() and vfs_set_acl_prepare() and avoids pointless code
837  * duplication.
838  *
839  * Return: Allocated struct posix_acl on success, NULL for a valid header but
840  *         without actual POSIX ACL entries, or ERR_PTR() encoded error code.
841  */
842 static struct posix_acl *make_posix_acl(struct user_namespace *mnt_userns,
843 	struct user_namespace *fs_userns, const void *value, size_t size,
844 	kuid_t (*uid_cb)(struct user_namespace *, struct user_namespace *,
845 			 const struct posix_acl_xattr_entry *),
846 	kgid_t (*gid_cb)(struct user_namespace *, struct user_namespace *,
847 			 const struct posix_acl_xattr_entry *))
848 {
849 	const struct posix_acl_xattr_header *header = value;
850 	const struct posix_acl_xattr_entry *entry = (const void *)(header + 1), *end;
851 	int count;
852 	struct posix_acl *acl;
853 	struct posix_acl_entry *acl_e;
854 
855 	count = posix_acl_fix_xattr_common(value, size);
856 	if (count < 0)
857 		return ERR_PTR(count);
858 	if (count == 0)
859 		return NULL;
860 
861 	acl = posix_acl_alloc(count, GFP_NOFS);
862 	if (!acl)
863 		return ERR_PTR(-ENOMEM);
864 	acl_e = acl->a_entries;
865 
866 	for (end = entry + count; entry != end; acl_e++, entry++) {
867 		acl_e->e_tag  = le16_to_cpu(entry->e_tag);
868 		acl_e->e_perm = le16_to_cpu(entry->e_perm);
869 
870 		switch(acl_e->e_tag) {
871 			case ACL_USER_OBJ:
872 			case ACL_GROUP_OBJ:
873 			case ACL_MASK:
874 			case ACL_OTHER:
875 				break;
876 
877 			case ACL_USER:
878 				acl_e->e_uid = uid_cb(mnt_userns, fs_userns, entry);
879 				if (!uid_valid(acl_e->e_uid))
880 					goto fail;
881 				break;
882 			case ACL_GROUP:
883 				acl_e->e_gid = gid_cb(mnt_userns, fs_userns, entry);
884 				if (!gid_valid(acl_e->e_gid))
885 					goto fail;
886 				break;
887 
888 			default:
889 				goto fail;
890 		}
891 	}
892 	return acl;
893 
894 fail:
895 	posix_acl_release(acl);
896 	return ERR_PTR(-EINVAL);
897 }
898 
899 /**
900  * vfs_set_acl_prepare_kuid - map ACL_USER uid according to mount- and
901  *                            filesystem idmapping
902  * @mnt_userns: the mount's idmapping
903  * @fs_userns: the filesystem's idmapping
904  * @e: a ACL_USER entry in POSIX ACL uapi format
905  *
906  * The uid stored as ACL_USER entry in @e is a kuid_t stored as a raw {g,u}id
907  * value. The vfs_set_acl_prepare_kuid() will recover the kuid_t through
908  * KUIDT_INIT() and then map it according to the idmapped mount. The resulting
909  * kuid_t is the value which the filesystem can map up into a raw backing store
910  * id in the filesystem's idmapping.
911  *
912  * This is used in vfs_set_acl_prepare() to generate the proper VFS
913  * representation of POSIX ACLs with ACL_USER entries during setxattr().
914  *
915  * Return: A kuid in @fs_userns for the uid stored in @e.
916  */
917 static inline kuid_t
918 vfs_set_acl_prepare_kuid(struct user_namespace *mnt_userns,
919 			 struct user_namespace *fs_userns,
920 			 const struct posix_acl_xattr_entry *e)
921 {
922 	kuid_t kuid = KUIDT_INIT(le32_to_cpu(e->e_id));
923 	return from_vfsuid(mnt_userns, fs_userns, VFSUIDT_INIT(kuid));
924 }
925 
926 /**
927  * vfs_set_acl_prepare_kgid - map ACL_GROUP gid according to mount- and
928  *                            filesystem idmapping
929  * @mnt_userns: the mount's idmapping
930  * @fs_userns: the filesystem's idmapping
931  * @e: a ACL_GROUP entry in POSIX ACL uapi format
932  *
933  * The gid stored as ACL_GROUP entry in @e is a kgid_t stored as a raw {g,u}id
934  * value. The vfs_set_acl_prepare_kgid() will recover the kgid_t through
935  * KGIDT_INIT() and then map it according to the idmapped mount. The resulting
936  * kgid_t is the value which the filesystem can map up into a raw backing store
937  * id in the filesystem's idmapping.
938  *
939  * This is used in vfs_set_acl_prepare() to generate the proper VFS
940  * representation of POSIX ACLs with ACL_GROUP entries during setxattr().
941  *
942  * Return: A kgid in @fs_userns for the gid stored in @e.
943  */
944 static inline kgid_t
945 vfs_set_acl_prepare_kgid(struct user_namespace *mnt_userns,
946 			 struct user_namespace *fs_userns,
947 			 const struct posix_acl_xattr_entry *e)
948 {
949 	kgid_t kgid = KGIDT_INIT(le32_to_cpu(e->e_id));
950 	return from_vfsgid(mnt_userns, fs_userns, VFSGIDT_INIT(kgid));
951 }
952 
953 /**
954  * vfs_set_acl_prepare - convert POSIX ACLs from uapi to VFS format taking
955  *                       mount and filesystem idmappings into account
956  * @mnt_userns: the mount's idmapping
957  * @fs_userns: the filesystem's idmapping
958  * @value: the uapi representation of POSIX ACLs
959  * @size: the size of @void
960  *
961  * When setting POSIX ACLs with ACL_{GROUP,USER} entries they need to be
962  * mapped according to the relevant mount- and filesystem idmapping. It is
963  * important that the ACL_{GROUP,USER} entries in struct posix_acl will be
964  * mapped into k{g,u}id_t that are supposed to be mapped up in the filesystem
965  * idmapping. This is crucial since the resulting struct posix_acl might be
966  * cached filesystem wide. The vfs_set_acl_prepare() function will take care to
967  * perform all necessary idmappings.
968  *
969  * Note, that since basically forever the {g,u}id values encoded as
970  * ACL_{GROUP,USER} entries in the uapi POSIX ACLs passed via @value contain
971  * values that have been mapped according to the caller's idmapping. In other
972  * words, POSIX ACLs passed in uapi format as @value during setxattr() contain
973  * {g,u}id values in their ACL_{GROUP,USER} entries that should actually have
974  * been stored as k{g,u}id_t.
975  *
976  * This means, vfs_set_acl_prepare() needs to first recover the k{g,u}id_t by
977  * calling K{G,U}IDT_INIT(). Afterwards they can be interpreted as vfs{g,u}id_t
978  * through from_vfs{g,u}id() to account for any idmapped mounts. The
979  * vfs_set_acl_prepare_k{g,u}id() helpers will take care to generate the
980  * correct k{g,u}id_t.
981  *
982  * The filesystem will then receive the POSIX ACLs ready to be cached
983  * filesystem wide and ready to be written to the backing store taking the
984  * filesystem's idmapping into account.
985  *
986  * Return: Allocated struct posix_acl on success, NULL for a valid header but
987  *         without actual POSIX ACL entries, or ERR_PTR() encoded error code.
988  */
989 struct posix_acl *vfs_set_acl_prepare(struct user_namespace *mnt_userns,
990 				      struct user_namespace *fs_userns,
991 				      const void *value, size_t size)
992 {
993 	return make_posix_acl(mnt_userns, fs_userns, value, size,
994 			      vfs_set_acl_prepare_kuid,
995 			      vfs_set_acl_prepare_kgid);
996 }
997 EXPORT_SYMBOL(vfs_set_acl_prepare);
998 
999 /**
1000  * posix_acl_from_xattr_kuid - map ACL_USER uid into filesystem idmapping
1001  * @mnt_userns: unused
1002  * @fs_userns: the filesystem's idmapping
1003  * @e: a ACL_USER entry in POSIX ACL uapi format
1004  *
1005  * Map the uid stored as ACL_USER entry in @e into the filesystem's idmapping.
1006  * This is used in posix_acl_from_xattr() to generate the proper VFS
1007  * representation of POSIX ACLs with ACL_USER entries.
1008  *
1009  * Return: A kuid in @fs_userns for the uid stored in @e.
1010  */
1011 static inline kuid_t
1012 posix_acl_from_xattr_kuid(struct user_namespace *mnt_userns,
1013 			  struct user_namespace *fs_userns,
1014 			  const struct posix_acl_xattr_entry *e)
1015 {
1016 	return make_kuid(fs_userns, le32_to_cpu(e->e_id));
1017 }
1018 
1019 /**
1020  * posix_acl_from_xattr_kgid - map ACL_GROUP gid into filesystem idmapping
1021  * @mnt_userns: unused
1022  * @fs_userns: the filesystem's idmapping
1023  * @e: a ACL_GROUP entry in POSIX ACL uapi format
1024  *
1025  * Map the gid stored as ACL_GROUP entry in @e into the filesystem's idmapping.
1026  * This is used in posix_acl_from_xattr() to generate the proper VFS
1027  * representation of POSIX ACLs with ACL_GROUP entries.
1028  *
1029  * Return: A kgid in @fs_userns for the gid stored in @e.
1030  */
1031 static inline kgid_t
1032 posix_acl_from_xattr_kgid(struct user_namespace *mnt_userns,
1033 			  struct user_namespace *fs_userns,
1034 			  const struct posix_acl_xattr_entry *e)
1035 {
1036 	return make_kgid(fs_userns, le32_to_cpu(e->e_id));
1037 }
1038 
1039 /**
1040  * posix_acl_from_xattr - convert POSIX ACLs from backing store to VFS format
1041  * @fs_userns: the filesystem's idmapping
1042  * @value: the uapi representation of POSIX ACLs
1043  * @size: the size of @void
1044  *
1045  * Filesystems that store POSIX ACLs in the unaltered uapi format should use
1046  * posix_acl_from_xattr() when reading them from the backing store and
1047  * converting them into the struct posix_acl VFS format. The helper is
1048  * specifically intended to be called from the ->get_acl() inode operation.
1049  *
1050  * The posix_acl_from_xattr() function will map the raw {g,u}id values stored
1051  * in ACL_{GROUP,USER} entries into the filesystem idmapping in @fs_userns. The
1052  * posix_acl_from_xattr_k{g,u}id() helpers will take care to generate the
1053  * correct k{g,u}id_t. The returned struct posix_acl can be cached.
1054  *
1055  * Note that posix_acl_from_xattr() does not take idmapped mounts into account.
1056  * If it did it calling is from the ->get_acl() inode operation would return
1057  * POSIX ACLs mapped according to an idmapped mount which would mean that the
1058  * value couldn't be cached for the filesystem. Idmapped mounts are taken into
1059  * account on the fly during permission checking or right at the VFS -
1060  * userspace boundary before reporting them to the user.
1061  *
1062  * Return: Allocated struct posix_acl on success, NULL for a valid header but
1063  *         without actual POSIX ACL entries, or ERR_PTR() encoded error code.
1064  */
1065 struct posix_acl *
1066 posix_acl_from_xattr(struct user_namespace *fs_userns,
1067 		     const void *value, size_t size)
1068 {
1069 	return make_posix_acl(&init_user_ns, fs_userns, value, size,
1070 			      posix_acl_from_xattr_kuid,
1071 			      posix_acl_from_xattr_kgid);
1072 }
1073 EXPORT_SYMBOL (posix_acl_from_xattr);
1074 
1075 /*
1076  * Convert from in-memory to extended attribute representation.
1077  */
1078 int
1079 posix_acl_to_xattr(struct user_namespace *user_ns, const struct posix_acl *acl,
1080 		   void *buffer, size_t size)
1081 {
1082 	struct posix_acl_xattr_header *ext_acl = buffer;
1083 	struct posix_acl_xattr_entry *ext_entry;
1084 	int real_size, n;
1085 
1086 	real_size = posix_acl_xattr_size(acl->a_count);
1087 	if (!buffer)
1088 		return real_size;
1089 	if (real_size > size)
1090 		return -ERANGE;
1091 
1092 	ext_entry = (void *)(ext_acl + 1);
1093 	ext_acl->a_version = cpu_to_le32(POSIX_ACL_XATTR_VERSION);
1094 
1095 	for (n=0; n < acl->a_count; n++, ext_entry++) {
1096 		const struct posix_acl_entry *acl_e = &acl->a_entries[n];
1097 		ext_entry->e_tag  = cpu_to_le16(acl_e->e_tag);
1098 		ext_entry->e_perm = cpu_to_le16(acl_e->e_perm);
1099 		switch(acl_e->e_tag) {
1100 		case ACL_USER:
1101 			ext_entry->e_id =
1102 				cpu_to_le32(from_kuid(user_ns, acl_e->e_uid));
1103 			break;
1104 		case ACL_GROUP:
1105 			ext_entry->e_id =
1106 				cpu_to_le32(from_kgid(user_ns, acl_e->e_gid));
1107 			break;
1108 		default:
1109 			ext_entry->e_id = cpu_to_le32(ACL_UNDEFINED_ID);
1110 			break;
1111 		}
1112 	}
1113 	return real_size;
1114 }
1115 EXPORT_SYMBOL (posix_acl_to_xattr);
1116 
1117 static int
1118 posix_acl_xattr_get(const struct xattr_handler *handler,
1119 		    struct dentry *unused, struct inode *inode,
1120 		    const char *name, void *value, size_t size)
1121 {
1122 	struct posix_acl *acl;
1123 	int error;
1124 
1125 	if (!IS_POSIXACL(inode))
1126 		return -EOPNOTSUPP;
1127 	if (S_ISLNK(inode->i_mode))
1128 		return -EOPNOTSUPP;
1129 
1130 	acl = get_acl(inode, handler->flags);
1131 	if (IS_ERR(acl))
1132 		return PTR_ERR(acl);
1133 	if (acl == NULL)
1134 		return -ENODATA;
1135 
1136 	error = posix_acl_to_xattr(&init_user_ns, acl, value, size);
1137 	posix_acl_release(acl);
1138 
1139 	return error;
1140 }
1141 
1142 int
1143 set_posix_acl(struct user_namespace *mnt_userns, struct dentry *dentry,
1144 	      int type, struct posix_acl *acl)
1145 {
1146 	struct inode *inode = d_inode(dentry);
1147 
1148 	if (!IS_POSIXACL(inode))
1149 		return -EOPNOTSUPP;
1150 	if (!inode->i_op->set_acl)
1151 		return -EOPNOTSUPP;
1152 
1153 	if (type == ACL_TYPE_DEFAULT && !S_ISDIR(inode->i_mode))
1154 		return acl ? -EACCES : 0;
1155 	if (!inode_owner_or_capable(mnt_userns, inode))
1156 		return -EPERM;
1157 
1158 	if (acl) {
1159 		int ret = posix_acl_valid(inode->i_sb->s_user_ns, acl);
1160 		if (ret)
1161 			return ret;
1162 	}
1163 	return inode->i_op->set_acl(mnt_userns, dentry, acl, type);
1164 }
1165 EXPORT_SYMBOL(set_posix_acl);
1166 
1167 static int
1168 posix_acl_xattr_set(const struct xattr_handler *handler,
1169 			   struct user_namespace *mnt_userns,
1170 			   struct dentry *dentry, struct inode *inode,
1171 			   const char *name, const void *value, size_t size,
1172 			   int flags)
1173 {
1174 	struct posix_acl *acl = NULL;
1175 	int ret;
1176 
1177 	if (value) {
1178 		/*
1179 		 * By the time we end up here the {g,u}ids stored in
1180 		 * ACL_{GROUP,USER} have already been mapped according to the
1181 		 * caller's idmapping. The vfs_set_acl_prepare() helper will
1182 		 * recover them and take idmapped mounts into account. The
1183 		 * filesystem will receive the POSIX ACLs in the correct
1184 		 * format ready to be cached or written to the backing store
1185 		 * taking the filesystem idmapping into account.
1186 		 */
1187 		acl = vfs_set_acl_prepare(mnt_userns, i_user_ns(inode),
1188 					  value, size);
1189 		if (IS_ERR(acl))
1190 			return PTR_ERR(acl);
1191 	}
1192 	ret = set_posix_acl(mnt_userns, dentry, handler->flags, acl);
1193 	posix_acl_release(acl);
1194 	return ret;
1195 }
1196 
1197 static bool
1198 posix_acl_xattr_list(struct dentry *dentry)
1199 {
1200 	return IS_POSIXACL(d_backing_inode(dentry));
1201 }
1202 
1203 const struct xattr_handler posix_acl_access_xattr_handler = {
1204 	.name = XATTR_NAME_POSIX_ACL_ACCESS,
1205 	.flags = ACL_TYPE_ACCESS,
1206 	.list = posix_acl_xattr_list,
1207 	.get = posix_acl_xattr_get,
1208 	.set = posix_acl_xattr_set,
1209 };
1210 EXPORT_SYMBOL_GPL(posix_acl_access_xattr_handler);
1211 
1212 const struct xattr_handler posix_acl_default_xattr_handler = {
1213 	.name = XATTR_NAME_POSIX_ACL_DEFAULT,
1214 	.flags = ACL_TYPE_DEFAULT,
1215 	.list = posix_acl_xattr_list,
1216 	.get = posix_acl_xattr_get,
1217 	.set = posix_acl_xattr_set,
1218 };
1219 EXPORT_SYMBOL_GPL(posix_acl_default_xattr_handler);
1220 
1221 int simple_set_acl(struct user_namespace *mnt_userns, struct dentry *dentry,
1222 		   struct posix_acl *acl, int type)
1223 {
1224 	int error;
1225 	struct inode *inode = d_inode(dentry);
1226 
1227 	if (type == ACL_TYPE_ACCESS) {
1228 		error = posix_acl_update_mode(mnt_userns, inode,
1229 				&inode->i_mode, &acl);
1230 		if (error)
1231 			return error;
1232 	}
1233 
1234 	inode->i_ctime = current_time(inode);
1235 	if (IS_I_VERSION(inode))
1236 		inode_inc_iversion(inode);
1237 	set_cached_acl(inode, type, acl);
1238 	return 0;
1239 }
1240 
1241 int simple_acl_create(struct inode *dir, struct inode *inode)
1242 {
1243 	struct posix_acl *default_acl, *acl;
1244 	int error;
1245 
1246 	error = posix_acl_create(dir, &inode->i_mode, &default_acl, &acl);
1247 	if (error)
1248 		return error;
1249 
1250 	set_cached_acl(inode, ACL_TYPE_DEFAULT, default_acl);
1251 	set_cached_acl(inode, ACL_TYPE_ACCESS, acl);
1252 
1253 	if (default_acl)
1254 		posix_acl_release(default_acl);
1255 	if (acl)
1256 		posix_acl_release(acl);
1257 	return 0;
1258 }
1259