| // SPDX-License-Identifier: GPL-2.0 | 
 | /* | 
 |  *  linux/fs/attr.c | 
 |  * | 
 |  *  Copyright (C) 1991, 1992  Linus Torvalds | 
 |  *  changes by Thomas Schoebel-Theuer | 
 |  */ | 
 |  | 
 | #include <linux/export.h> | 
 | #include <linux/time.h> | 
 | #include <linux/mm.h> | 
 | #include <linux/string.h> | 
 | #include <linux/sched/signal.h> | 
 | #include <linux/capability.h> | 
 | #include <linux/fsnotify.h> | 
 | #include <linux/fcntl.h> | 
 | #include <linux/filelock.h> | 
 | #include <linux/security.h> | 
 | #include <linux/evm.h> | 
 | #include <linux/ima.h> | 
 |  | 
 | #include "internal.h" | 
 |  | 
 | /** | 
 |  * setattr_should_drop_sgid - determine whether the setgid bit needs to be | 
 |  *                            removed | 
 |  * @idmap:	idmap of the mount @inode was found from | 
 |  * @inode:	inode to check | 
 |  * | 
 |  * This function determines whether the setgid bit needs to be removed. | 
 |  * We retain backwards compatibility and require setgid bit to be removed | 
 |  * unconditionally if S_IXGRP is set. Otherwise we have the exact same | 
 |  * requirements as setattr_prepare() and setattr_copy(). | 
 |  * | 
 |  * Return: ATTR_KILL_SGID if setgid bit needs to be removed, 0 otherwise. | 
 |  */ | 
 | int setattr_should_drop_sgid(struct mnt_idmap *idmap, | 
 | 			     const struct inode *inode) | 
 | { | 
 | 	umode_t mode = inode->i_mode; | 
 |  | 
 | 	if (!(mode & S_ISGID)) | 
 | 		return 0; | 
 | 	if (mode & S_IXGRP) | 
 | 		return ATTR_KILL_SGID; | 
 | 	if (!in_group_or_capable(idmap, inode, i_gid_into_vfsgid(idmap, inode))) | 
 | 		return ATTR_KILL_SGID; | 
 | 	return 0; | 
 | } | 
 | EXPORT_SYMBOL(setattr_should_drop_sgid); | 
 |  | 
 | /** | 
 |  * setattr_should_drop_suidgid - determine whether the set{g,u}id bit needs to | 
 |  *                               be dropped | 
 |  * @idmap:	idmap of the mount @inode was found from | 
 |  * @inode:	inode to check | 
 |  * | 
 |  * This function determines whether the set{g,u}id bits need to be removed. | 
 |  * If the setuid bit needs to be removed ATTR_KILL_SUID is returned. If the | 
 |  * setgid bit needs to be removed ATTR_KILL_SGID is returned. If both | 
 |  * set{g,u}id bits need to be removed the corresponding mask of both flags is | 
 |  * returned. | 
 |  * | 
 |  * Return: A mask of ATTR_KILL_S{G,U}ID indicating which - if any - setid bits | 
 |  * to remove, 0 otherwise. | 
 |  */ | 
 | int setattr_should_drop_suidgid(struct mnt_idmap *idmap, | 
 | 				struct inode *inode) | 
 | { | 
 | 	umode_t mode = inode->i_mode; | 
 | 	int kill = 0; | 
 |  | 
 | 	/* suid always must be killed */ | 
 | 	if (unlikely(mode & S_ISUID)) | 
 | 		kill = ATTR_KILL_SUID; | 
 |  | 
 | 	kill |= setattr_should_drop_sgid(idmap, inode); | 
 |  | 
 | 	if (unlikely(kill && !capable(CAP_FSETID) && S_ISREG(mode))) | 
 | 		return kill; | 
 |  | 
 | 	return 0; | 
 | } | 
 | EXPORT_SYMBOL(setattr_should_drop_suidgid); | 
 |  | 
 | /** | 
 |  * chown_ok - verify permissions to chown inode | 
 |  * @idmap:	idmap of the mount @inode was found from | 
 |  * @inode:	inode to check permissions on | 
 |  * @ia_vfsuid:	uid to chown @inode to | 
 |  * | 
 |  * If the inode has been found through an idmapped mount the idmap of | 
 |  * the vfsmount must be passed through @idmap. This function will then | 
 |  * take care to map the inode according to @idmap before checking | 
 |  * permissions. On non-idmapped mounts or if permission checking is to be | 
 |  * performed on the raw inode simply pass @nop_mnt_idmap. | 
 |  */ | 
 | static bool chown_ok(struct mnt_idmap *idmap, | 
 | 		     const struct inode *inode, vfsuid_t ia_vfsuid) | 
 | { | 
 | 	vfsuid_t vfsuid = i_uid_into_vfsuid(idmap, inode); | 
 | 	if (vfsuid_eq_kuid(vfsuid, current_fsuid()) && | 
 | 	    vfsuid_eq(ia_vfsuid, vfsuid)) | 
 | 		return true; | 
 | 	if (capable_wrt_inode_uidgid(idmap, inode, CAP_CHOWN)) | 
 | 		return true; | 
 | 	if (!vfsuid_valid(vfsuid) && | 
 | 	    ns_capable(inode->i_sb->s_user_ns, CAP_CHOWN)) | 
 | 		return true; | 
 | 	return false; | 
 | } | 
 |  | 
 | /** | 
 |  * chgrp_ok - verify permissions to chgrp inode | 
 |  * @idmap:	idmap of the mount @inode was found from | 
 |  * @inode:	inode to check permissions on | 
 |  * @ia_vfsgid:	gid to chown @inode to | 
 |  * | 
 |  * If the inode has been found through an idmapped mount the idmap of | 
 |  * the vfsmount must be passed through @idmap. This function will then | 
 |  * take care to map the inode according to @idmap before checking | 
 |  * permissions. On non-idmapped mounts or if permission checking is to be | 
 |  * performed on the raw inode simply pass @nop_mnt_idmap. | 
 |  */ | 
 | static bool chgrp_ok(struct mnt_idmap *idmap, | 
 | 		     const struct inode *inode, vfsgid_t ia_vfsgid) | 
 | { | 
 | 	vfsgid_t vfsgid = i_gid_into_vfsgid(idmap, inode); | 
 | 	vfsuid_t vfsuid = i_uid_into_vfsuid(idmap, inode); | 
 | 	if (vfsuid_eq_kuid(vfsuid, current_fsuid())) { | 
 | 		if (vfsgid_eq(ia_vfsgid, vfsgid)) | 
 | 			return true; | 
 | 		if (vfsgid_in_group_p(ia_vfsgid)) | 
 | 			return true; | 
 | 	} | 
 | 	if (capable_wrt_inode_uidgid(idmap, inode, CAP_CHOWN)) | 
 | 		return true; | 
 | 	if (!vfsgid_valid(vfsgid) && | 
 | 	    ns_capable(inode->i_sb->s_user_ns, CAP_CHOWN)) | 
 | 		return true; | 
 | 	return false; | 
 | } | 
 |  | 
 | /** | 
 |  * setattr_prepare - check if attribute changes to a dentry are allowed | 
 |  * @idmap:	idmap of the mount the inode was found from | 
 |  * @dentry:	dentry to check | 
 |  * @attr:	attributes to change | 
 |  * | 
 |  * Check if we are allowed to change the attributes contained in @attr | 
 |  * in the given dentry.  This includes the normal unix access permission | 
 |  * checks, as well as checks for rlimits and others. The function also clears | 
 |  * SGID bit from mode if user is not allowed to set it. Also file capabilities | 
 |  * and IMA extended attributes are cleared if ATTR_KILL_PRIV is set. | 
 |  * | 
 |  * If the inode has been found through an idmapped mount the idmap of | 
 |  * the vfsmount must be passed through @idmap. This function will then | 
 |  * take care to map the inode according to @idmap before checking | 
 |  * permissions. On non-idmapped mounts or if permission checking is to be | 
 |  * performed on the raw inode simply passs @nop_mnt_idmap. | 
 |  * | 
 |  * Should be called as the first thing in ->setattr implementations, | 
 |  * possibly after taking additional locks. | 
 |  */ | 
 | int setattr_prepare(struct mnt_idmap *idmap, struct dentry *dentry, | 
 | 		    struct iattr *attr) | 
 | { | 
 | 	struct inode *inode = d_inode(dentry); | 
 | 	unsigned int ia_valid = attr->ia_valid; | 
 |  | 
 | 	/* | 
 | 	 * First check size constraints.  These can't be overriden using | 
 | 	 * ATTR_FORCE. | 
 | 	 */ | 
 | 	if (ia_valid & ATTR_SIZE) { | 
 | 		int error = inode_newsize_ok(inode, attr->ia_size); | 
 | 		if (error) | 
 | 			return error; | 
 | 	} | 
 |  | 
 | 	/* If force is set do it anyway. */ | 
 | 	if (ia_valid & ATTR_FORCE) | 
 | 		goto kill_priv; | 
 |  | 
 | 	/* Make sure a caller can chown. */ | 
 | 	if ((ia_valid & ATTR_UID) && | 
 | 	    !chown_ok(idmap, inode, attr->ia_vfsuid)) | 
 | 		return -EPERM; | 
 |  | 
 | 	/* Make sure caller can chgrp. */ | 
 | 	if ((ia_valid & ATTR_GID) && | 
 | 	    !chgrp_ok(idmap, inode, attr->ia_vfsgid)) | 
 | 		return -EPERM; | 
 |  | 
 | 	/* Make sure a caller can chmod. */ | 
 | 	if (ia_valid & ATTR_MODE) { | 
 | 		vfsgid_t vfsgid; | 
 |  | 
 | 		if (!inode_owner_or_capable(idmap, inode)) | 
 | 			return -EPERM; | 
 |  | 
 | 		if (ia_valid & ATTR_GID) | 
 | 			vfsgid = attr->ia_vfsgid; | 
 | 		else | 
 | 			vfsgid = i_gid_into_vfsgid(idmap, inode); | 
 |  | 
 | 		/* Also check the setgid bit! */ | 
 | 		if (!in_group_or_capable(idmap, inode, vfsgid)) | 
 | 			attr->ia_mode &= ~S_ISGID; | 
 | 	} | 
 |  | 
 | 	/* Check for setting the inode time. */ | 
 | 	if (ia_valid & (ATTR_MTIME_SET | ATTR_ATIME_SET | ATTR_TIMES_SET)) { | 
 | 		if (!inode_owner_or_capable(idmap, inode)) | 
 | 			return -EPERM; | 
 | 	} | 
 |  | 
 | kill_priv: | 
 | 	/* User has permission for the change */ | 
 | 	if (ia_valid & ATTR_KILL_PRIV) { | 
 | 		int error; | 
 |  | 
 | 		error = security_inode_killpriv(idmap, dentry); | 
 | 		if (error) | 
 | 			return error; | 
 | 	} | 
 |  | 
 | 	return 0; | 
 | } | 
 | EXPORT_SYMBOL(setattr_prepare); | 
 |  | 
 | /** | 
 |  * inode_newsize_ok - may this inode be truncated to a given size | 
 |  * @inode:	the inode to be truncated | 
 |  * @offset:	the new size to assign to the inode | 
 |  * | 
 |  * inode_newsize_ok must be called with i_mutex held. | 
 |  * | 
 |  * inode_newsize_ok will check filesystem limits and ulimits to check that the | 
 |  * new inode size is within limits. inode_newsize_ok will also send SIGXFSZ | 
 |  * when necessary. Caller must not proceed with inode size change if failure is | 
 |  * returned. @inode must be a file (not directory), with appropriate | 
 |  * permissions to allow truncate (inode_newsize_ok does NOT check these | 
 |  * conditions). | 
 |  * | 
 |  * Return: 0 on success, -ve errno on failure | 
 |  */ | 
 | int inode_newsize_ok(const struct inode *inode, loff_t offset) | 
 | { | 
 | 	if (offset < 0) | 
 | 		return -EINVAL; | 
 | 	if (inode->i_size < offset) { | 
 | 		unsigned long limit; | 
 |  | 
 | 		limit = rlimit(RLIMIT_FSIZE); | 
 | 		if (limit != RLIM_INFINITY && offset > limit) | 
 | 			goto out_sig; | 
 | 		if (offset > inode->i_sb->s_maxbytes) | 
 | 			goto out_big; | 
 | 	} else { | 
 | 		/* | 
 | 		 * truncation of in-use swapfiles is disallowed - it would | 
 | 		 * cause subsequent swapout to scribble on the now-freed | 
 | 		 * blocks. | 
 | 		 */ | 
 | 		if (IS_SWAPFILE(inode)) | 
 | 			return -ETXTBSY; | 
 | 	} | 
 |  | 
 | 	return 0; | 
 | out_sig: | 
 | 	send_sig(SIGXFSZ, current, 0); | 
 | out_big: | 
 | 	return -EFBIG; | 
 | } | 
 | EXPORT_SYMBOL(inode_newsize_ok); | 
 |  | 
 | /** | 
 |  * setattr_copy - copy simple metadata updates into the generic inode | 
 |  * @idmap:	idmap of the mount the inode was found from | 
 |  * @inode:	the inode to be updated | 
 |  * @attr:	the new attributes | 
 |  * | 
 |  * setattr_copy must be called with i_mutex held. | 
 |  * | 
 |  * setattr_copy updates the inode's metadata with that specified | 
 |  * in attr on idmapped mounts. Necessary permission checks to determine | 
 |  * whether or not the S_ISGID property needs to be removed are performed with | 
 |  * the correct idmapped mount permission helpers. | 
 |  * Noticeably missing is inode size update, which is more complex | 
 |  * as it requires pagecache updates. | 
 |  * | 
 |  * If the inode has been found through an idmapped mount the idmap of | 
 |  * the vfsmount must be passed through @idmap. This function will then | 
 |  * take care to map the inode according to @idmap before checking | 
 |  * permissions. On non-idmapped mounts or if permission checking is to be | 
 |  * performed on the raw inode simply pass @nop_mnt_idmap. | 
 |  * | 
 |  * The inode is not marked as dirty after this operation. The rationale is | 
 |  * that for "simple" filesystems, the struct inode is the inode storage. | 
 |  * The caller is free to mark the inode dirty afterwards if needed. | 
 |  */ | 
 | void setattr_copy(struct mnt_idmap *idmap, struct inode *inode, | 
 | 		  const struct iattr *attr) | 
 | { | 
 | 	unsigned int ia_valid = attr->ia_valid; | 
 |  | 
 | 	i_uid_update(idmap, attr, inode); | 
 | 	i_gid_update(idmap, attr, inode); | 
 | 	if (ia_valid & ATTR_ATIME) | 
 | 		inode->i_atime = attr->ia_atime; | 
 | 	if (ia_valid & ATTR_MTIME) | 
 | 		inode->i_mtime = attr->ia_mtime; | 
 | 	if (ia_valid & ATTR_CTIME) | 
 | 		inode_set_ctime_to_ts(inode, attr->ia_ctime); | 
 | 	if (ia_valid & ATTR_MODE) { | 
 | 		umode_t mode = attr->ia_mode; | 
 | 		if (!in_group_or_capable(idmap, inode, | 
 | 					 i_gid_into_vfsgid(idmap, inode))) | 
 | 			mode &= ~S_ISGID; | 
 | 		inode->i_mode = mode; | 
 | 	} | 
 | } | 
 | EXPORT_SYMBOL(setattr_copy); | 
 |  | 
 | int may_setattr(struct mnt_idmap *idmap, struct inode *inode, | 
 | 		unsigned int ia_valid) | 
 | { | 
 | 	int error; | 
 |  | 
 | 	if (ia_valid & (ATTR_MODE | ATTR_UID | ATTR_GID | ATTR_TIMES_SET)) { | 
 | 		if (IS_IMMUTABLE(inode) || IS_APPEND(inode)) | 
 | 			return -EPERM; | 
 | 	} | 
 |  | 
 | 	/* | 
 | 	 * If utimes(2) and friends are called with times == NULL (or both | 
 | 	 * times are UTIME_NOW), then we need to check for write permission | 
 | 	 */ | 
 | 	if (ia_valid & ATTR_TOUCH) { | 
 | 		if (IS_IMMUTABLE(inode)) | 
 | 			return -EPERM; | 
 |  | 
 | 		if (!inode_owner_or_capable(idmap, inode)) { | 
 | 			error = inode_permission(idmap, inode, MAY_WRITE); | 
 | 			if (error) | 
 | 				return error; | 
 | 		} | 
 | 	} | 
 | 	return 0; | 
 | } | 
 | EXPORT_SYMBOL(may_setattr); | 
 |  | 
 | /** | 
 |  * notify_change - modify attributes of a filesytem object | 
 |  * @idmap:	idmap of the mount the inode was found from | 
 |  * @dentry:	object affected | 
 |  * @attr:	new attributes | 
 |  * @delegated_inode: returns inode, if the inode is delegated | 
 |  * | 
 |  * The caller must hold the i_mutex on the affected object. | 
 |  * | 
 |  * If notify_change discovers a delegation in need of breaking, | 
 |  * it will return -EWOULDBLOCK and return a reference to the inode in | 
 |  * delegated_inode.  The caller should then break the delegation and | 
 |  * retry.  Because breaking a delegation may take a long time, the | 
 |  * caller should drop the i_mutex before doing so. | 
 |  * | 
 |  * Alternatively, a caller may pass NULL for delegated_inode.  This may | 
 |  * be appropriate for callers that expect the underlying filesystem not | 
 |  * to be NFS exported.  Also, passing NULL is fine for callers holding | 
 |  * the file open for write, as there can be no conflicting delegation in | 
 |  * that case. | 
 |  * | 
 |  * If the inode has been found through an idmapped mount the idmap of | 
 |  * the vfsmount must be passed through @idmap. This function will then | 
 |  * take care to map the inode according to @idmap before checking | 
 |  * permissions. On non-idmapped mounts or if permission checking is to be | 
 |  * performed on the raw inode simply pass @nop_mnt_idmap. | 
 |  */ | 
 | int notify_change(struct mnt_idmap *idmap, struct dentry *dentry, | 
 | 		  struct iattr *attr, struct inode **delegated_inode) | 
 | { | 
 | 	struct inode *inode = dentry->d_inode; | 
 | 	umode_t mode = inode->i_mode; | 
 | 	int error; | 
 | 	struct timespec64 now; | 
 | 	unsigned int ia_valid = attr->ia_valid; | 
 |  | 
 | 	WARN_ON_ONCE(!inode_is_locked(inode)); | 
 |  | 
 | 	error = may_setattr(idmap, inode, ia_valid); | 
 | 	if (error) | 
 | 		return error; | 
 |  | 
 | 	if ((ia_valid & ATTR_MODE)) { | 
 | 		/* | 
 | 		 * Don't allow changing the mode of symlinks: | 
 | 		 * | 
 | 		 * (1) The vfs doesn't take the mode of symlinks into account | 
 | 		 *     during permission checking. | 
 | 		 * (2) This has never worked correctly. Most major filesystems | 
 | 		 *     did return EOPNOTSUPP due to interactions with POSIX ACLs | 
 | 		 *     but did still updated the mode of the symlink. | 
 | 		 *     This inconsistency led system call wrapper providers such | 
 | 		 *     as libc to block changing the mode of symlinks with | 
 | 		 *     EOPNOTSUPP already. | 
 | 		 * (3) To even do this in the first place one would have to use | 
 | 		 *     specific file descriptors and quite some effort. | 
 | 		 */ | 
 | 		if (S_ISLNK(inode->i_mode)) | 
 | 			return -EOPNOTSUPP; | 
 |  | 
 | 		/* Flag setting protected by i_mutex */ | 
 | 		if (is_sxid(attr->ia_mode)) | 
 | 			inode->i_flags &= ~S_NOSEC; | 
 | 	} | 
 |  | 
 | 	now = current_time(inode); | 
 |  | 
 | 	attr->ia_ctime = now; | 
 | 	if (!(ia_valid & ATTR_ATIME_SET)) | 
 | 		attr->ia_atime = now; | 
 | 	else | 
 | 		attr->ia_atime = timestamp_truncate(attr->ia_atime, inode); | 
 | 	if (!(ia_valid & ATTR_MTIME_SET)) | 
 | 		attr->ia_mtime = now; | 
 | 	else | 
 | 		attr->ia_mtime = timestamp_truncate(attr->ia_mtime, inode); | 
 |  | 
 | 	if (ia_valid & ATTR_KILL_PRIV) { | 
 | 		error = security_inode_need_killpriv(dentry); | 
 | 		if (error < 0) | 
 | 			return error; | 
 | 		if (error == 0) | 
 | 			ia_valid = attr->ia_valid &= ~ATTR_KILL_PRIV; | 
 | 	} | 
 |  | 
 | 	/* | 
 | 	 * We now pass ATTR_KILL_S*ID to the lower level setattr function so | 
 | 	 * that the function has the ability to reinterpret a mode change | 
 | 	 * that's due to these bits. This adds an implicit restriction that | 
 | 	 * no function will ever call notify_change with both ATTR_MODE and | 
 | 	 * ATTR_KILL_S*ID set. | 
 | 	 */ | 
 | 	if ((ia_valid & (ATTR_KILL_SUID|ATTR_KILL_SGID)) && | 
 | 	    (ia_valid & ATTR_MODE)) | 
 | 		BUG(); | 
 |  | 
 | 	if (ia_valid & ATTR_KILL_SUID) { | 
 | 		if (mode & S_ISUID) { | 
 | 			ia_valid = attr->ia_valid |= ATTR_MODE; | 
 | 			attr->ia_mode = (inode->i_mode & ~S_ISUID); | 
 | 		} | 
 | 	} | 
 | 	if (ia_valid & ATTR_KILL_SGID) { | 
 | 		if (mode & S_ISGID) { | 
 | 			if (!(ia_valid & ATTR_MODE)) { | 
 | 				ia_valid = attr->ia_valid |= ATTR_MODE; | 
 | 				attr->ia_mode = inode->i_mode; | 
 | 			} | 
 | 			attr->ia_mode &= ~S_ISGID; | 
 | 		} | 
 | 	} | 
 | 	if (!(attr->ia_valid & ~(ATTR_KILL_SUID | ATTR_KILL_SGID))) | 
 | 		return 0; | 
 |  | 
 | 	/* | 
 | 	 * Verify that uid/gid changes are valid in the target | 
 | 	 * namespace of the superblock. | 
 | 	 */ | 
 | 	if (ia_valid & ATTR_UID && | 
 | 	    !vfsuid_has_fsmapping(idmap, inode->i_sb->s_user_ns, | 
 | 				  attr->ia_vfsuid)) | 
 | 		return -EOVERFLOW; | 
 | 	if (ia_valid & ATTR_GID && | 
 | 	    !vfsgid_has_fsmapping(idmap, inode->i_sb->s_user_ns, | 
 | 				  attr->ia_vfsgid)) | 
 | 		return -EOVERFLOW; | 
 |  | 
 | 	/* Don't allow modifications of files with invalid uids or | 
 | 	 * gids unless those uids & gids are being made valid. | 
 | 	 */ | 
 | 	if (!(ia_valid & ATTR_UID) && | 
 | 	    !vfsuid_valid(i_uid_into_vfsuid(idmap, inode))) | 
 | 		return -EOVERFLOW; | 
 | 	if (!(ia_valid & ATTR_GID) && | 
 | 	    !vfsgid_valid(i_gid_into_vfsgid(idmap, inode))) | 
 | 		return -EOVERFLOW; | 
 |  | 
 | 	error = security_inode_setattr(idmap, dentry, attr); | 
 | 	if (error) | 
 | 		return error; | 
 | 	error = try_break_deleg(inode, delegated_inode); | 
 | 	if (error) | 
 | 		return error; | 
 |  | 
 | 	if (inode->i_op->setattr) | 
 | 		error = inode->i_op->setattr(idmap, dentry, attr); | 
 | 	else | 
 | 		error = simple_setattr(idmap, dentry, attr); | 
 |  | 
 | 	if (!error) { | 
 | 		fsnotify_change(dentry, ia_valid); | 
 | 		ima_inode_post_setattr(idmap, dentry); | 
 | 		evm_inode_post_setattr(dentry, ia_valid); | 
 | 	} | 
 |  | 
 | 	return error; | 
 | } | 
 | EXPORT_SYMBOL(notify_change); |