diff options
Diffstat (limited to 'fs/userfaultfd.c')
| -rw-r--r-- | fs/userfaultfd.c | 53 | 
1 files changed, 36 insertions, 17 deletions
diff --git a/fs/userfaultfd.c b/fs/userfaultfd.c index 60dcfafdc11a..eee7320ab0b0 100644 --- a/fs/userfaultfd.c +++ b/fs/userfaultfd.c @@ -31,6 +31,7 @@  #include <linux/hugetlb.h>  #include <linux/swapops.h>  #include <linux/miscdevice.h> +#include <linux/uio.h>  static int sysctl_unprivileged_userfaultfd __read_mostly; @@ -282,7 +283,7 @@ static inline bool userfaultfd_huge_must_wait(struct userfaultfd_ctx *ctx,  /*   * Verify the pagetables are still not ok after having reigstered into   * the fault_pending_wqh to avoid userland having to UFFDIO_WAKE any - * userfault that has already been resolved, if userfaultfd_read and + * userfault that has already been resolved, if userfaultfd_read_iter and   * UFFDIO_COPY|ZEROPAGE are being run simultaneously on two different   * threads.   */ @@ -657,7 +658,10 @@ int dup_userfaultfd(struct vm_area_struct *vma, struct list_head *fcs)  	struct userfaultfd_fork_ctx *fctx;  	octx = vma->vm_userfaultfd_ctx.ctx; -	if (!octx || !(octx->features & UFFD_FEATURE_EVENT_FORK)) { +	if (!octx) +		return 0; + +	if (!(octx->features & UFFD_FEATURE_EVENT_FORK)) {  		vma_start_write(vma);  		vma->vm_userfaultfd_ctx = NULL_VM_UFFD_CTX;  		userfaultfd_set_vm_flags(vma, vma->vm_flags & ~__VM_UFFD_FLAGS); @@ -895,6 +899,10 @@ static int userfaultfd_release(struct inode *inode, struct file *file)  			prev = vma;  			continue;  		} +		/* Reset ptes for the whole vma range if wr-protected */ +		if (userfaultfd_wp(vma)) +			uffd_wp_range(vma, vma->vm_start, +				      vma->vm_end - vma->vm_start, false);  		new_flags = vma->vm_flags & ~__VM_UFFD_FLAGS;  		vma = vma_modify_flags_uffd(&vmi, prev, vma, vma->vm_start,  					    vma->vm_end, new_flags, @@ -1177,34 +1185,34 @@ static ssize_t userfaultfd_ctx_read(struct userfaultfd_ctx *ctx, int no_wait,  	return ret;  } -static ssize_t userfaultfd_read(struct file *file, char __user *buf, -				size_t count, loff_t *ppos) +static ssize_t userfaultfd_read_iter(struct kiocb *iocb, struct iov_iter *to)  { +	struct file *file = iocb->ki_filp;  	struct userfaultfd_ctx *ctx = file->private_data;  	ssize_t _ret, ret = 0;  	struct uffd_msg msg; -	int no_wait = file->f_flags & O_NONBLOCK;  	struct inode *inode = file_inode(file); +	bool no_wait;  	if (!userfaultfd_is_initialized(ctx))  		return -EINVAL; +	no_wait = file->f_flags & O_NONBLOCK || iocb->ki_flags & IOCB_NOWAIT;  	for (;;) { -		if (count < sizeof(msg)) +		if (iov_iter_count(to) < sizeof(msg))  			return ret ? ret : -EINVAL;  		_ret = userfaultfd_ctx_read(ctx, no_wait, &msg, inode);  		if (_ret < 0)  			return ret ? ret : _ret; -		if (copy_to_user((__u64 __user *) buf, &msg, sizeof(msg))) +		_ret = !copy_to_iter_full(&msg, sizeof(msg), to); +		if (_ret)  			return ret ? ret : -EFAULT;  		ret += sizeof(msg); -		buf += sizeof(msg); -		count -= sizeof(msg);  		/*  		 * Allow to read more than one fault at time but only  		 * block if waiting for the very first one.  		 */ -		no_wait = O_NONBLOCK; +		no_wait = true;  	}  } @@ -2172,7 +2180,7 @@ static const struct file_operations userfaultfd_fops = {  #endif  	.release	= userfaultfd_release,  	.poll		= userfaultfd_poll, -	.read		= userfaultfd_read, +	.read_iter	= userfaultfd_read_iter,  	.unlocked_ioctl = userfaultfd_ioctl,  	.compat_ioctl	= compat_ptr_ioctl,  	.llseek		= noop_llseek, @@ -2192,6 +2200,7 @@ static void init_once_userfaultfd_ctx(void *mem)  static int new_userfaultfd(int flags)  {  	struct userfaultfd_ctx *ctx; +	struct file *file;  	int fd;  	BUG_ON(!current->mm); @@ -2215,16 +2224,26 @@ static int new_userfaultfd(int flags)  	init_rwsem(&ctx->map_changing_lock);  	atomic_set(&ctx->mmap_changing, 0);  	ctx->mm = current->mm; -	/* prevent the mm struct to be freed */ -	mmgrab(ctx->mm); + +	fd = get_unused_fd_flags(flags & UFFD_SHARED_FCNTL_FLAGS); +	if (fd < 0) +		goto err_out;  	/* Create a new inode so that the LSM can block the creation.  */ -	fd = anon_inode_create_getfd("[userfaultfd]", &userfaultfd_fops, ctx, +	file = anon_inode_create_getfile("[userfaultfd]", &userfaultfd_fops, ctx,  			O_RDONLY | (flags & UFFD_SHARED_FCNTL_FLAGS), NULL); -	if (fd < 0) { -		mmdrop(ctx->mm); -		kmem_cache_free(userfaultfd_ctx_cachep, ctx); +	if (IS_ERR(file)) { +		put_unused_fd(fd); +		fd = PTR_ERR(file); +		goto err_out;  	} +	/* prevent the mm struct to be freed */ +	mmgrab(ctx->mm); +	file->f_mode |= FMODE_NOWAIT; +	fd_install(fd, file); +	return fd; +err_out: +	kmem_cache_free(userfaultfd_ctx_cachep, ctx);  	return fd;  }  |