diff options
Diffstat (limited to 'ipc')
| -rw-r--r-- | ipc/mqueue.c | 252 | ||||
| -rw-r--r-- | ipc/msg.c | 20 | ||||
| -rw-r--r-- | ipc/sem.c | 10 | ||||
| -rw-r--r-- | ipc/shm.c | 20 | ||||
| -rw-r--r-- | ipc/util.c | 5 | 
5 files changed, 160 insertions, 147 deletions
| diff --git a/ipc/mqueue.c b/ipc/mqueue.c index 9649ecd8a73a..d7f309f74dec 100644 --- a/ipc/mqueue.c +++ b/ipc/mqueue.c @@ -270,13 +270,30 @@ static struct inode *mqueue_get_inode(struct super_block *sb,  		 * that means the min(mq_maxmsg, max_priorities) * struct  		 * posix_msg_tree_node.  		 */ + +		ret = -EINVAL; +		if (info->attr.mq_maxmsg <= 0 || info->attr.mq_msgsize <= 0) +			goto out_inode; +		if (capable(CAP_SYS_RESOURCE)) { +			if (info->attr.mq_maxmsg > HARD_MSGMAX || +			    info->attr.mq_msgsize > HARD_MSGSIZEMAX) +				goto out_inode; +		} else { +			if (info->attr.mq_maxmsg > ipc_ns->mq_msg_max || +					info->attr.mq_msgsize > ipc_ns->mq_msgsize_max) +				goto out_inode; +		} +		ret = -EOVERFLOW; +		/* check for overflow */ +		if (info->attr.mq_msgsize > ULONG_MAX/info->attr.mq_maxmsg) +			goto out_inode;  		mq_treesize = info->attr.mq_maxmsg * sizeof(struct msg_msg) +  			min_t(unsigned int, info->attr.mq_maxmsg, MQ_PRIO_MAX) *  			sizeof(struct posix_msg_tree_node); - -		mq_bytes = mq_treesize + (info->attr.mq_maxmsg * -					  info->attr.mq_msgsize); - +		mq_bytes = info->attr.mq_maxmsg * info->attr.mq_msgsize; +		if (mq_bytes + mq_treesize < mq_bytes) +			goto out_inode; +		mq_bytes += mq_treesize;  		spin_lock(&mq_lock);  		if (u->mq_bytes + mq_bytes < u->mq_bytes ||  		    u->mq_bytes + mq_bytes > rlimit(RLIMIT_MSGQUEUE)) { @@ -308,8 +325,9 @@ err:  static int mqueue_fill_super(struct super_block *sb, void *data, int silent)  {  	struct inode *inode; -	struct ipc_namespace *ns = sb->s_fs_info; +	struct ipc_namespace *ns = data; +	sb->s_fs_info = ns;  	sb->s_iflags |= SB_I_NOEXEC | SB_I_NODEV;  	sb->s_blocksize = PAGE_SIZE;  	sb->s_blocksize_bits = PAGE_SHIFT; @@ -326,18 +344,44 @@ static int mqueue_fill_super(struct super_block *sb, void *data, int silent)  	return 0;  } +static struct file_system_type mqueue_fs_type; +/* + * Return value is pinned only by reference in ->mq_mnt; it will + * live until ipcns dies.  Caller does not need to drop it. + */ +static struct vfsmount *mq_internal_mount(void) +{ +	struct ipc_namespace *ns = current->nsproxy->ipc_ns; +	struct vfsmount *m = ns->mq_mnt; +	if (m) +		return m; +	m = kern_mount_data(&mqueue_fs_type, ns); +	spin_lock(&mq_lock); +	if (unlikely(ns->mq_mnt)) { +		spin_unlock(&mq_lock); +		if (!IS_ERR(m)) +			kern_unmount(m); +		return ns->mq_mnt; +	} +	if (!IS_ERR(m)) +		ns->mq_mnt = m; +	spin_unlock(&mq_lock); +	return m; +} +  static struct dentry *mqueue_mount(struct file_system_type *fs_type,  			 int flags, const char *dev_name,  			 void *data)  { -	struct ipc_namespace *ns; -	if (flags & SB_KERNMOUNT) { -		ns = data; -		data = NULL; -	} else { -		ns = current->nsproxy->ipc_ns; -	} -	return mount_ns(fs_type, flags, data, ns, ns->user_ns, mqueue_fill_super); +	struct vfsmount *m; +	if (flags & SB_KERNMOUNT) +		return mount_nodev(fs_type, flags, data, mqueue_fill_super); +	m = mq_internal_mount(); +	if (IS_ERR(m)) +		return ERR_CAST(m); +	atomic_inc(&m->mnt_sb->s_active); +	down_write(&m->mnt_sb->s_umount); +	return dget(m->mnt_root);  }  static void init_once(void *foo) @@ -416,11 +460,11 @@ static void mqueue_evict_inode(struct inode *inode)  		put_ipc_ns(ipc_ns);  } -static int mqueue_create(struct inode *dir, struct dentry *dentry, -				umode_t mode, bool excl) +static int mqueue_create_attr(struct dentry *dentry, umode_t mode, void *arg)  { +	struct inode *dir = dentry->d_parent->d_inode;  	struct inode *inode; -	struct mq_attr *attr = dentry->d_fsdata; +	struct mq_attr *attr = arg;  	int error;  	struct ipc_namespace *ipc_ns; @@ -461,6 +505,12 @@ out_unlock:  	return error;  } +static int mqueue_create(struct inode *dir, struct dentry *dentry, +				umode_t mode, bool excl) +{ +	return mqueue_create_attr(dentry, mode, NULL); +} +  static int mqueue_unlink(struct inode *dir, struct dentry *dentry)  {  	struct inode *inode = d_inode(dentry); @@ -519,19 +569,19 @@ static int mqueue_flush_file(struct file *filp, fl_owner_t id)  	return 0;  } -static unsigned int mqueue_poll_file(struct file *filp, struct poll_table_struct *poll_tab) +static __poll_t mqueue_poll_file(struct file *filp, struct poll_table_struct *poll_tab)  {  	struct mqueue_inode_info *info = MQUEUE_I(file_inode(filp)); -	int retval = 0; +	__poll_t retval = 0;  	poll_wait(filp, &info->wait_q, poll_tab);  	spin_lock(&info->lock);  	if (info->attr.mq_curmsgs) -		retval = POLLIN | POLLRDNORM; +		retval = EPOLLIN | EPOLLRDNORM;  	if (info->attr.mq_curmsgs < info->attr.mq_maxmsg) -		retval |= POLLOUT | POLLWRNORM; +		retval |= EPOLLOUT | EPOLLWRNORM;  	spin_unlock(&info->lock);  	return retval; @@ -546,7 +596,7 @@ static void wq_add(struct mqueue_inode_info *info, int sr,  	ewp->task = current;  	list_for_each_entry(walk, &info->e_wait_q[sr].list, list) { -		if (walk->task->static_prio <= current->static_prio) { +		if (walk->task->prio <= current->prio) {  			list_add_tail(&ewp->list, &walk->list);  			return;  		} @@ -639,6 +689,7 @@ static void __do_notify(struct mqueue_inode_info *info)  		case SIGEV_SIGNAL:  			/* sends signal */ +			clear_siginfo(&sig_i);  			sig_i.si_signo = info->notify.sigev_signo;  			sig_i.si_errno = 0;  			sig_i.si_code = SI_MESGQ; @@ -690,96 +741,46 @@ static void remove_notification(struct mqueue_inode_info *info)  	info->notify_user_ns = NULL;  } -static int mq_attr_ok(struct ipc_namespace *ipc_ns, struct mq_attr *attr) -{ -	int mq_treesize; -	unsigned long total_size; - -	if (attr->mq_maxmsg <= 0 || attr->mq_msgsize <= 0) -		return -EINVAL; -	if (capable(CAP_SYS_RESOURCE)) { -		if (attr->mq_maxmsg > HARD_MSGMAX || -		    attr->mq_msgsize > HARD_MSGSIZEMAX) -			return -EINVAL; -	} else { -		if (attr->mq_maxmsg > ipc_ns->mq_msg_max || -				attr->mq_msgsize > ipc_ns->mq_msgsize_max) -			return -EINVAL; -	} -	/* check for overflow */ -	if (attr->mq_msgsize > ULONG_MAX/attr->mq_maxmsg) -		return -EOVERFLOW; -	mq_treesize = attr->mq_maxmsg * sizeof(struct msg_msg) + -		min_t(unsigned int, attr->mq_maxmsg, MQ_PRIO_MAX) * -		sizeof(struct posix_msg_tree_node); -	total_size = attr->mq_maxmsg * attr->mq_msgsize; -	if (total_size + mq_treesize < total_size) -		return -EOVERFLOW; -	return 0; -} - -/* - * Invoked when creating a new queue via sys_mq_open - */ -static struct file *do_create(struct ipc_namespace *ipc_ns, struct inode *dir, -			struct path *path, int oflag, umode_t mode, +static int prepare_open(struct dentry *dentry, int oflag, int ro, +			umode_t mode, struct filename *name,  			struct mq_attr *attr)  { -	const struct cred *cred = current_cred(); -	int ret; - -	if (attr) { -		ret = mq_attr_ok(ipc_ns, attr); -		if (ret) -			return ERR_PTR(ret); -		/* store for use during create */ -		path->dentry->d_fsdata = attr; -	} else { -		struct mq_attr def_attr; - -		def_attr.mq_maxmsg = min(ipc_ns->mq_msg_max, -					 ipc_ns->mq_msg_default); -		def_attr.mq_msgsize = min(ipc_ns->mq_msgsize_max, -					  ipc_ns->mq_msgsize_default); -		ret = mq_attr_ok(ipc_ns, &def_attr); -		if (ret) -			return ERR_PTR(ret); -	} - -	mode &= ~current_umask(); -	ret = vfs_create(dir, path->dentry, mode, true); -	path->dentry->d_fsdata = NULL; -	if (ret) -		return ERR_PTR(ret); -	return dentry_open(path, oflag, cred); -} - -/* Opens existing queue */ -static struct file *do_open(struct path *path, int oflag) -{  	static const int oflag2acc[O_ACCMODE] = { MAY_READ, MAY_WRITE,  						  MAY_READ | MAY_WRITE };  	int acc; + +	if (d_really_is_negative(dentry)) { +		if (!(oflag & O_CREAT)) +			return -ENOENT; +		if (ro) +			return ro; +		audit_inode_parent_hidden(name, dentry->d_parent); +		return vfs_mkobj(dentry, mode & ~current_umask(), +				  mqueue_create_attr, attr); +	} +	/* it already existed */ +	audit_inode(name, dentry, 0); +	if ((oflag & (O_CREAT|O_EXCL)) == (O_CREAT|O_EXCL)) +		return -EEXIST;  	if ((oflag & O_ACCMODE) == (O_RDWR | O_WRONLY)) -		return ERR_PTR(-EINVAL); +		return -EINVAL;  	acc = oflag2acc[oflag & O_ACCMODE]; -	if (inode_permission(d_inode(path->dentry), acc)) -		return ERR_PTR(-EACCES); -	return dentry_open(path, oflag, current_cred()); +	return inode_permission(d_inode(dentry), acc);  }  static int do_mq_open(const char __user *u_name, int oflag, umode_t mode,  		      struct mq_attr *attr)  { -	struct path path; -	struct file *filp; +	struct vfsmount *mnt = mq_internal_mount(); +	struct dentry *root;  	struct filename *name; +	struct path path;  	int fd, error; -	struct ipc_namespace *ipc_ns = current->nsproxy->ipc_ns; -	struct vfsmount *mnt = ipc_ns->mq_mnt; -	struct dentry *root = mnt->mnt_root;  	int ro; +	if (IS_ERR(mnt)) +		return PTR_ERR(mnt); +  	audit_mq_open(oflag, mode, attr);  	if (IS_ERR(name = getname(u_name))) @@ -790,7 +791,7 @@ static int do_mq_open(const char __user *u_name, int oflag, umode_t mode,  		goto out_putname;  	ro = mnt_want_write(mnt);	/* we'll drop it in any case */ -	error = 0; +	root = mnt->mnt_root;  	inode_lock(d_inode(root));  	path.dentry = lookup_one_len(name->name, root, strlen(name->name));  	if (IS_ERR(path.dentry)) { @@ -798,38 +799,14 @@ static int do_mq_open(const char __user *u_name, int oflag, umode_t mode,  		goto out_putfd;  	}  	path.mnt = mntget(mnt); - -	if (oflag & O_CREAT) { -		if (d_really_is_positive(path.dentry)) {	/* entry already exists */ -			audit_inode(name, path.dentry, 0); -			if (oflag & O_EXCL) { -				error = -EEXIST; -				goto out; -			} -			filp = do_open(&path, oflag); -		} else { -			if (ro) { -				error = ro; -				goto out; -			} -			audit_inode_parent_hidden(name, root); -			filp = do_create(ipc_ns, d_inode(root), &path, -					 oflag, mode, attr); -		} -	} else { -		if (d_really_is_negative(path.dentry)) { -			error = -ENOENT; -			goto out; -		} -		audit_inode(name, path.dentry, 0); -		filp = do_open(&path, oflag); +	error = prepare_open(path.dentry, oflag, ro, mode, name, attr); +	if (!error) { +		struct file *file = dentry_open(&path, oflag, current_cred()); +		if (!IS_ERR(file)) +			fd_install(fd, file); +		else +			error = PTR_ERR(file);  	} - -	if (!IS_ERR(filp)) -		fd_install(fd, filp); -	else -		error = PTR_ERR(filp); -out:  	path_put(&path);  out_putfd:  	if (error) { @@ -863,6 +840,9 @@ SYSCALL_DEFINE1(mq_unlink, const char __user *, u_name)  	struct ipc_namespace *ipc_ns = current->nsproxy->ipc_ns;  	struct vfsmount *mnt = ipc_ns->mq_mnt; +	if (!mnt) +		return -ENOENT; +  	name = getname(u_name);  	if (IS_ERR(name))  		return PTR_ERR(name); @@ -1589,28 +1569,26 @@ int mq_init_ns(struct ipc_namespace *ns)  	ns->mq_msgsize_max   = DFLT_MSGSIZEMAX;  	ns->mq_msg_default   = DFLT_MSG;  	ns->mq_msgsize_default  = DFLT_MSGSIZE; +	ns->mq_mnt = NULL; -	ns->mq_mnt = kern_mount_data(&mqueue_fs_type, ns); -	if (IS_ERR(ns->mq_mnt)) { -		int err = PTR_ERR(ns->mq_mnt); -		ns->mq_mnt = NULL; -		return err; -	}  	return 0;  }  void mq_clear_sbinfo(struct ipc_namespace *ns)  { -	ns->mq_mnt->mnt_sb->s_fs_info = NULL; +	if (ns->mq_mnt) +		ns->mq_mnt->mnt_sb->s_fs_info = NULL;  }  void mq_put_mnt(struct ipc_namespace *ns)  { -	kern_unmount(ns->mq_mnt); +	if (ns->mq_mnt) +		kern_unmount(ns->mq_mnt);  }  static int __init init_mqueue_fs(void)  { +	struct vfsmount *m;  	int error;  	mqueue_inode_cachep = kmem_cache_create("mqueue_inode_cache", @@ -1632,6 +1610,10 @@ static int __init init_mqueue_fs(void)  	if (error)  		goto out_filesystem; +	m = kern_mount_data(&mqueue_fs_type, &init_ipc_ns); +	if (IS_ERR(m)) +		goto out_filesystem; +	init_ipc_ns.mq_mnt = m;  	return 0;  out_filesystem: diff --git a/ipc/msg.c b/ipc/msg.c index 1bbc029d2b17..0dcc6699dc53 100644 --- a/ipc/msg.c +++ b/ipc/msg.c @@ -476,9 +476,9 @@ static int msgctl_info(struct ipc_namespace *ns, int msqid,  static int msgctl_stat(struct ipc_namespace *ns, int msqid,  			 int cmd, struct msqid64_ds *p)  { -	int err;  	struct msg_queue *msq; -	int success_return; +	int id = 0; +	int err;  	memset(p, 0, sizeof(*p)); @@ -489,14 +489,13 @@ static int msgctl_stat(struct ipc_namespace *ns, int msqid,  			err = PTR_ERR(msq);  			goto out_unlock;  		} -		success_return = msq->q_perm.id; +		id = msq->q_perm.id;  	} else {  		msq = msq_obtain_object_check(ns, msqid);  		if (IS_ERR(msq)) {  			err = PTR_ERR(msq);  			goto out_unlock;  		} -		success_return = 0;  	}  	err = -EACCES; @@ -507,6 +506,14 @@ static int msgctl_stat(struct ipc_namespace *ns, int msqid,  	if (err)  		goto out_unlock; +	ipc_lock_object(&msq->q_perm); + +	if (!ipc_valid_object(&msq->q_perm)) { +		ipc_unlock_object(&msq->q_perm); +		err = -EIDRM; +		goto out_unlock; +	} +  	kernel_to_ipc64_perm(&msq->q_perm, &p->msg_perm);  	p->msg_stime  = msq->q_stime;  	p->msg_rtime  = msq->q_rtime; @@ -516,9 +523,10 @@ static int msgctl_stat(struct ipc_namespace *ns, int msqid,  	p->msg_qbytes = msq->q_qbytes;  	p->msg_lspid  = msq->q_lspid;  	p->msg_lrpid  = msq->q_lrpid; -	rcu_read_unlock(); -	return success_return; +	ipc_unlock_object(&msq->q_perm); +	rcu_read_unlock(); +	return id;  out_unlock:  	rcu_read_unlock(); diff --git a/ipc/sem.c b/ipc/sem.c index 87bd38f38dc3..a4af04979fd2 100644 --- a/ipc/sem.c +++ b/ipc/sem.c @@ -1213,10 +1213,20 @@ static int semctl_stat(struct ipc_namespace *ns, int semid,  	if (err)  		goto out_unlock; +	ipc_lock_object(&sma->sem_perm); + +	if (!ipc_valid_object(&sma->sem_perm)) { +		ipc_unlock_object(&sma->sem_perm); +		err = -EIDRM; +		goto out_unlock; +	} +  	kernel_to_ipc64_perm(&sma->sem_perm, &semid64->sem_perm);  	semid64->sem_otime = get_semotime(sma);  	semid64->sem_ctime = sma->sem_ctime;  	semid64->sem_nsems = sma->sem_nsems; + +	ipc_unlock_object(&sma->sem_perm);  	rcu_read_unlock();  	return id; diff --git a/ipc/shm.c b/ipc/shm.c index 7acda23430aa..4643865e9171 100644 --- a/ipc/shm.c +++ b/ipc/shm.c @@ -909,9 +909,11 @@ static int shmctl_stat(struct ipc_namespace *ns, int shmid,  			int cmd, struct shmid64_ds *tbuf)  {  	struct shmid_kernel *shp; -	int result; +	int id = 0;  	int err; +	memset(tbuf, 0, sizeof(*tbuf)); +  	rcu_read_lock();  	if (cmd == SHM_STAT) {  		shp = shm_obtain_object(ns, shmid); @@ -919,14 +921,13 @@ static int shmctl_stat(struct ipc_namespace *ns, int shmid,  			err = PTR_ERR(shp);  			goto out_unlock;  		} -		result = shp->shm_perm.id; +		id = shp->shm_perm.id;  	} else {  		shp = shm_obtain_object_check(ns, shmid);  		if (IS_ERR(shp)) {  			err = PTR_ERR(shp);  			goto out_unlock;  		} -		result = 0;  	}  	err = -EACCES; @@ -937,7 +938,14 @@ static int shmctl_stat(struct ipc_namespace *ns, int shmid,  	if (err)  		goto out_unlock; -	memset(tbuf, 0, sizeof(*tbuf)); +	ipc_lock_object(&shp->shm_perm); + +	if (!ipc_valid_object(&shp->shm_perm)) { +		ipc_unlock_object(&shp->shm_perm); +		err = -EIDRM; +		goto out_unlock; +	} +  	kernel_to_ipc64_perm(&shp->shm_perm, &tbuf->shm_perm);  	tbuf->shm_segsz	= shp->shm_segsz;  	tbuf->shm_atime	= shp->shm_atim; @@ -946,8 +954,10 @@ static int shmctl_stat(struct ipc_namespace *ns, int shmid,  	tbuf->shm_cpid	= shp->shm_cprid;  	tbuf->shm_lpid	= shp->shm_lprid;  	tbuf->shm_nattch = shp->shm_nattch; + +	ipc_unlock_object(&shp->shm_perm);  	rcu_read_unlock(); -	return result; +	return id;  out_unlock:  	rcu_read_unlock(); diff --git a/ipc/util.c b/ipc/util.c index ff045fec8d83..4ed5a17dd06f 100644 --- a/ipc/util.c +++ b/ipc/util.c @@ -23,9 +23,12 @@   *	    tree.   *	    - perform initial checks (capabilities, auditing and permission,   *	      etc). - *	    - perform read-only operations, such as STAT, INFO commands. + *	    - perform read-only operations, such as INFO command, that + *	      do not demand atomicity   *	      acquire the ipc lock (kern_ipc_perm.lock) through   *	      ipc_lock_object() + *		- perform read-only operations that demand atomicity, + *		  such as STAT command.   *		- perform data updates, such as SET, RMID commands and   *		  mechanism-specific operations (semop/semtimedop,   *		  msgsnd/msgrcv, shmat/shmdt). |