diff options
Diffstat (limited to 'fs/sysfs')
| -rw-r--r-- | fs/sysfs/Makefile | 2 | ||||
| -rw-r--r-- | fs/sysfs/dir.c | 1075 | ||||
| -rw-r--r-- | fs/sysfs/file.c | 963 | ||||
| -rw-r--r-- | fs/sysfs/group.c | 102 | ||||
| -rw-r--r-- | fs/sysfs/inode.c | 331 | ||||
| -rw-r--r-- | fs/sysfs/mount.c | 184 | ||||
| -rw-r--r-- | fs/sysfs/symlink.c | 219 | ||||
| -rw-r--r-- | fs/sysfs/sysfs.h | 236 | 
8 files changed, 351 insertions, 2761 deletions
| diff --git a/fs/sysfs/Makefile b/fs/sysfs/Makefile index 8876ac183373..6eff6e1205a5 100644 --- a/fs/sysfs/Makefile +++ b/fs/sysfs/Makefile @@ -2,4 +2,4 @@  # Makefile for the sysfs virtual filesystem  # -obj-y		:= inode.o file.o dir.o symlink.o mount.o group.o +obj-y		:= file.o dir.o symlink.o mount.o group.o diff --git a/fs/sysfs/dir.c b/fs/sysfs/dir.c index 5e73d6626e50..ee0d761c3179 100644 --- a/fs/sysfs/dir.c +++ b/fs/sysfs/dir.c @@ -13,465 +13,31 @@  #undef DEBUG  #include <linux/fs.h> -#include <linux/mount.h> -#include <linux/module.h>  #include <linux/kobject.h> -#include <linux/namei.h> -#include <linux/idr.h> -#include <linux/completion.h> -#include <linux/mutex.h>  #include <linux/slab.h> -#include <linux/security.h> -#include <linux/hash.h>  #include "sysfs.h" -DEFINE_MUTEX(sysfs_mutex);  DEFINE_SPINLOCK(sysfs_symlink_target_lock); -#define to_sysfs_dirent(X) rb_entry((X), struct sysfs_dirent, s_rb) - -static DEFINE_SPINLOCK(sysfs_ino_lock); -static DEFINE_IDA(sysfs_ino_ida); - -/** - *	sysfs_name_hash - *	@name: Null terminated string to hash - *	@ns:   Namespace tag to hash - * - *	Returns 31 bit hash of ns + name (so it fits in an off_t ) - */ -static unsigned int sysfs_name_hash(const char *name, const void *ns) -{ -	unsigned long hash = init_name_hash(); -	unsigned int len = strlen(name); -	while (len--) -		hash = partial_name_hash(*name++, hash); -	hash = (end_name_hash(hash) ^ hash_ptr((void *)ns, 31)); -	hash &= 0x7fffffffU; -	/* Reserve hash numbers 0, 1 and INT_MAX for magic directory entries */ -	if (hash < 1) -		hash += 2; -	if (hash >= INT_MAX) -		hash = INT_MAX - 1; -	return hash; -} - -static int sysfs_name_compare(unsigned int hash, const char *name, -			      const void *ns, const struct sysfs_dirent *sd) -{ -	if (hash != sd->s_hash) -		return hash - sd->s_hash; -	if (ns != sd->s_ns) -		return ns - sd->s_ns; -	return strcmp(name, sd->s_name); -} - -static int sysfs_sd_compare(const struct sysfs_dirent *left, -			    const struct sysfs_dirent *right) -{ -	return sysfs_name_compare(left->s_hash, left->s_name, left->s_ns, -				  right); -} - -/** - *	sysfs_link_sibling - link sysfs_dirent into sibling rbtree - *	@sd: sysfs_dirent of interest - * - *	Link @sd into its sibling rbtree which starts from - *	sd->s_parent->s_dir.children. - * - *	Locking: - *	mutex_lock(sysfs_mutex) - * - *	RETURNS: - *	0 on susccess -EEXIST on failure. - */ -static int sysfs_link_sibling(struct sysfs_dirent *sd) -{ -	struct rb_node **node = &sd->s_parent->s_dir.children.rb_node; -	struct rb_node *parent = NULL; - -	if (sysfs_type(sd) == SYSFS_DIR) -		sd->s_parent->s_dir.subdirs++; - -	while (*node) { -		struct sysfs_dirent *pos; -		int result; - -		pos = to_sysfs_dirent(*node); -		parent = *node; -		result = sysfs_sd_compare(sd, pos); -		if (result < 0) -			node = &pos->s_rb.rb_left; -		else if (result > 0) -			node = &pos->s_rb.rb_right; -		else -			return -EEXIST; -	} -	/* add new node and rebalance the tree */ -	rb_link_node(&sd->s_rb, parent, node); -	rb_insert_color(&sd->s_rb, &sd->s_parent->s_dir.children); -	return 0; -} - -/** - *	sysfs_unlink_sibling - unlink sysfs_dirent from sibling rbtree - *	@sd: sysfs_dirent of interest - * - *	Unlink @sd from its sibling rbtree which starts from - *	sd->s_parent->s_dir.children. - * - *	Locking: - *	mutex_lock(sysfs_mutex) - */ -static void sysfs_unlink_sibling(struct sysfs_dirent *sd) -{ -	if (sysfs_type(sd) == SYSFS_DIR) -		sd->s_parent->s_dir.subdirs--; - -	rb_erase(&sd->s_rb, &sd->s_parent->s_dir.children); -} - -/** - *	sysfs_get_active - get an active reference to sysfs_dirent - *	@sd: sysfs_dirent to get an active reference to - * - *	Get an active reference of @sd.  This function is noop if @sd - *	is NULL. - * - *	RETURNS: - *	Pointer to @sd on success, NULL on failure. - */ -struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd) -{ -	if (unlikely(!sd)) -		return NULL; - -	if (!atomic_inc_unless_negative(&sd->s_active)) -		return NULL; - -	if (likely(!sysfs_ignore_lockdep(sd))) -		rwsem_acquire_read(&sd->dep_map, 0, 1, _RET_IP_); -	return sd; -} - -/** - *	sysfs_put_active - put an active reference to sysfs_dirent - *	@sd: sysfs_dirent to put an active reference to - * - *	Put an active reference to @sd.  This function is noop if @sd - *	is NULL. - */ -void sysfs_put_active(struct sysfs_dirent *sd) -{ -	int v; - -	if (unlikely(!sd)) -		return; - -	if (likely(!sysfs_ignore_lockdep(sd))) -		rwsem_release(&sd->dep_map, 1, _RET_IP_); -	v = atomic_dec_return(&sd->s_active); -	if (likely(v != SD_DEACTIVATED_BIAS)) -		return; - -	/* atomic_dec_return() is a mb(), we'll always see the updated -	 * sd->u.completion. -	 */ -	complete(sd->u.completion); -} - -/** - *	sysfs_deactivate - deactivate sysfs_dirent - *	@sd: sysfs_dirent to deactivate - * - *	Deny new active references and drain existing ones. - */ -static void sysfs_deactivate(struct sysfs_dirent *sd) -{ -	DECLARE_COMPLETION_ONSTACK(wait); -	int v; - -	BUG_ON(!(sd->s_flags & SYSFS_FLAG_REMOVED)); - -	if (!(sysfs_type(sd) & SYSFS_ACTIVE_REF)) -		return; - -	sd->u.completion = (void *)&wait; - -	rwsem_acquire(&sd->dep_map, 0, 0, _RET_IP_); -	/* atomic_add_return() is a mb(), put_active() will always see -	 * the updated sd->u.completion. -	 */ -	v = atomic_add_return(SD_DEACTIVATED_BIAS, &sd->s_active); - -	if (v != SD_DEACTIVATED_BIAS) { -		lock_contended(&sd->dep_map, _RET_IP_); -		wait_for_completion(&wait); -	} - -	lock_acquired(&sd->dep_map, _RET_IP_); -	rwsem_release(&sd->dep_map, 1, _RET_IP_); -} - -static int sysfs_alloc_ino(unsigned int *pino) -{ -	int ino, rc; - - retry: -	spin_lock(&sysfs_ino_lock); -	rc = ida_get_new_above(&sysfs_ino_ida, 2, &ino); -	spin_unlock(&sysfs_ino_lock); - -	if (rc == -EAGAIN) { -		if (ida_pre_get(&sysfs_ino_ida, GFP_KERNEL)) -			goto retry; -		rc = -ENOMEM; -	} - -	*pino = ino; -	return rc; -} - -static void sysfs_free_ino(unsigned int ino) -{ -	spin_lock(&sysfs_ino_lock); -	ida_remove(&sysfs_ino_ida, ino); -	spin_unlock(&sysfs_ino_lock); -} - -void release_sysfs_dirent(struct sysfs_dirent *sd) -{ -	struct sysfs_dirent *parent_sd; - - repeat: -	/* Moving/renaming is always done while holding reference. -	 * sd->s_parent won't change beneath us. -	 */ -	parent_sd = sd->s_parent; - -	WARN(!(sd->s_flags & SYSFS_FLAG_REMOVED), -		"sysfs: free using entry: %s/%s\n", -		parent_sd ? parent_sd->s_name : "", sd->s_name); - -	if (sysfs_type(sd) == SYSFS_KOBJ_LINK) -		sysfs_put(sd->s_symlink.target_sd); -	if (sysfs_type(sd) & SYSFS_COPY_NAME) -		kfree(sd->s_name); -	if (sd->s_iattr && sd->s_iattr->ia_secdata) -		security_release_secctx(sd->s_iattr->ia_secdata, -					sd->s_iattr->ia_secdata_len); -	kfree(sd->s_iattr); -	sysfs_free_ino(sd->s_ino); -	kmem_cache_free(sysfs_dir_cachep, sd); - -	sd = parent_sd; -	if (sd && atomic_dec_and_test(&sd->s_count)) -		goto repeat; -} - -static int sysfs_dentry_delete(const struct dentry *dentry) -{ -	struct sysfs_dirent *sd = dentry->d_fsdata; -	return !(sd && !(sd->s_flags & SYSFS_FLAG_REMOVED)); -} - -static int sysfs_dentry_revalidate(struct dentry *dentry, unsigned int flags) -{ -	struct sysfs_dirent *sd; -	int type; - -	if (flags & LOOKUP_RCU) -		return -ECHILD; - -	sd = dentry->d_fsdata; -	mutex_lock(&sysfs_mutex); - -	/* The sysfs dirent has been deleted */ -	if (sd->s_flags & SYSFS_FLAG_REMOVED) -		goto out_bad; - -	/* The sysfs dirent has been moved? */ -	if (dentry->d_parent->d_fsdata != sd->s_parent) -		goto out_bad; - -	/* The sysfs dirent has been renamed */ -	if (strcmp(dentry->d_name.name, sd->s_name) != 0) -		goto out_bad; - -	/* The sysfs dirent has been moved to a different namespace */ -	type = KOBJ_NS_TYPE_NONE; -	if (sd->s_parent) { -		type = sysfs_ns_type(sd->s_parent); -		if (type != KOBJ_NS_TYPE_NONE && -				sysfs_info(dentry->d_sb)->ns[type] != sd->s_ns) -			goto out_bad; -	} - -	mutex_unlock(&sysfs_mutex); -out_valid: -	return 1; -out_bad: -	/* Remove the dentry from the dcache hashes. -	 * If this is a deleted dentry we use d_drop instead of d_delete -	 * so sysfs doesn't need to cope with negative dentries. -	 * -	 * If this is a dentry that has simply been renamed we -	 * use d_drop to remove it from the dcache lookup on its -	 * old parent.  If this dentry persists later when a lookup -	 * is performed at its new name the dentry will be readded -	 * to the dcache hashes. -	 */ -	mutex_unlock(&sysfs_mutex); - -	/* If we have submounts we must allow the vfs caches -	 * to lie about the state of the filesystem to prevent -	 * leaks and other nasty things. -	 */ -	if (check_submounts_and_drop(dentry) != 0) -		goto out_valid; - -	return 0; -} - -static void sysfs_dentry_release(struct dentry *dentry) -{ -	sysfs_put(dentry->d_fsdata); -} - -const struct dentry_operations sysfs_dentry_ops = { -	.d_revalidate	= sysfs_dentry_revalidate, -	.d_delete	= sysfs_dentry_delete, -	.d_release	= sysfs_dentry_release, -}; - -struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type) -{ -	char *dup_name = NULL; -	struct sysfs_dirent *sd; - -	if (type & SYSFS_COPY_NAME) { -		name = dup_name = kstrdup(name, GFP_KERNEL); -		if (!name) -			return NULL; -	} - -	sd = kmem_cache_zalloc(sysfs_dir_cachep, GFP_KERNEL); -	if (!sd) -		goto err_out1; - -	if (sysfs_alloc_ino(&sd->s_ino)) -		goto err_out2; - -	atomic_set(&sd->s_count, 1); -	atomic_set(&sd->s_active, 0); - -	sd->s_name = name; -	sd->s_mode = mode; -	sd->s_flags = type | SYSFS_FLAG_REMOVED; - -	return sd; - - err_out2: -	kmem_cache_free(sysfs_dir_cachep, sd); - err_out1: -	kfree(dup_name); -	return NULL; -} - -/** - *	sysfs_addrm_start - prepare for sysfs_dirent add/remove - *	@acxt: pointer to sysfs_addrm_cxt to be used - * - *	This function is called when the caller is about to add or remove - *	sysfs_dirent.  This function acquires sysfs_mutex.  @acxt is used - *	to keep and pass context to other addrm functions. - * - *	LOCKING: - *	Kernel thread context (may sleep).  sysfs_mutex is locked on - *	return. - */ -void sysfs_addrm_start(struct sysfs_addrm_cxt *acxt) -	__acquires(sysfs_mutex) -{ -	memset(acxt, 0, sizeof(*acxt)); - -	mutex_lock(&sysfs_mutex); -} - -/** - *	__sysfs_add_one - add sysfs_dirent to parent without warning - *	@acxt: addrm context to use - *	@sd: sysfs_dirent to be added - *	@parent_sd: the parent sysfs_dirent to add @sd to - * - *	Get @parent_sd and set @sd->s_parent to it and increment nlink of - *	the parent inode if @sd is a directory and link into the children - *	list of the parent. - * - *	This function should be called between calls to - *	sysfs_addrm_start() and sysfs_addrm_finish() and should be - *	passed the same @acxt as passed to sysfs_addrm_start(). - * - *	LOCKING: - *	Determined by sysfs_addrm_start(). - * - *	RETURNS: - *	0 on success, -EEXIST if entry with the given name already - *	exists. - */ -int __sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, -		    struct sysfs_dirent *parent_sd) -{ -	struct sysfs_inode_attrs *ps_iattr; -	int ret; - -	if (!!sysfs_ns_type(parent_sd) != !!sd->s_ns) { -		WARN(1, KERN_WARNING "sysfs: ns %s in '%s' for '%s'\n", -			sysfs_ns_type(parent_sd) ? "required" : "invalid", -			parent_sd->s_name, sd->s_name); -		return -EINVAL; -	} - -	sd->s_hash = sysfs_name_hash(sd->s_name, sd->s_ns); -	sd->s_parent = sysfs_get(parent_sd); - -	ret = sysfs_link_sibling(sd); -	if (ret) -		return ret; - -	/* Update timestamps on the parent */ -	ps_iattr = parent_sd->s_iattr; -	if (ps_iattr) { -		struct iattr *ps_iattrs = &ps_iattr->ia_iattr; -		ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME; -	} - -	/* Mark the entry added into directory tree */ -	sd->s_flags &= ~SYSFS_FLAG_REMOVED; - -	return 0; -} -  /**   *	sysfs_pathname - return full path to sysfs dirent - *	@sd: sysfs_dirent whose path we want + *	@kn: kernfs_node whose path we want   *	@path: caller allocated buffer of size PATH_MAX   *   *	Gives the name "/" to the sysfs_root entry; any path returned   *	is relative to wherever sysfs is mounted.   */ -static char *sysfs_pathname(struct sysfs_dirent *sd, char *path) +static char *sysfs_pathname(struct kernfs_node *kn, char *path)  { -	if (sd->s_parent) { -		sysfs_pathname(sd->s_parent, path); +	if (kn->parent) { +		sysfs_pathname(kn->parent, path);  		strlcat(path, "/", PATH_MAX);  	} -	strlcat(path, sd->s_name, PATH_MAX); +	strlcat(path, kn->name, PATH_MAX);  	return path;  } -void sysfs_warn_dup(struct sysfs_dirent *parent, const char *name) +void sysfs_warn_dup(struct kernfs_node *parent, const char *name)  {  	char *path; @@ -489,445 +55,34 @@ void sysfs_warn_dup(struct sysfs_dirent *parent, const char *name)  }  /** - *	sysfs_add_one - add sysfs_dirent to parent - *	@acxt: addrm context to use - *	@sd: sysfs_dirent to be added - *	@parent_sd: the parent sysfs_dirent to add @sd to - * - *	Get @parent_sd and set @sd->s_parent to it and increment nlink of - *	the parent inode if @sd is a directory and link into the children - *	list of the parent. - * - *	This function should be called between calls to - *	sysfs_addrm_start() and sysfs_addrm_finish() and should be - *	passed the same @acxt as passed to sysfs_addrm_start(). - * - *	LOCKING: - *	Determined by sysfs_addrm_start(). - * - *	RETURNS: - *	0 on success, -EEXIST if entry with the given name already - *	exists. - */ -int sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, -		  struct sysfs_dirent *parent_sd) -{ -	int ret; - -	ret = __sysfs_add_one(acxt, sd, parent_sd); - -	if (ret == -EEXIST) -		sysfs_warn_dup(parent_sd, sd->s_name); -	return ret; -} - -/** - *	sysfs_remove_one - remove sysfs_dirent from parent - *	@acxt: addrm context to use - *	@sd: sysfs_dirent to be removed - * - *	Mark @sd removed and drop nlink of parent inode if @sd is a - *	directory.  @sd is unlinked from the children list. - * - *	This function should be called between calls to - *	sysfs_addrm_start() and sysfs_addrm_finish() and should be - *	passed the same @acxt as passed to sysfs_addrm_start(). - * - *	LOCKING: - *	Determined by sysfs_addrm_start(). - */ -static void sysfs_remove_one(struct sysfs_addrm_cxt *acxt, -			     struct sysfs_dirent *sd) -{ -	struct sysfs_inode_attrs *ps_iattr; - -	/* -	 * Removal can be called multiple times on the same node.  Only the -	 * first invocation is effective and puts the base ref. -	 */ -	if (sd->s_flags & SYSFS_FLAG_REMOVED) -		return; - -	sysfs_unlink_sibling(sd); - -	/* Update timestamps on the parent */ -	ps_iattr = sd->s_parent->s_iattr; -	if (ps_iattr) { -		struct iattr *ps_iattrs = &ps_iattr->ia_iattr; -		ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME; -	} - -	sd->s_flags |= SYSFS_FLAG_REMOVED; -	sd->u.removed_list = acxt->removed; -	acxt->removed = sd; -} - -/** - *	sysfs_addrm_finish - finish up sysfs_dirent add/remove - *	@acxt: addrm context to finish up - * - *	Finish up sysfs_dirent add/remove.  Resources acquired by - *	sysfs_addrm_start() are released and removed sysfs_dirents are - *	cleaned up. - * - *	LOCKING: - *	sysfs_mutex is released. - */ -void sysfs_addrm_finish(struct sysfs_addrm_cxt *acxt) -	__releases(sysfs_mutex) -{ -	/* release resources acquired by sysfs_addrm_start() */ -	mutex_unlock(&sysfs_mutex); - -	/* kill removed sysfs_dirents */ -	while (acxt->removed) { -		struct sysfs_dirent *sd = acxt->removed; - -		acxt->removed = sd->u.removed_list; - -		sysfs_deactivate(sd); -		sysfs_unmap_bin_file(sd); -		sysfs_put(sd); -	} -} - -/** - *	sysfs_find_dirent - find sysfs_dirent with the given name - *	@parent_sd: sysfs_dirent to search under - *	@name: name to look for - *	@ns: the namespace tag to use - * - *	Look for sysfs_dirent with name @name under @parent_sd. - * - *	LOCKING: - *	mutex_lock(sysfs_mutex) - * - *	RETURNS: - *	Pointer to sysfs_dirent if found, NULL if not. - */ -struct sysfs_dirent *sysfs_find_dirent(struct sysfs_dirent *parent_sd, -				       const unsigned char *name, -				       const void *ns) -{ -	struct rb_node *node = parent_sd->s_dir.children.rb_node; -	unsigned int hash; - -	if (!!sysfs_ns_type(parent_sd) != !!ns) { -		WARN(1, KERN_WARNING "sysfs: ns %s in '%s' for '%s'\n", -			sysfs_ns_type(parent_sd) ? "required" : "invalid", -			parent_sd->s_name, name); -		return NULL; -	} - -	hash = sysfs_name_hash(name, ns); -	while (node) { -		struct sysfs_dirent *sd; -		int result; - -		sd = to_sysfs_dirent(node); -		result = sysfs_name_compare(hash, name, ns, sd); -		if (result < 0) -			node = node->rb_left; -		else if (result > 0) -			node = node->rb_right; -		else -			return sd; -	} -	return NULL; -} - -/** - *	sysfs_get_dirent_ns - find and get sysfs_dirent with the given name - *	@parent_sd: sysfs_dirent to search under - *	@name: name to look for - *	@ns: the namespace tag to use - * - *	Look for sysfs_dirent with name @name under @parent_sd and get - *	it if found. - * - *	LOCKING: - *	Kernel thread context (may sleep).  Grabs sysfs_mutex. - * - *	RETURNS: - *	Pointer to sysfs_dirent if found, NULL if not. - */ -struct sysfs_dirent *sysfs_get_dirent_ns(struct sysfs_dirent *parent_sd, -					 const unsigned char *name, -					 const void *ns) -{ -	struct sysfs_dirent *sd; - -	mutex_lock(&sysfs_mutex); -	sd = sysfs_find_dirent(parent_sd, name, ns); -	sysfs_get(sd); -	mutex_unlock(&sysfs_mutex); - -	return sd; -} -EXPORT_SYMBOL_GPL(sysfs_get_dirent_ns); - -static int create_dir(struct kobject *kobj, struct sysfs_dirent *parent_sd, -		      enum kobj_ns_type type, -		      const char *name, const void *ns, -		      struct sysfs_dirent **p_sd) -{ -	umode_t mode = S_IFDIR | S_IRWXU | S_IRUGO | S_IXUGO; -	struct sysfs_addrm_cxt acxt; -	struct sysfs_dirent *sd; -	int rc; - -	/* allocate */ -	sd = sysfs_new_dirent(name, mode, SYSFS_DIR); -	if (!sd) -		return -ENOMEM; - -	sd->s_flags |= (type << SYSFS_NS_TYPE_SHIFT); -	sd->s_ns = ns; -	sd->s_dir.kobj = kobj; - -	/* link in */ -	sysfs_addrm_start(&acxt); -	rc = sysfs_add_one(&acxt, sd, parent_sd); -	sysfs_addrm_finish(&acxt); - -	if (rc == 0) -		*p_sd = sd; -	else -		sysfs_put(sd); - -	return rc; -} - -int sysfs_create_subdir(struct kobject *kobj, const char *name, -			struct sysfs_dirent **p_sd) -{ -	return create_dir(kobj, kobj->sd, -			  KOBJ_NS_TYPE_NONE, name, NULL, p_sd); -} - -/** - *	sysfs_read_ns_type: return associated ns_type - *	@kobj: the kobject being queried - * - *	Each kobject can be tagged with exactly one namespace type - *	(i.e. network or user).  Return the ns_type associated with - *	this object if any - */ -static enum kobj_ns_type sysfs_read_ns_type(struct kobject *kobj) -{ -	const struct kobj_ns_type_operations *ops; -	enum kobj_ns_type type; - -	ops = kobj_child_ns_ops(kobj); -	if (!ops) -		return KOBJ_NS_TYPE_NONE; - -	type = ops->type; -	BUG_ON(type <= KOBJ_NS_TYPE_NONE); -	BUG_ON(type >= KOBJ_NS_TYPES); -	BUG_ON(!kobj_ns_type_registered(type)); - -	return type; -} - -/**   * sysfs_create_dir_ns - create a directory for an object with a namespace tag   * @kobj: object we're creating directory for   * @ns: the namespace tag to use   */  int sysfs_create_dir_ns(struct kobject *kobj, const void *ns)  { -	enum kobj_ns_type type; -	struct sysfs_dirent *parent_sd, *sd; -	int error = 0; +	struct kernfs_node *parent, *kn;  	BUG_ON(!kobj);  	if (kobj->parent) -		parent_sd = kobj->parent->sd; +		parent = kobj->parent->sd;  	else -		parent_sd = &sysfs_root; +		parent = sysfs_root_kn; -	if (!parent_sd) +	if (!parent)  		return -ENOENT; -	type = sysfs_read_ns_type(kobj); - -	error = create_dir(kobj, parent_sd, type, kobject_name(kobj), ns, &sd); -	if (!error) -		kobj->sd = sd; -	return error; -} - -static struct dentry *sysfs_lookup(struct inode *dir, struct dentry *dentry, -				   unsigned int flags) -{ -	struct dentry *ret = NULL; -	struct dentry *parent = dentry->d_parent; -	struct sysfs_dirent *parent_sd = parent->d_fsdata; -	struct sysfs_dirent *sd; -	struct inode *inode; -	enum kobj_ns_type type; -	const void *ns; - -	mutex_lock(&sysfs_mutex); - -	type = sysfs_ns_type(parent_sd); -	ns = sysfs_info(dir->i_sb)->ns[type]; - -	sd = sysfs_find_dirent(parent_sd, dentry->d_name.name, ns); - -	/* no such entry */ -	if (!sd) { -		ret = ERR_PTR(-ENOENT); -		goto out_unlock; -	} -	dentry->d_fsdata = sysfs_get(sd); - -	/* attach dentry and inode */ -	inode = sysfs_get_inode(dir->i_sb, sd); -	if (!inode) { -		ret = ERR_PTR(-ENOMEM); -		goto out_unlock; -	} - -	/* instantiate and hash dentry */ -	ret = d_materialise_unique(dentry, inode); - out_unlock: -	mutex_unlock(&sysfs_mutex); -	return ret; -} - -const struct inode_operations sysfs_dir_inode_operations = { -	.lookup		= sysfs_lookup, -	.permission	= sysfs_permission, -	.setattr	= sysfs_setattr, -	.getattr	= sysfs_getattr, -	.setxattr	= sysfs_setxattr, -}; - -static struct sysfs_dirent *sysfs_leftmost_descendant(struct sysfs_dirent *pos) -{ -	struct sysfs_dirent *last; - -	while (true) { -		struct rb_node *rbn; - -		last = pos; - -		if (sysfs_type(pos) != SYSFS_DIR) -			break; - -		rbn = rb_first(&pos->s_dir.children); -		if (!rbn) -			break; - -		pos = to_sysfs_dirent(rbn); -	} - -	return last; -} - -/** - * sysfs_next_descendant_post - find the next descendant for post-order walk - * @pos: the current position (%NULL to initiate traversal) - * @root: sysfs_dirent whose descendants to walk - * - * Find the next descendant to visit for post-order traversal of @root's - * descendants.  @root is included in the iteration and the last node to be - * visited. - */ -static struct sysfs_dirent *sysfs_next_descendant_post(struct sysfs_dirent *pos, -						       struct sysfs_dirent *root) -{ -	struct rb_node *rbn; - -	lockdep_assert_held(&sysfs_mutex); - -	/* if first iteration, visit leftmost descendant which may be root */ -	if (!pos) -		return sysfs_leftmost_descendant(root); - -	/* if we visited @root, we're done */ -	if (pos == root) -		return NULL; - -	/* if there's an unvisited sibling, visit its leftmost descendant */ -	rbn = rb_next(&pos->s_rb); -	if (rbn) -		return sysfs_leftmost_descendant(to_sysfs_dirent(rbn)); - -	/* no sibling left, visit parent */ -	return pos->s_parent; -} - -static void __sysfs_remove(struct sysfs_addrm_cxt *acxt, -			   struct sysfs_dirent *sd) -{ -	struct sysfs_dirent *pos, *next; - -	if (!sd) -		return; - -	pr_debug("sysfs %s: removing\n", sd->s_name); - -	next = NULL; -	do { -		pos = next; -		next = sysfs_next_descendant_post(pos, sd); -		if (pos) -			sysfs_remove_one(acxt, pos); -	} while (next); -} - -/** - * sysfs_remove - remove a sysfs_dirent recursively - * @sd: the sysfs_dirent to remove - * - * Remove @sd along with all its subdirectories and files. - */ -void sysfs_remove(struct sysfs_dirent *sd) -{ -	struct sysfs_addrm_cxt acxt; - -	sysfs_addrm_start(&acxt); -	__sysfs_remove(&acxt, sd); -	sysfs_addrm_finish(&acxt); -} - -/** - * sysfs_hash_and_remove - find a sysfs_dirent by name and remove it - * @dir_sd: parent of the target - * @name: name of the sysfs_dirent to remove - * @ns: namespace tag of the sysfs_dirent to remove - * - * Look for the sysfs_dirent with @name and @ns under @dir_sd and remove - * it.  Returns 0 on success, -ENOENT if such entry doesn't exist. - */ -int sysfs_hash_and_remove(struct sysfs_dirent *dir_sd, const char *name, -			  const void *ns) -{ -	struct sysfs_addrm_cxt acxt; -	struct sysfs_dirent *sd; - -	if (!dir_sd) { -		WARN(1, KERN_WARNING "sysfs: can not remove '%s', no directory\n", -			name); -		return -ENOENT; +	kn = kernfs_create_dir_ns(parent, kobject_name(kobj), +				  S_IRWXU | S_IRUGO | S_IXUGO, kobj, ns); +	if (IS_ERR(kn)) { +		if (PTR_ERR(kn) == -EEXIST) +			sysfs_warn_dup(parent, kobject_name(kobj)); +		return PTR_ERR(kn);  	} -	sysfs_addrm_start(&acxt); - -	sd = sysfs_find_dirent(dir_sd, name, ns); -	if (sd) -		__sysfs_remove(&acxt, sd); - -	sysfs_addrm_finish(&acxt); - -	if (sd) -		return 0; -	else -		return -ENOENT; +	kobj->sd = kn; +	return 0;  }  /** @@ -940,207 +95,47 @@ int sysfs_hash_and_remove(struct sysfs_dirent *dir_sd, const char *name,   */  void sysfs_remove_dir(struct kobject *kobj)  { -	struct sysfs_dirent *sd = kobj->sd; +	struct kernfs_node *kn = kobj->sd;  	/*  	 * In general, kboject owner is responsible for ensuring removal  	 * doesn't race with other operations and sysfs doesn't provide any  	 * protection; however, when @kobj is used as a symlink target, the  	 * symlinking entity usually doesn't own @kobj and thus has no -	 * control over removal.  @kobj->sd may be removed anytime and -	 * symlink code may end up dereferencing an already freed sd. +	 * control over removal.  @kobj->sd may be removed anytime +	 * and symlink code may end up dereferencing an already freed node.  	 * -	 * sysfs_symlink_target_lock synchronizes @kobj->sd disassociation -	 * against symlink operations so that symlink code can safely -	 * dereference @kobj->sd. +	 * sysfs_symlink_target_lock synchronizes @kobj->sd +	 * disassociation against symlink operations so that symlink code +	 * can safely dereference @kobj->sd.  	 */  	spin_lock(&sysfs_symlink_target_lock);  	kobj->sd = NULL;  	spin_unlock(&sysfs_symlink_target_lock); -	if (sd) { -		WARN_ON_ONCE(sysfs_type(sd) != SYSFS_DIR); -		sysfs_remove(sd); +	if (kn) { +		WARN_ON_ONCE(kernfs_type(kn) != KERNFS_DIR); +		kernfs_remove(kn);  	}  } -int sysfs_rename(struct sysfs_dirent *sd, struct sysfs_dirent *new_parent_sd, -		 const char *new_name, const void *new_ns) -{ -	int error; - -	mutex_lock(&sysfs_mutex); - -	error = 0; -	if ((sd->s_parent == new_parent_sd) && (sd->s_ns == new_ns) && -	    (strcmp(sd->s_name, new_name) == 0)) -		goto out;	/* nothing to rename */ - -	error = -EEXIST; -	if (sysfs_find_dirent(new_parent_sd, new_name, new_ns)) -		goto out; - -	/* rename sysfs_dirent */ -	if (strcmp(sd->s_name, new_name) != 0) { -		error = -ENOMEM; -		new_name = kstrdup(new_name, GFP_KERNEL); -		if (!new_name) -			goto out; - -		kfree(sd->s_name); -		sd->s_name = new_name; -	} - -	/* -	 * Move to the appropriate place in the appropriate directories rbtree. -	 */ -	sysfs_unlink_sibling(sd); -	sysfs_get(new_parent_sd); -	sysfs_put(sd->s_parent); -	sd->s_ns = new_ns; -	sd->s_hash = sysfs_name_hash(sd->s_name, sd->s_ns); -	sd->s_parent = new_parent_sd; -	sysfs_link_sibling(sd); - -	error = 0; - out: -	mutex_unlock(&sysfs_mutex); -	return error; -} -  int sysfs_rename_dir_ns(struct kobject *kobj, const char *new_name,  			const void *new_ns)  { -	struct sysfs_dirent *parent_sd = kobj->sd->s_parent; +	struct kernfs_node *parent = kobj->sd->parent; -	return sysfs_rename(kobj->sd, parent_sd, new_name, new_ns); +	return kernfs_rename_ns(kobj->sd, parent, new_name, new_ns);  }  int sysfs_move_dir_ns(struct kobject *kobj, struct kobject *new_parent_kobj,  		      const void *new_ns)  { -	struct sysfs_dirent *sd = kobj->sd; -	struct sysfs_dirent *new_parent_sd; +	struct kernfs_node *kn = kobj->sd; +	struct kernfs_node *new_parent; -	BUG_ON(!sd->s_parent); -	new_parent_sd = new_parent_kobj && new_parent_kobj->sd ? -		new_parent_kobj->sd : &sysfs_root; +	BUG_ON(!kn->parent); +	new_parent = new_parent_kobj && new_parent_kobj->sd ? +		new_parent_kobj->sd : sysfs_root_kn; -	return sysfs_rename(sd, new_parent_sd, sd->s_name, new_ns); +	return kernfs_rename_ns(kn, new_parent, kn->name, new_ns);  } - -/* Relationship between s_mode and the DT_xxx types */ -static inline unsigned char dt_type(struct sysfs_dirent *sd) -{ -	return (sd->s_mode >> 12) & 15; -} - -static int sysfs_dir_release(struct inode *inode, struct file *filp) -{ -	sysfs_put(filp->private_data); -	return 0; -} - -static struct sysfs_dirent *sysfs_dir_pos(const void *ns, -	struct sysfs_dirent *parent_sd,	loff_t hash, struct sysfs_dirent *pos) -{ -	if (pos) { -		int valid = !(pos->s_flags & SYSFS_FLAG_REMOVED) && -			pos->s_parent == parent_sd && -			hash == pos->s_hash; -		sysfs_put(pos); -		if (!valid) -			pos = NULL; -	} -	if (!pos && (hash > 1) && (hash < INT_MAX)) { -		struct rb_node *node = parent_sd->s_dir.children.rb_node; -		while (node) { -			pos = to_sysfs_dirent(node); - -			if (hash < pos->s_hash) -				node = node->rb_left; -			else if (hash > pos->s_hash) -				node = node->rb_right; -			else -				break; -		} -	} -	/* Skip over entries in the wrong namespace */ -	while (pos && pos->s_ns != ns) { -		struct rb_node *node = rb_next(&pos->s_rb); -		if (!node) -			pos = NULL; -		else -			pos = to_sysfs_dirent(node); -	} -	return pos; -} - -static struct sysfs_dirent *sysfs_dir_next_pos(const void *ns, -	struct sysfs_dirent *parent_sd,	ino_t ino, struct sysfs_dirent *pos) -{ -	pos = sysfs_dir_pos(ns, parent_sd, ino, pos); -	if (pos) -		do { -			struct rb_node *node = rb_next(&pos->s_rb); -			if (!node) -				pos = NULL; -			else -				pos = to_sysfs_dirent(node); -		} while (pos && pos->s_ns != ns); -	return pos; -} - -static int sysfs_readdir(struct file *file, struct dir_context *ctx) -{ -	struct dentry *dentry = file->f_path.dentry; -	struct sysfs_dirent *parent_sd = dentry->d_fsdata; -	struct sysfs_dirent *pos = file->private_data; -	enum kobj_ns_type type; -	const void *ns; - -	type = sysfs_ns_type(parent_sd); -	ns = sysfs_info(dentry->d_sb)->ns[type]; - -	if (!dir_emit_dots(file, ctx)) -		return 0; -	mutex_lock(&sysfs_mutex); -	for (pos = sysfs_dir_pos(ns, parent_sd, ctx->pos, pos); -	     pos; -	     pos = sysfs_dir_next_pos(ns, parent_sd, ctx->pos, pos)) { -		const char *name = pos->s_name; -		unsigned int type = dt_type(pos); -		int len = strlen(name); -		ino_t ino = pos->s_ino; -		ctx->pos = pos->s_hash; -		file->private_data = sysfs_get(pos); - -		mutex_unlock(&sysfs_mutex); -		if (!dir_emit(ctx, name, len, ino, type)) -			return 0; -		mutex_lock(&sysfs_mutex); -	} -	mutex_unlock(&sysfs_mutex); -	file->private_data = NULL; -	ctx->pos = INT_MAX; -	return 0; -} - -static loff_t sysfs_dir_llseek(struct file *file, loff_t offset, int whence) -{ -	struct inode *inode = file_inode(file); -	loff_t ret; - -	mutex_lock(&inode->i_mutex); -	ret = generic_file_llseek(file, offset, whence); -	mutex_unlock(&inode->i_mutex); - -	return ret; -} - -const struct file_operations sysfs_dir_operations = { -	.read		= generic_read_dir, -	.iterate	= sysfs_readdir, -	.release	= sysfs_dir_release, -	.llseek		= sysfs_dir_llseek, -}; diff --git a/fs/sysfs/file.c b/fs/sysfs/file.c index b94f93685093..810cf6e613e5 100644 --- a/fs/sysfs/file.c +++ b/fs/sysfs/file.c @@ -14,70 +14,23 @@  #include <linux/kobject.h>  #include <linux/kallsyms.h>  #include <linux/slab.h> -#include <linux/fsnotify.h> -#include <linux/namei.h> -#include <linux/poll.h>  #include <linux/list.h>  #include <linux/mutex.h> -#include <linux/limits.h> -#include <linux/uaccess.h>  #include <linux/seq_file.h> -#include <linux/mm.h>  #include "sysfs.h" +#include "../kernfs/kernfs-internal.h"  /* - * There's one sysfs_open_file for each open file and one sysfs_open_dirent - * for each sysfs_dirent with one or more open files. - * - * sysfs_dirent->s_attr.open points to sysfs_open_dirent.  s_attr.open is - * protected by sysfs_open_dirent_lock. - * - * filp->private_data points to seq_file whose ->private points to - * sysfs_open_file.  sysfs_open_files are chained at - * sysfs_open_dirent->files, which is protected by sysfs_open_file_mutex. - */ -static DEFINE_SPINLOCK(sysfs_open_dirent_lock); -static DEFINE_MUTEX(sysfs_open_file_mutex); - -struct sysfs_open_dirent { -	atomic_t		refcnt; -	atomic_t		event; -	wait_queue_head_t	poll; -	struct list_head	files; /* goes through sysfs_open_file.list */ -}; - -struct sysfs_open_file { -	struct sysfs_dirent	*sd; -	struct file		*file; -	struct mutex		mutex; -	int			event; -	struct list_head	list; - -	bool			mmapped; -	const struct vm_operations_struct *vm_ops; -}; - -static bool sysfs_is_bin(struct sysfs_dirent *sd) -{ -	return sysfs_type(sd) == SYSFS_KOBJ_BIN_ATTR; -} - -static struct sysfs_open_file *sysfs_of(struct file *file) -{ -	return ((struct seq_file *)file->private_data)->private; -} - -/* - * Determine ktype->sysfs_ops for the given sysfs_dirent.  This function + * Determine ktype->sysfs_ops for the given kernfs_node.  This function   * must be called while holding an active reference.   */ -static const struct sysfs_ops *sysfs_file_ops(struct sysfs_dirent *sd) +static const struct sysfs_ops *sysfs_file_ops(struct kernfs_node *kn)  { -	struct kobject *kobj = sd->s_parent->s_dir.kobj; +	struct kobject *kobj = kn->parent->priv; -	if (!sysfs_ignore_lockdep(sd)) -		lockdep_assert_held(sd); +	if (kn->flags & KERNFS_LOCKDEP) +		lockdep_assert_held(kn);  	return kobj->ktype ? kobj->ktype->sysfs_ops : NULL;  } @@ -86,13 +39,13 @@ static const struct sysfs_ops *sysfs_file_ops(struct sysfs_dirent *sd)   * details like buffering and seeking.  The following function pipes   * sysfs_ops->show() result through seq_file.   */ -static int sysfs_seq_show(struct seq_file *sf, void *v) +static int sysfs_kf_seq_show(struct seq_file *sf, void *v)  { -	struct sysfs_open_file *of = sf->private; -	struct kobject *kobj = of->sd->s_parent->s_dir.kobj; -	const struct sysfs_ops *ops; -	char *buf; +	struct kernfs_open_file *of = sf->private; +	struct kobject *kobj = of->kn->parent->priv; +	const struct sysfs_ops *ops = sysfs_file_ops(of->kn);  	ssize_t count; +	char *buf;  	/* acquire buffer and ensure that it's >= PAGE_SIZE */  	count = seq_get_buf(sf, &buf); @@ -102,34 +55,15 @@ static int sysfs_seq_show(struct seq_file *sf, void *v)  	}  	/* -	 * Need @of->sd for attr and ops, its parent for kobj.  @of->mutex -	 * nests outside active ref and is just to ensure that the ops -	 * aren't called concurrently for the same open file. +	 * Invoke show().  Control may reach here via seq file lseek even +	 * if @ops->show() isn't implemented.  	 */ -	mutex_lock(&of->mutex); -	if (!sysfs_get_active(of->sd)) { -		mutex_unlock(&of->mutex); -		return -ENODEV; +	if (ops->show) { +		count = ops->show(kobj, of->kn->priv, buf); +		if (count < 0) +			return count;  	} -	of->event = atomic_read(&of->sd->s_attr.open->event); - -	/* -	 * Lookup @ops and invoke show().  Control may reach here via seq -	 * file lseek even if @ops->show() isn't implemented. -	 */ -	ops = sysfs_file_ops(of->sd); -	if (ops->show) -		count = ops->show(kobj, of->sd->s_attr.attr, buf); -	else -		count = 0; - -	sysfs_put_active(of->sd); -	mutex_unlock(&of->mutex); - -	if (count < 0) -		return count; -  	/*  	 * The code works fine with PAGE_SIZE return but it's likely to  	 * indicate truncated result or overflow in normal use cases. @@ -144,728 +78,194 @@ static int sysfs_seq_show(struct seq_file *sf, void *v)  	return 0;  } -/* - * Read method for bin files.  As reading a bin file can have side-effects, - * the exact offset and bytes specified in read(2) call should be passed to - * the read callback making it difficult to use seq_file.  Implement - * simplistic custom buffering for bin files. - */ -static ssize_t sysfs_bin_read(struct file *file, char __user *userbuf, -			      size_t bytes, loff_t *off) +static ssize_t sysfs_kf_bin_read(struct kernfs_open_file *of, char *buf, +				 size_t count, loff_t pos)  { -	struct sysfs_open_file *of = sysfs_of(file); -	struct bin_attribute *battr = of->sd->s_attr.bin_attr; -	struct kobject *kobj = of->sd->s_parent->s_dir.kobj; -	loff_t size = file_inode(file)->i_size; -	int count = min_t(size_t, bytes, PAGE_SIZE); -	loff_t offs = *off; -	char *buf; +	struct bin_attribute *battr = of->kn->priv; +	struct kobject *kobj = of->kn->parent->priv; +	loff_t size = file_inode(of->file)->i_size; -	if (!bytes) +	if (!count)  		return 0;  	if (size) { -		if (offs > size) +		if (pos > size)  			return 0; -		if (offs + count > size) -			count = size - offs; -	} - -	buf = kmalloc(count, GFP_KERNEL); -	if (!buf) -		return -ENOMEM; - -	/* need of->sd for battr, its parent for kobj */ -	mutex_lock(&of->mutex); -	if (!sysfs_get_active(of->sd)) { -		count = -ENODEV; -		mutex_unlock(&of->mutex); -		goto out_free; -	} - -	if (battr->read) -		count = battr->read(file, kobj, battr, buf, offs, count); -	else -		count = -EIO; - -	sysfs_put_active(of->sd); -	mutex_unlock(&of->mutex); - -	if (count < 0) -		goto out_free; - -	if (copy_to_user(userbuf, buf, count)) { -		count = -EFAULT; -		goto out_free; +		if (pos + count > size) +			count = size - pos;  	} -	pr_debug("offs = %lld, *off = %lld, count = %d\n", offs, *off, count); - -	*off = offs + count; +	if (!battr->read) +		return -EIO; - out_free: -	kfree(buf); -	return count; +	return battr->read(of->file, kobj, battr, buf, pos, count);  } -/** - * flush_write_buffer - push buffer to kobject - * @of: open file - * @buf: data buffer for file - * @off: file offset to write to - * @count: number of bytes - * - * Get the correct pointers for the kobject and the attribute we're dealing - * with, then call the store() method for it with @buf. - */ -static int flush_write_buffer(struct sysfs_open_file *of, char *buf, loff_t off, -			      size_t count) +/* kernfs write callback for regular sysfs files */ +static ssize_t sysfs_kf_write(struct kernfs_open_file *of, char *buf, +			      size_t count, loff_t pos)  { -	struct kobject *kobj = of->sd->s_parent->s_dir.kobj; -	int rc = 0; - -	/* -	 * Need @of->sd for attr and ops, its parent for kobj.  @of->mutex -	 * nests outside active ref and is just to ensure that the ops -	 * aren't called concurrently for the same open file. -	 */ -	mutex_lock(&of->mutex); -	if (!sysfs_get_active(of->sd)) { -		mutex_unlock(&of->mutex); -		return -ENODEV; -	} +	const struct sysfs_ops *ops = sysfs_file_ops(of->kn); +	struct kobject *kobj = of->kn->parent->priv; -	if (sysfs_is_bin(of->sd)) { -		struct bin_attribute *battr = of->sd->s_attr.bin_attr; - -		rc = -EIO; -		if (battr->write) -			rc = battr->write(of->file, kobj, battr, buf, off, -					  count); -	} else { -		const struct sysfs_ops *ops = sysfs_file_ops(of->sd); - -		rc = ops->store(kobj, of->sd->s_attr.attr, buf, count); -	} - -	sysfs_put_active(of->sd); -	mutex_unlock(&of->mutex); +	if (!count) +		return 0; -	return rc; +	return ops->store(kobj, of->kn->priv, buf, count);  } -/** - * sysfs_write_file - write an attribute - * @file: file pointer - * @user_buf: data to write - * @count: number of bytes - * @ppos: starting offset - * - * Copy data in from userland and pass it to the matching - * sysfs_ops->store() by invoking flush_write_buffer(). - * - * There is no easy way for us to know if userspace is only doing a partial - * write, so we don't support them. We expect the entire buffer to come on - * the first write.  Hint: if you're writing a value, first read the file, - * modify only the the value you're changing, then write entire buffer - * back. - */ -static ssize_t sysfs_write_file(struct file *file, const char __user *user_buf, -				size_t count, loff_t *ppos) +/* kernfs write callback for bin sysfs files */ +static ssize_t sysfs_kf_bin_write(struct kernfs_open_file *of, char *buf, +				  size_t count, loff_t pos)  { -	struct sysfs_open_file *of = sysfs_of(file); -	ssize_t len = min_t(size_t, count, PAGE_SIZE); -	loff_t size = file_inode(file)->i_size; -	char *buf; +	struct bin_attribute *battr = of->kn->priv; +	struct kobject *kobj = of->kn->parent->priv; +	loff_t size = file_inode(of->file)->i_size; -	if (sysfs_is_bin(of->sd) && size) { -		if (size <= *ppos) +	if (size) { +		if (size <= pos)  			return 0; -		len = min_t(ssize_t, len, size - *ppos); +		count = min_t(ssize_t, count, size - pos);  	} - -	if (!len) +	if (!count)  		return 0; -	buf = kmalloc(len + 1, GFP_KERNEL); -	if (!buf) -		return -ENOMEM; +	if (!battr->write) +		return -EIO; -	if (copy_from_user(buf, user_buf, len)) { -		len = -EFAULT; -		goto out_free; -	} -	buf[len] = '\0';	/* guarantee string termination */ - -	len = flush_write_buffer(of, buf, *ppos, len); -	if (len > 0) -		*ppos += len; -out_free: -	kfree(buf); -	return len; -} - -static void sysfs_bin_vma_open(struct vm_area_struct *vma) -{ -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); - -	if (!of->vm_ops) -		return; - -	if (!sysfs_get_active(of->sd)) -		return; - -	if (of->vm_ops->open) -		of->vm_ops->open(vma); - -	sysfs_put_active(of->sd); +	return battr->write(of->file, kobj, battr, buf, pos, count);  } -static int sysfs_bin_fault(struct vm_area_struct *vma, struct vm_fault *vmf) +static int sysfs_kf_bin_mmap(struct kernfs_open_file *of, +			     struct vm_area_struct *vma)  { -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	int ret; +	struct bin_attribute *battr = of->kn->priv; +	struct kobject *kobj = of->kn->parent->priv; -	if (!of->vm_ops) -		return VM_FAULT_SIGBUS; - -	if (!sysfs_get_active(of->sd)) -		return VM_FAULT_SIGBUS; - -	ret = VM_FAULT_SIGBUS; -	if (of->vm_ops->fault) -		ret = of->vm_ops->fault(vma, vmf); - -	sysfs_put_active(of->sd); -	return ret; +	return battr->mmap(of->file, kobj, battr, vma);  } -static int sysfs_bin_page_mkwrite(struct vm_area_struct *vma, -				  struct vm_fault *vmf) +void sysfs_notify(struct kobject *kobj, const char *dir, const char *attr)  { -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	int ret; - -	if (!of->vm_ops) -		return VM_FAULT_SIGBUS; +	struct kernfs_node *kn = kobj->sd, *tmp; -	if (!sysfs_get_active(of->sd)) -		return VM_FAULT_SIGBUS; - -	ret = 0; -	if (of->vm_ops->page_mkwrite) -		ret = of->vm_ops->page_mkwrite(vma, vmf); +	if (kn && dir) +		kn = kernfs_find_and_get(kn, dir);  	else -		file_update_time(file); - -	sysfs_put_active(of->sd); -	return ret; -} - -static int sysfs_bin_access(struct vm_area_struct *vma, unsigned long addr, -			    void *buf, int len, int write) -{ -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	int ret; - -	if (!of->vm_ops) -		return -EINVAL; - -	if (!sysfs_get_active(of->sd)) -		return -EINVAL; - -	ret = -EINVAL; -	if (of->vm_ops->access) -		ret = of->vm_ops->access(vma, addr, buf, len, write); - -	sysfs_put_active(of->sd); -	return ret; -} - -#ifdef CONFIG_NUMA -static int sysfs_bin_set_policy(struct vm_area_struct *vma, -				struct mempolicy *new) -{ -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	int ret; - -	if (!of->vm_ops) -		return 0; - -	if (!sysfs_get_active(of->sd)) -		return -EINVAL; - -	ret = 0; -	if (of->vm_ops->set_policy) -		ret = of->vm_ops->set_policy(vma, new); - -	sysfs_put_active(of->sd); -	return ret; -} - -static struct mempolicy *sysfs_bin_get_policy(struct vm_area_struct *vma, -					      unsigned long addr) -{ -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	struct mempolicy *pol; - -	if (!of->vm_ops) -		return vma->vm_policy; - -	if (!sysfs_get_active(of->sd)) -		return vma->vm_policy; - -	pol = vma->vm_policy; -	if (of->vm_ops->get_policy) -		pol = of->vm_ops->get_policy(vma, addr); - -	sysfs_put_active(of->sd); -	return pol; -} - -static int sysfs_bin_migrate(struct vm_area_struct *vma, const nodemask_t *from, -			     const nodemask_t *to, unsigned long flags) -{ -	struct file *file = vma->vm_file; -	struct sysfs_open_file *of = sysfs_of(file); -	int ret; - -	if (!of->vm_ops) -		return 0; - -	if (!sysfs_get_active(of->sd)) -		return 0; - -	ret = 0; -	if (of->vm_ops->migrate) -		ret = of->vm_ops->migrate(vma, from, to, flags); - -	sysfs_put_active(of->sd); -	return ret; -} -#endif - -static const struct vm_operations_struct sysfs_bin_vm_ops = { -	.open		= sysfs_bin_vma_open, -	.fault		= sysfs_bin_fault, -	.page_mkwrite	= sysfs_bin_page_mkwrite, -	.access		= sysfs_bin_access, -#ifdef CONFIG_NUMA -	.set_policy	= sysfs_bin_set_policy, -	.get_policy	= sysfs_bin_get_policy, -	.migrate	= sysfs_bin_migrate, -#endif -}; - -static int sysfs_bin_mmap(struct file *file, struct vm_area_struct *vma) -{ -	struct sysfs_open_file *of = sysfs_of(file); -	struct bin_attribute *battr = of->sd->s_attr.bin_attr; -	struct kobject *kobj = of->sd->s_parent->s_dir.kobj; -	int rc; - -	mutex_lock(&of->mutex); - -	/* need of->sd for battr, its parent for kobj */ -	rc = -ENODEV; -	if (!sysfs_get_active(of->sd)) -		goto out_unlock; - -	if (!battr->mmap) -		goto out_put; - -	rc = battr->mmap(file, kobj, battr, vma); -	if (rc) -		goto out_put; - -	/* -	 * PowerPC's pci_mmap of legacy_mem uses shmem_zero_setup() -	 * to satisfy versions of X which crash if the mmap fails: that -	 * substitutes a new vm_file, and we don't then want bin_vm_ops. -	 */ -	if (vma->vm_file != file) -		goto out_put; - -	rc = -EINVAL; -	if (of->mmapped && of->vm_ops != vma->vm_ops) -		goto out_put; +		kernfs_get(kn); -	/* -	 * It is not possible to successfully wrap close. -	 * So error if someone is trying to use close. -	 */ -	rc = -EINVAL; -	if (vma->vm_ops && vma->vm_ops->close) -		goto out_put; - -	rc = 0; -	of->mmapped = 1; -	of->vm_ops = vma->vm_ops; -	vma->vm_ops = &sysfs_bin_vm_ops; -out_put: -	sysfs_put_active(of->sd); -out_unlock: -	mutex_unlock(&of->mutex); - -	return rc; -} - -/** - *	sysfs_get_open_dirent - get or create sysfs_open_dirent - *	@sd: target sysfs_dirent - *	@of: sysfs_open_file for this instance of open - * - *	If @sd->s_attr.open exists, increment its reference count; - *	otherwise, create one.  @of is chained to the files list. - * - *	LOCKING: - *	Kernel thread context (may sleep). - * - *	RETURNS: - *	0 on success, -errno on failure. - */ -static int sysfs_get_open_dirent(struct sysfs_dirent *sd, -				 struct sysfs_open_file *of) -{ -	struct sysfs_open_dirent *od, *new_od = NULL; - - retry: -	mutex_lock(&sysfs_open_file_mutex); -	spin_lock_irq(&sysfs_open_dirent_lock); - -	if (!sd->s_attr.open && new_od) { -		sd->s_attr.open = new_od; -		new_od = NULL; +	if (kn && attr) { +		tmp = kernfs_find_and_get(kn, attr); +		kernfs_put(kn); +		kn = tmp;  	} -	od = sd->s_attr.open; -	if (od) { -		atomic_inc(&od->refcnt); -		list_add_tail(&of->list, &od->files); -	} - -	spin_unlock_irq(&sysfs_open_dirent_lock); -	mutex_unlock(&sysfs_open_file_mutex); - -	if (od) { -		kfree(new_od); -		return 0; +	if (kn) { +		kernfs_notify(kn); +		kernfs_put(kn);  	} +} +EXPORT_SYMBOL_GPL(sysfs_notify); -	/* not there, initialize a new one and retry */ -	new_od = kmalloc(sizeof(*new_od), GFP_KERNEL); -	if (!new_od) -		return -ENOMEM; +static const struct kernfs_ops sysfs_file_kfops_empty = { +}; -	atomic_set(&new_od->refcnt, 0); -	atomic_set(&new_od->event, 1); -	init_waitqueue_head(&new_od->poll); -	INIT_LIST_HEAD(&new_od->files); -	goto retry; -} +static const struct kernfs_ops sysfs_file_kfops_ro = { +	.seq_show	= sysfs_kf_seq_show, +}; -/** - *	sysfs_put_open_dirent - put sysfs_open_dirent - *	@sd: target sysfs_dirent - *	@of: associated sysfs_open_file - * - *	Put @sd->s_attr.open and unlink @of from the files list.  If - *	reference count reaches zero, disassociate and free it. - * - *	LOCKING: - *	None. - */ -static void sysfs_put_open_dirent(struct sysfs_dirent *sd, -				  struct sysfs_open_file *of) -{ -	struct sysfs_open_dirent *od = sd->s_attr.open; -	unsigned long flags; +static const struct kernfs_ops sysfs_file_kfops_wo = { +	.write		= sysfs_kf_write, +}; -	mutex_lock(&sysfs_open_file_mutex); -	spin_lock_irqsave(&sysfs_open_dirent_lock, flags); +static const struct kernfs_ops sysfs_file_kfops_rw = { +	.seq_show	= sysfs_kf_seq_show, +	.write		= sysfs_kf_write, +}; -	if (of) -		list_del(&of->list); +static const struct kernfs_ops sysfs_bin_kfops_ro = { +	.read		= sysfs_kf_bin_read, +}; -	if (atomic_dec_and_test(&od->refcnt)) -		sd->s_attr.open = NULL; -	else -		od = NULL; +static const struct kernfs_ops sysfs_bin_kfops_wo = { +	.write		= sysfs_kf_bin_write, +}; -	spin_unlock_irqrestore(&sysfs_open_dirent_lock, flags); -	mutex_unlock(&sysfs_open_file_mutex); +static const struct kernfs_ops sysfs_bin_kfops_rw = { +	.read		= sysfs_kf_bin_read, +	.write		= sysfs_kf_bin_write, +}; -	kfree(od); -} +static const struct kernfs_ops sysfs_bin_kfops_mmap = { +	.read		= sysfs_kf_bin_read, +	.write		= sysfs_kf_bin_write, +	.mmap		= sysfs_kf_bin_mmap, +}; -static int sysfs_open_file(struct inode *inode, struct file *file) +int sysfs_add_file_mode_ns(struct kernfs_node *parent, +			   const struct attribute *attr, bool is_bin, +			   umode_t mode, const void *ns)  { -	struct sysfs_dirent *attr_sd = file->f_path.dentry->d_fsdata; -	struct kobject *kobj = attr_sd->s_parent->s_dir.kobj; -	struct sysfs_open_file *of; -	bool has_read, has_write, has_mmap; -	int error = -EACCES; - -	/* need attr_sd for attr and ops, its parent for kobj */ -	if (!sysfs_get_active(attr_sd)) -		return -ENODEV; +	struct lock_class_key *key = NULL; +	const struct kernfs_ops *ops; +	struct kernfs_node *kn; +	loff_t size; -	if (sysfs_is_bin(attr_sd)) { -		struct bin_attribute *battr = attr_sd->s_attr.bin_attr; - -		has_read = battr->read || battr->mmap; -		has_write = battr->write || battr->mmap; -		has_mmap = battr->mmap; -	} else { -		const struct sysfs_ops *ops = sysfs_file_ops(attr_sd); +	if (!is_bin) { +		struct kobject *kobj = parent->priv; +		const struct sysfs_ops *sysfs_ops = kobj->ktype->sysfs_ops;  		/* every kobject with an attribute needs a ktype assigned */ -		if (WARN(!ops, KERN_ERR +		if (WARN(!sysfs_ops, KERN_ERR  			 "missing sysfs attribute operations for kobject: %s\n",  			 kobject_name(kobj))) -			goto err_out; - -		has_read = ops->show; -		has_write = ops->store; -		has_mmap = false; -	} - -	/* check perms and supported operations */ -	if ((file->f_mode & FMODE_WRITE) && -	    (!(inode->i_mode & S_IWUGO) || !has_write)) -		goto err_out; - -	if ((file->f_mode & FMODE_READ) && -	    (!(inode->i_mode & S_IRUGO) || !has_read)) -		goto err_out; - -	/* allocate a sysfs_open_file for the file */ -	error = -ENOMEM; -	of = kzalloc(sizeof(struct sysfs_open_file), GFP_KERNEL); -	if (!of) -		goto err_out; - -	/* -	 * The following is done to give a different lockdep key to -	 * @of->mutex for files which implement mmap.  This is a rather -	 * crude way to avoid false positive lockdep warning around -	 * mm->mmap_sem - mmap nests @of->mutex under mm->mmap_sem and -	 * reading /sys/block/sda/trace/act_mask grabs sr_mutex, under -	 * which mm->mmap_sem nests, while holding @of->mutex.  As each -	 * open file has a separate mutex, it's okay as long as those don't -	 * happen on the same file.  At this point, we can't easily give -	 * each file a separate locking class.  Let's differentiate on -	 * whether the file has mmap or not for now. -	 */ -	if (has_mmap) -		mutex_init(&of->mutex); -	else -		mutex_init(&of->mutex); - -	of->sd = attr_sd; -	of->file = file; - -	/* -	 * Always instantiate seq_file even if read access doesn't use -	 * seq_file or is not requested.  This unifies private data access -	 * and readable regular files are the vast majority anyway. -	 */ -	if (sysfs_is_bin(attr_sd)) -		error = single_open(file, NULL, of); -	else -		error = single_open(file, sysfs_seq_show, of); -	if (error) -		goto err_free; - -	/* seq_file clears PWRITE unconditionally, restore it if WRITE */ -	if (file->f_mode & FMODE_WRITE) -		file->f_mode |= FMODE_PWRITE; - -	/* make sure we have open dirent struct */ -	error = sysfs_get_open_dirent(attr_sd, of); -	if (error) -		goto err_close; - -	/* open succeeded, put active references */ -	sysfs_put_active(attr_sd); -	return 0; - -err_close: -	single_release(inode, file); -err_free: -	kfree(of); -err_out: -	sysfs_put_active(attr_sd); -	return error; -} - -static int sysfs_release(struct inode *inode, struct file *filp) -{ -	struct sysfs_dirent *sd = filp->f_path.dentry->d_fsdata; -	struct sysfs_open_file *of = sysfs_of(filp); - -	sysfs_put_open_dirent(sd, of); -	single_release(inode, filp); -	kfree(of); - -	return 0; -} - -void sysfs_unmap_bin_file(struct sysfs_dirent *sd) -{ -	struct sysfs_open_dirent *od; -	struct sysfs_open_file *of; - -	if (!sysfs_is_bin(sd)) -		return; - -	spin_lock_irq(&sysfs_open_dirent_lock); -	od = sd->s_attr.open; -	if (od) -		atomic_inc(&od->refcnt); -	spin_unlock_irq(&sysfs_open_dirent_lock); -	if (!od) -		return; - -	mutex_lock(&sysfs_open_file_mutex); -	list_for_each_entry(of, &od->files, list) { -		struct inode *inode = file_inode(of->file); -		unmap_mapping_range(inode->i_mapping, 0, 0, 1); +			return -EINVAL; + +		if (sysfs_ops->show && sysfs_ops->store) +			ops = &sysfs_file_kfops_rw; +		else if (sysfs_ops->show) +			ops = &sysfs_file_kfops_ro; +		else if (sysfs_ops->store) +			ops = &sysfs_file_kfops_wo; +		else +			ops = &sysfs_file_kfops_empty; + +		size = PAGE_SIZE; +	} else { +		struct bin_attribute *battr = (void *)attr; + +		if (battr->mmap) +			ops = &sysfs_bin_kfops_mmap; +		else if (battr->read && battr->write) +			ops = &sysfs_bin_kfops_rw; +		else if (battr->read) +			ops = &sysfs_bin_kfops_ro; +		else if (battr->write) +			ops = &sysfs_bin_kfops_wo; +		else +			ops = &sysfs_file_kfops_empty; + +		size = battr->size;  	} -	mutex_unlock(&sysfs_open_file_mutex); - -	sysfs_put_open_dirent(sd, NULL); -} - -/* Sysfs attribute files are pollable.  The idea is that you read - * the content and then you use 'poll' or 'select' to wait for - * the content to change.  When the content changes (assuming the - * manager for the kobject supports notification), poll will - * return POLLERR|POLLPRI, and select will return the fd whether - * it is waiting for read, write, or exceptions. - * Once poll/select indicates that the value has changed, you - * need to close and re-open the file, or seek to 0 and read again. - * Reminder: this only works for attributes which actively support - * it, and it is not possible to test an attribute from userspace - * to see if it supports poll (Neither 'poll' nor 'select' return - * an appropriate error code).  When in doubt, set a suitable timeout value. - */ -static unsigned int sysfs_poll(struct file *filp, poll_table *wait) -{ -	struct sysfs_open_file *of = sysfs_of(filp); -	struct sysfs_dirent *attr_sd = filp->f_path.dentry->d_fsdata; -	struct sysfs_open_dirent *od = attr_sd->s_attr.open; - -	/* need parent for the kobj, grab both */ -	if (!sysfs_get_active(attr_sd)) -		goto trigger; - -	poll_wait(filp, &od->poll, wait); -	sysfs_put_active(attr_sd); - -	if (of->event != atomic_read(&od->event)) -		goto trigger; - -	return DEFAULT_POLLMASK; - - trigger: -	return DEFAULT_POLLMASK|POLLERR|POLLPRI; -} - -void sysfs_notify_dirent(struct sysfs_dirent *sd) -{ -	struct sysfs_open_dirent *od; -	unsigned long flags; - -	spin_lock_irqsave(&sysfs_open_dirent_lock, flags); - -	if (!WARN_ON(sysfs_type(sd) != SYSFS_KOBJ_ATTR)) { -		od = sd->s_attr.open; -		if (od) { -			atomic_inc(&od->event); -			wake_up_interruptible(&od->poll); -		} +#ifdef CONFIG_DEBUG_LOCK_ALLOC +	if (!attr->ignore_lockdep) +		key = attr->key ?: (struct lock_class_key *)&attr->skey; +#endif +	kn = __kernfs_create_file(parent, attr->name, mode, size, ops, +				  (void *)attr, ns, true, key); +	if (IS_ERR(kn)) { +		if (PTR_ERR(kn) == -EEXIST) +			sysfs_warn_dup(parent, attr->name); +		return PTR_ERR(kn);  	} - -	spin_unlock_irqrestore(&sysfs_open_dirent_lock, flags); -} -EXPORT_SYMBOL_GPL(sysfs_notify_dirent); - -void sysfs_notify(struct kobject *k, const char *dir, const char *attr) -{ -	struct sysfs_dirent *sd = k->sd; - -	mutex_lock(&sysfs_mutex); - -	if (sd && dir) -		sd = sysfs_find_dirent(sd, dir, NULL); -	if (sd && attr) -		sd = sysfs_find_dirent(sd, attr, NULL); -	if (sd) -		sysfs_notify_dirent(sd); - -	mutex_unlock(&sysfs_mutex); -} -EXPORT_SYMBOL_GPL(sysfs_notify); - -const struct file_operations sysfs_file_operations = { -	.read		= seq_read, -	.write		= sysfs_write_file, -	.llseek		= generic_file_llseek, -	.open		= sysfs_open_file, -	.release	= sysfs_release, -	.poll		= sysfs_poll, -}; - -const struct file_operations sysfs_bin_operations = { -	.read		= sysfs_bin_read, -	.write		= sysfs_write_file, -	.llseek		= generic_file_llseek, -	.mmap		= sysfs_bin_mmap, -	.open		= sysfs_open_file, -	.release	= sysfs_release, -	.poll		= sysfs_poll, -}; - -int sysfs_add_file_mode_ns(struct sysfs_dirent *dir_sd, -			   const struct attribute *attr, int type, -			   umode_t amode, const void *ns) -{ -	umode_t mode = (amode & S_IALLUGO) | S_IFREG; -	struct sysfs_addrm_cxt acxt; -	struct sysfs_dirent *sd; -	int rc; - -	sd = sysfs_new_dirent(attr->name, mode, type); -	if (!sd) -		return -ENOMEM; - -	sd->s_ns = ns; -	sd->s_attr.attr = (void *)attr; -	sysfs_dirent_init_lockdep(sd); - -	sysfs_addrm_start(&acxt); -	rc = sysfs_add_one(&acxt, sd, dir_sd); -	sysfs_addrm_finish(&acxt); - -	if (rc) -		sysfs_put(sd); - -	return rc; +	return 0;  } - -int sysfs_add_file(struct sysfs_dirent *dir_sd, const struct attribute *attr, -		   int type) +int sysfs_add_file(struct kernfs_node *parent, const struct attribute *attr, +		   bool is_bin)  { -	return sysfs_add_file_mode_ns(dir_sd, attr, type, attr->mode, NULL); +	return sysfs_add_file_mode_ns(parent, attr, is_bin, attr->mode, NULL);  }  /** @@ -879,8 +279,7 @@ int sysfs_create_file_ns(struct kobject *kobj, const struct attribute *attr,  {  	BUG_ON(!kobj || !kobj->sd || !attr); -	return sysfs_add_file_mode_ns(kobj->sd, attr, SYSFS_KOBJ_ATTR, -				      attr->mode, ns); +	return sysfs_add_file_mode_ns(kobj->sd, attr, false, attr->mode, ns);  }  EXPORT_SYMBOL_GPL(sysfs_create_file_ns); @@ -908,19 +307,21 @@ EXPORT_SYMBOL_GPL(sysfs_create_files);  int sysfs_add_file_to_group(struct kobject *kobj,  		const struct attribute *attr, const char *group)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent;  	int error; -	if (group) -		dir_sd = sysfs_get_dirent(kobj->sd, group); -	else -		dir_sd = sysfs_get(kobj->sd); +	if (group) { +		parent = kernfs_find_and_get(kobj->sd, group); +	} else { +		parent = kobj->sd; +		kernfs_get(parent); +	} -	if (!dir_sd) +	if (!parent)  		return -ENOENT; -	error = sysfs_add_file(dir_sd, attr, SYSFS_KOBJ_ATTR); -	sysfs_put(dir_sd); +	error = sysfs_add_file(parent, attr, false); +	kernfs_put(parent);  	return error;  } @@ -936,23 +337,20 @@ EXPORT_SYMBOL_GPL(sysfs_add_file_to_group);  int sysfs_chmod_file(struct kobject *kobj, const struct attribute *attr,  		     umode_t mode)  { -	struct sysfs_dirent *sd; +	struct kernfs_node *kn;  	struct iattr newattrs;  	int rc; -	mutex_lock(&sysfs_mutex); - -	rc = -ENOENT; -	sd = sysfs_find_dirent(kobj->sd, attr->name, NULL); -	if (!sd) -		goto out; +	kn = kernfs_find_and_get(kobj->sd, attr->name); +	if (!kn) +		return -ENOENT; -	newattrs.ia_mode = (mode & S_IALLUGO) | (sd->s_mode & ~S_IALLUGO); +	newattrs.ia_mode = (mode & S_IALLUGO) | (kn->mode & ~S_IALLUGO);  	newattrs.ia_valid = ATTR_MODE; -	rc = sysfs_sd_setattr(sd, &newattrs); - out: -	mutex_unlock(&sysfs_mutex); +	rc = kernfs_setattr(kn, &newattrs); + +	kernfs_put(kn);  	return rc;  }  EXPORT_SYMBOL_GPL(sysfs_chmod_file); @@ -968,9 +366,9 @@ EXPORT_SYMBOL_GPL(sysfs_chmod_file);  void sysfs_remove_file_ns(struct kobject *kobj, const struct attribute *attr,  			  const void *ns)  { -	struct sysfs_dirent *dir_sd = kobj->sd; +	struct kernfs_node *parent = kobj->sd; -	sysfs_hash_and_remove(dir_sd, attr->name, ns); +	kernfs_remove_by_name_ns(parent, attr->name, ns);  }  EXPORT_SYMBOL_GPL(sysfs_remove_file_ns); @@ -991,15 +389,18 @@ EXPORT_SYMBOL_GPL(sysfs_remove_files);  void sysfs_remove_file_from_group(struct kobject *kobj,  		const struct attribute *attr, const char *group)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent; -	if (group) -		dir_sd = sysfs_get_dirent(kobj->sd, group); -	else -		dir_sd = sysfs_get(kobj->sd); -	if (dir_sd) { -		sysfs_hash_and_remove(dir_sd, attr->name, NULL); -		sysfs_put(dir_sd); +	if (group) { +		parent = kernfs_find_and_get(kobj->sd, group); +	} else { +		parent = kobj->sd; +		kernfs_get(parent); +	} + +	if (parent) { +		kernfs_remove_by_name(parent, attr->name); +		kernfs_put(parent);  	}  }  EXPORT_SYMBOL_GPL(sysfs_remove_file_from_group); @@ -1014,7 +415,7 @@ int sysfs_create_bin_file(struct kobject *kobj,  {  	BUG_ON(!kobj || !kobj->sd || !attr); -	return sysfs_add_file(kobj->sd, &attr->attr, SYSFS_KOBJ_BIN_ATTR); +	return sysfs_add_file(kobj->sd, &attr->attr, true);  }  EXPORT_SYMBOL_GPL(sysfs_create_bin_file); @@ -1026,7 +427,7 @@ EXPORT_SYMBOL_GPL(sysfs_create_bin_file);  void sysfs_remove_bin_file(struct kobject *kobj,  			   const struct bin_attribute *attr)  { -	sysfs_hash_and_remove(kobj->sd, attr->attr.name, NULL); +	kernfs_remove_by_name(kobj->sd, attr->attr.name);  }  EXPORT_SYMBOL_GPL(sysfs_remove_bin_file); diff --git a/fs/sysfs/group.c b/fs/sysfs/group.c index 1898a10e38ce..6b579387c67a 100644 --- a/fs/sysfs/group.c +++ b/fs/sysfs/group.c @@ -18,7 +18,7 @@  #include "sysfs.h" -static void remove_files(struct sysfs_dirent *dir_sd, struct kobject *kobj, +static void remove_files(struct kernfs_node *parent, struct kobject *kobj,  			 const struct attribute_group *grp)  {  	struct attribute *const *attr; @@ -26,13 +26,13 @@ static void remove_files(struct sysfs_dirent *dir_sd, struct kobject *kobj,  	if (grp->attrs)  		for (attr = grp->attrs; *attr; attr++) -			sysfs_hash_and_remove(dir_sd, (*attr)->name, NULL); +			kernfs_remove_by_name(parent, (*attr)->name);  	if (grp->bin_attrs)  		for (bin_attr = grp->bin_attrs; *bin_attr; bin_attr++)  			sysfs_remove_bin_file(kobj, *bin_attr);  } -static int create_files(struct sysfs_dirent *dir_sd, struct kobject *kobj, +static int create_files(struct kernfs_node *parent, struct kobject *kobj,  			const struct attribute_group *grp, int update)  {  	struct attribute *const *attr; @@ -49,22 +49,20 @@ static int create_files(struct sysfs_dirent *dir_sd, struct kobject *kobj,  			 * re-adding (if required) the file.  			 */  			if (update) -				sysfs_hash_and_remove(dir_sd, (*attr)->name, -						      NULL); +				kernfs_remove_by_name(parent, (*attr)->name);  			if (grp->is_visible) {  				mode = grp->is_visible(kobj, *attr, i);  				if (!mode)  					continue;  			} -			error = sysfs_add_file_mode_ns(dir_sd, *attr, -						       SYSFS_KOBJ_ATTR, +			error = sysfs_add_file_mode_ns(parent, *attr, false,  						       (*attr)->mode | mode,  						       NULL);  			if (unlikely(error))  				break;  		}  		if (error) { -			remove_files(dir_sd, kobj, grp); +			remove_files(parent, kobj, grp);  			goto exit;  		}  	} @@ -78,7 +76,7 @@ static int create_files(struct sysfs_dirent *dir_sd, struct kobject *kobj,  				break;  		}  		if (error) -			remove_files(dir_sd, kobj, grp); +			remove_files(parent, kobj, grp);  	}  exit:  	return error; @@ -88,7 +86,7 @@ exit:  static int internal_create_group(struct kobject *kobj, int update,  				 const struct attribute_group *grp)  { -	struct sysfs_dirent *sd; +	struct kernfs_node *kn;  	int error;  	BUG_ON(!kobj || (!update && !kobj->sd)); @@ -102,18 +100,22 @@ static int internal_create_group(struct kobject *kobj, int update,  		return -EINVAL;  	}  	if (grp->name) { -		error = sysfs_create_subdir(kobj, grp->name, &sd); -		if (error) -			return error; +		kn = kernfs_create_dir(kobj->sd, grp->name, +				       S_IRWXU | S_IRUGO | S_IXUGO, kobj); +		if (IS_ERR(kn)) { +			if (PTR_ERR(kn) == -EEXIST) +				sysfs_warn_dup(kobj->sd, grp->name); +			return PTR_ERR(kn); +		}  	} else -		sd = kobj->sd; -	sysfs_get(sd); -	error = create_files(sd, kobj, grp, update); +		kn = kobj->sd; +	kernfs_get(kn); +	error = create_files(kn, kobj, grp, update);  	if (error) {  		if (grp->name) -			sysfs_remove(sd); +			kernfs_remove(kn);  	} -	sysfs_put(sd); +	kernfs_put(kn);  	return error;  } @@ -203,25 +205,27 @@ EXPORT_SYMBOL_GPL(sysfs_update_group);  void sysfs_remove_group(struct kobject *kobj,  			const struct attribute_group *grp)  { -	struct sysfs_dirent *dir_sd = kobj->sd; -	struct sysfs_dirent *sd; +	struct kernfs_node *parent = kobj->sd; +	struct kernfs_node *kn;  	if (grp->name) { -		sd = sysfs_get_dirent(dir_sd, grp->name); -		if (!sd) { -			WARN(!sd, KERN_WARNING +		kn = kernfs_find_and_get(parent, grp->name); +		if (!kn) { +			WARN(!kn, KERN_WARNING  			     "sysfs group %p not found for kobject '%s'\n",  			     grp, kobject_name(kobj));  			return;  		} -	} else -		sd = sysfs_get(dir_sd); +	} else { +		kn = parent; +		kernfs_get(kn); +	} -	remove_files(sd, kobj, grp); +	remove_files(kn, kobj, grp);  	if (grp->name) -		sysfs_remove(sd); +		kernfs_remove(kn); -	sysfs_put(sd); +	kernfs_put(kn);  }  EXPORT_SYMBOL_GPL(sysfs_remove_group); @@ -257,22 +261,22 @@ EXPORT_SYMBOL_GPL(sysfs_remove_groups);  int sysfs_merge_group(struct kobject *kobj,  		       const struct attribute_group *grp)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent;  	int error = 0;  	struct attribute *const *attr;  	int i; -	dir_sd = sysfs_get_dirent(kobj->sd, grp->name); -	if (!dir_sd) +	parent = kernfs_find_and_get(kobj->sd, grp->name); +	if (!parent)  		return -ENOENT;  	for ((i = 0, attr = grp->attrs); *attr && !error; (++i, ++attr)) -		error = sysfs_add_file(dir_sd, *attr, SYSFS_KOBJ_ATTR); +		error = sysfs_add_file(parent, *attr, false);  	if (error) {  		while (--i >= 0) -			sysfs_hash_and_remove(dir_sd, (*--attr)->name, NULL); +			kernfs_remove_by_name(parent, (*--attr)->name);  	} -	sysfs_put(dir_sd); +	kernfs_put(parent);  	return error;  } @@ -286,14 +290,14 @@ EXPORT_SYMBOL_GPL(sysfs_merge_group);  void sysfs_unmerge_group(struct kobject *kobj,  		       const struct attribute_group *grp)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent;  	struct attribute *const *attr; -	dir_sd = sysfs_get_dirent(kobj->sd, grp->name); -	if (dir_sd) { +	parent = kernfs_find_and_get(kobj->sd, grp->name); +	if (parent) {  		for (attr = grp->attrs; *attr; ++attr) -			sysfs_hash_and_remove(dir_sd, (*attr)->name, NULL); -		sysfs_put(dir_sd); +			kernfs_remove_by_name(parent, (*attr)->name); +		kernfs_put(parent);  	}  }  EXPORT_SYMBOL_GPL(sysfs_unmerge_group); @@ -308,15 +312,15 @@ EXPORT_SYMBOL_GPL(sysfs_unmerge_group);  int sysfs_add_link_to_group(struct kobject *kobj, const char *group_name,  			    struct kobject *target, const char *link_name)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent;  	int error = 0; -	dir_sd = sysfs_get_dirent(kobj->sd, group_name); -	if (!dir_sd) +	parent = kernfs_find_and_get(kobj->sd, group_name); +	if (!parent)  		return -ENOENT; -	error = sysfs_create_link_sd(dir_sd, target, link_name); -	sysfs_put(dir_sd); +	error = sysfs_create_link_sd(parent, target, link_name); +	kernfs_put(parent);  	return error;  } @@ -331,12 +335,12 @@ EXPORT_SYMBOL_GPL(sysfs_add_link_to_group);  void sysfs_remove_link_from_group(struct kobject *kobj, const char *group_name,  				  const char *link_name)  { -	struct sysfs_dirent *dir_sd; +	struct kernfs_node *parent; -	dir_sd = sysfs_get_dirent(kobj->sd, group_name); -	if (dir_sd) { -		sysfs_hash_and_remove(dir_sd, link_name, NULL); -		sysfs_put(dir_sd); +	parent = kernfs_find_and_get(kobj->sd, group_name); +	if (parent) { +		kernfs_remove_by_name(parent, link_name); +		kernfs_put(parent);  	}  }  EXPORT_SYMBOL_GPL(sysfs_remove_link_from_group); diff --git a/fs/sysfs/inode.c b/fs/sysfs/inode.c deleted file mode 100644 index 1750f790af3b..000000000000 --- a/fs/sysfs/inode.c +++ /dev/null @@ -1,331 +0,0 @@ -/* - * fs/sysfs/inode.c - basic sysfs inode and dentry operations - * - * Copyright (c) 2001-3 Patrick Mochel - * Copyright (c) 2007 SUSE Linux Products GmbH - * Copyright (c) 2007 Tejun Heo <[email protected]> - * - * This file is released under the GPLv2. - * - * Please see Documentation/filesystems/sysfs.txt for more information. - */ - -#undef DEBUG - -#include <linux/pagemap.h> -#include <linux/namei.h> -#include <linux/backing-dev.h> -#include <linux/capability.h> -#include <linux/errno.h> -#include <linux/sched.h> -#include <linux/slab.h> -#include <linux/sysfs.h> -#include <linux/xattr.h> -#include <linux/security.h> -#include "sysfs.h" - -static const struct address_space_operations sysfs_aops = { -	.readpage	= simple_readpage, -	.write_begin	= simple_write_begin, -	.write_end	= simple_write_end, -}; - -static struct backing_dev_info sysfs_backing_dev_info = { -	.name		= "sysfs", -	.ra_pages	= 0,	/* No readahead */ -	.capabilities	= BDI_CAP_NO_ACCT_AND_WRITEBACK, -}; - -static const struct inode_operations sysfs_inode_operations = { -	.permission	= sysfs_permission, -	.setattr	= sysfs_setattr, -	.getattr	= sysfs_getattr, -	.setxattr	= sysfs_setxattr, -}; - -int __init sysfs_inode_init(void) -{ -	return bdi_init(&sysfs_backing_dev_info); -} - -static struct sysfs_inode_attrs *sysfs_init_inode_attrs(struct sysfs_dirent *sd) -{ -	struct sysfs_inode_attrs *attrs; -	struct iattr *iattrs; - -	attrs = kzalloc(sizeof(struct sysfs_inode_attrs), GFP_KERNEL); -	if (!attrs) -		return NULL; -	iattrs = &attrs->ia_iattr; - -	/* assign default attributes */ -	iattrs->ia_mode = sd->s_mode; -	iattrs->ia_uid = GLOBAL_ROOT_UID; -	iattrs->ia_gid = GLOBAL_ROOT_GID; -	iattrs->ia_atime = iattrs->ia_mtime = iattrs->ia_ctime = CURRENT_TIME; - -	return attrs; -} - -int sysfs_sd_setattr(struct sysfs_dirent *sd, struct iattr *iattr) -{ -	struct sysfs_inode_attrs *sd_attrs; -	struct iattr *iattrs; -	unsigned int ia_valid = iattr->ia_valid; - -	sd_attrs = sd->s_iattr; - -	if (!sd_attrs) { -		/* setting attributes for the first time, allocate now */ -		sd_attrs = sysfs_init_inode_attrs(sd); -		if (!sd_attrs) -			return -ENOMEM; -		sd->s_iattr = sd_attrs; -	} -	/* attributes were changed at least once in past */ -	iattrs = &sd_attrs->ia_iattr; - -	if (ia_valid & ATTR_UID) -		iattrs->ia_uid = iattr->ia_uid; -	if (ia_valid & ATTR_GID) -		iattrs->ia_gid = iattr->ia_gid; -	if (ia_valid & ATTR_ATIME) -		iattrs->ia_atime = iattr->ia_atime; -	if (ia_valid & ATTR_MTIME) -		iattrs->ia_mtime = iattr->ia_mtime; -	if (ia_valid & ATTR_CTIME) -		iattrs->ia_ctime = iattr->ia_ctime; -	if (ia_valid & ATTR_MODE) { -		umode_t mode = iattr->ia_mode; -		iattrs->ia_mode = sd->s_mode = mode; -	} -	return 0; -} - -int sysfs_setattr(struct dentry *dentry, struct iattr *iattr) -{ -	struct inode *inode = dentry->d_inode; -	struct sysfs_dirent *sd = dentry->d_fsdata; -	int error; - -	if (!sd) -		return -EINVAL; - -	mutex_lock(&sysfs_mutex); -	error = inode_change_ok(inode, iattr); -	if (error) -		goto out; - -	error = sysfs_sd_setattr(sd, iattr); -	if (error) -		goto out; - -	/* this ignores size changes */ -	setattr_copy(inode, iattr); - -out: -	mutex_unlock(&sysfs_mutex); -	return error; -} - -static int sysfs_sd_setsecdata(struct sysfs_dirent *sd, void **secdata, -			       u32 *secdata_len) -{ -	struct sysfs_inode_attrs *iattrs; -	void *old_secdata; -	size_t old_secdata_len; - -	if (!sd->s_iattr) { -		sd->s_iattr = sysfs_init_inode_attrs(sd); -		if (!sd->s_iattr) -			return -ENOMEM; -	} - -	iattrs = sd->s_iattr; -	old_secdata = iattrs->ia_secdata; -	old_secdata_len = iattrs->ia_secdata_len; - -	iattrs->ia_secdata = *secdata; -	iattrs->ia_secdata_len = *secdata_len; - -	*secdata = old_secdata; -	*secdata_len = old_secdata_len; -	return 0; -} - -int sysfs_setxattr(struct dentry *dentry, const char *name, const void *value, -		size_t size, int flags) -{ -	struct sysfs_dirent *sd = dentry->d_fsdata; -	void *secdata; -	int error; -	u32 secdata_len = 0; - -	if (!sd) -		return -EINVAL; - -	if (!strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN)) { -		const char *suffix = name + XATTR_SECURITY_PREFIX_LEN; -		error = security_inode_setsecurity(dentry->d_inode, suffix, -						value, size, flags); -		if (error) -			goto out; -		error = security_inode_getsecctx(dentry->d_inode, -						&secdata, &secdata_len); -		if (error) -			goto out; - -		mutex_lock(&sysfs_mutex); -		error = sysfs_sd_setsecdata(sd, &secdata, &secdata_len); -		mutex_unlock(&sysfs_mutex); - -		if (secdata) -			security_release_secctx(secdata, secdata_len); -	} else -		return -EINVAL; -out: -	return error; -} - -static inline void set_default_inode_attr(struct inode *inode, umode_t mode) -{ -	inode->i_mode = mode; -	inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME; -} - -static inline void set_inode_attr(struct inode *inode, struct iattr *iattr) -{ -	inode->i_uid = iattr->ia_uid; -	inode->i_gid = iattr->ia_gid; -	inode->i_atime = iattr->ia_atime; -	inode->i_mtime = iattr->ia_mtime; -	inode->i_ctime = iattr->ia_ctime; -} - -static void sysfs_refresh_inode(struct sysfs_dirent *sd, struct inode *inode) -{ -	struct sysfs_inode_attrs *iattrs = sd->s_iattr; - -	inode->i_mode = sd->s_mode; -	if (iattrs) { -		/* sysfs_dirent has non-default attributes -		 * get them from persistent copy in sysfs_dirent -		 */ -		set_inode_attr(inode, &iattrs->ia_iattr); -		security_inode_notifysecctx(inode, -					    iattrs->ia_secdata, -					    iattrs->ia_secdata_len); -	} - -	if (sysfs_type(sd) == SYSFS_DIR) -		set_nlink(inode, sd->s_dir.subdirs + 2); -} - -int sysfs_getattr(struct vfsmount *mnt, struct dentry *dentry, -		  struct kstat *stat) -{ -	struct sysfs_dirent *sd = dentry->d_fsdata; -	struct inode *inode = dentry->d_inode; - -	mutex_lock(&sysfs_mutex); -	sysfs_refresh_inode(sd, inode); -	mutex_unlock(&sysfs_mutex); - -	generic_fillattr(inode, stat); -	return 0; -} - -static void sysfs_init_inode(struct sysfs_dirent *sd, struct inode *inode) -{ -	struct bin_attribute *bin_attr; - -	inode->i_private = sysfs_get(sd); -	inode->i_mapping->a_ops = &sysfs_aops; -	inode->i_mapping->backing_dev_info = &sysfs_backing_dev_info; -	inode->i_op = &sysfs_inode_operations; - -	set_default_inode_attr(inode, sd->s_mode); -	sysfs_refresh_inode(sd, inode); - -	/* initialize inode according to type */ -	switch (sysfs_type(sd)) { -	case SYSFS_DIR: -		inode->i_op = &sysfs_dir_inode_operations; -		inode->i_fop = &sysfs_dir_operations; -		break; -	case SYSFS_KOBJ_ATTR: -		inode->i_size = PAGE_SIZE; -		inode->i_fop = &sysfs_file_operations; -		break; -	case SYSFS_KOBJ_BIN_ATTR: -		bin_attr = sd->s_attr.bin_attr; -		inode->i_size = bin_attr->size; -		inode->i_fop = &sysfs_bin_operations; -		break; -	case SYSFS_KOBJ_LINK: -		inode->i_op = &sysfs_symlink_inode_operations; -		break; -	default: -		BUG(); -	} - -	unlock_new_inode(inode); -} - -/** - *	sysfs_get_inode - get inode for sysfs_dirent - *	@sb: super block - *	@sd: sysfs_dirent to allocate inode for - * - *	Get inode for @sd.  If such inode doesn't exist, a new inode - *	is allocated and basics are initialized.  New inode is - *	returned locked. - * - *	LOCKING: - *	Kernel thread context (may sleep). - * - *	RETURNS: - *	Pointer to allocated inode on success, NULL on failure. - */ -struct inode *sysfs_get_inode(struct super_block *sb, struct sysfs_dirent *sd) -{ -	struct inode *inode; - -	inode = iget_locked(sb, sd->s_ino); -	if (inode && (inode->i_state & I_NEW)) -		sysfs_init_inode(sd, inode); - -	return inode; -} - -/* - * The sysfs_dirent serves as both an inode and a directory entry for sysfs. - * To prevent the sysfs inode numbers from being freed prematurely we take a - * reference to sysfs_dirent from the sysfs inode.  A - * super_operations.evict_inode() implementation is needed to drop that - * reference upon inode destruction. - */ -void sysfs_evict_inode(struct inode *inode) -{ -	struct sysfs_dirent *sd  = inode->i_private; - -	truncate_inode_pages(&inode->i_data, 0); -	clear_inode(inode); -	sysfs_put(sd); -} - -int sysfs_permission(struct inode *inode, int mask) -{ -	struct sysfs_dirent *sd; - -	if (mask & MAY_NOT_BLOCK) -		return -ECHILD; - -	sd = inode->i_private; - -	mutex_lock(&sysfs_mutex); -	sysfs_refresh_inode(sd, inode); -	mutex_unlock(&sysfs_mutex); - -	return generic_permission(inode, mask); -} diff --git a/fs/sysfs/mount.c b/fs/sysfs/mount.c index 834ec2cdb7a3..6211230814fd 100644 --- a/fs/sysfs/mount.c +++ b/fs/sysfs/mount.c @@ -14,146 +14,41 @@  #include <linux/fs.h>  #include <linux/mount.h> -#include <linux/pagemap.h>  #include <linux/init.h> -#include <linux/module.h> -#include <linux/magic.h> -#include <linux/slab.h>  #include <linux/user_namespace.h>  #include "sysfs.h" - -static struct vfsmount *sysfs_mnt; -struct kmem_cache *sysfs_dir_cachep; - -static const struct super_operations sysfs_ops = { -	.statfs		= simple_statfs, -	.drop_inode	= generic_delete_inode, -	.evict_inode	= sysfs_evict_inode, -}; - -struct sysfs_dirent sysfs_root = { -	.s_name		= "", -	.s_count	= ATOMIC_INIT(1), -	.s_flags	= SYSFS_DIR | (KOBJ_NS_TYPE_NONE << SYSFS_NS_TYPE_SHIFT), -	.s_mode		= S_IFDIR | S_IRUGO | S_IXUGO, -	.s_ino		= 1, -}; - -static int sysfs_fill_super(struct super_block *sb, void *data, int silent) -{ -	struct inode *inode; -	struct dentry *root; - -	sb->s_blocksize = PAGE_CACHE_SIZE; -	sb->s_blocksize_bits = PAGE_CACHE_SHIFT; -	sb->s_magic = SYSFS_MAGIC; -	sb->s_op = &sysfs_ops; -	sb->s_time_gran = 1; - -	/* get root inode, initialize and unlock it */ -	mutex_lock(&sysfs_mutex); -	inode = sysfs_get_inode(sb, &sysfs_root); -	mutex_unlock(&sysfs_mutex); -	if (!inode) { -		pr_debug("sysfs: could not get root inode\n"); -		return -ENOMEM; -	} - -	/* instantiate and link root dentry */ -	root = d_make_root(inode); -	if (!root) { -		pr_debug("%s: could not get root dentry!\n", __func__); -		return -ENOMEM; -	} -	root->d_fsdata = &sysfs_root; -	sb->s_root = root; -	sb->s_d_op = &sysfs_dentry_ops; -	return 0; -} - -static int sysfs_test_super(struct super_block *sb, void *data) -{ -	struct sysfs_super_info *sb_info = sysfs_info(sb); -	struct sysfs_super_info *info = data; -	enum kobj_ns_type type; -	int found = 1; - -	for (type = KOBJ_NS_TYPE_NONE; type < KOBJ_NS_TYPES; type++) { -		if (sb_info->ns[type] != info->ns[type]) -			found = 0; -	} -	return found; -} - -static int sysfs_set_super(struct super_block *sb, void *data) -{ -	int error; -	error = set_anon_super(sb, data); -	if (!error) -		sb->s_fs_info = data; -	return error; -} - -static void free_sysfs_super_info(struct sysfs_super_info *info) -{ -	int type; -	for (type = KOBJ_NS_TYPE_NONE; type < KOBJ_NS_TYPES; type++) -		kobj_ns_drop(type, info->ns[type]); -	kfree(info); -} +static struct kernfs_root *sysfs_root; +struct kernfs_node *sysfs_root_kn;  static struct dentry *sysfs_mount(struct file_system_type *fs_type,  	int flags, const char *dev_name, void *data)  { -	struct sysfs_super_info *info; -	enum kobj_ns_type type; -	struct super_block *sb; -	int error; +	struct dentry *root; +	void *ns;  	if (!(flags & MS_KERNMOUNT)) {  		if (!capable(CAP_SYS_ADMIN) && !fs_fully_visible(fs_type))  			return ERR_PTR(-EPERM); -		for (type = KOBJ_NS_TYPE_NONE; type < KOBJ_NS_TYPES; type++) { -			if (!kobj_ns_current_may_mount(type)) -				return ERR_PTR(-EPERM); -		} -	} - -	info = kzalloc(sizeof(*info), GFP_KERNEL); -	if (!info) -		return ERR_PTR(-ENOMEM); - -	for (type = KOBJ_NS_TYPE_NONE; type < KOBJ_NS_TYPES; type++) -		info->ns[type] = kobj_ns_grab_current(type); - -	sb = sget(fs_type, sysfs_test_super, sysfs_set_super, flags, info); -	if (IS_ERR(sb) || sb->s_fs_info != info) -		free_sysfs_super_info(info); -	if (IS_ERR(sb)) -		return ERR_CAST(sb); -	if (!sb->s_root) { -		error = sysfs_fill_super(sb, data, flags & MS_SILENT ? 1 : 0); -		if (error) { -			deactivate_locked_super(sb); -			return ERR_PTR(error); -		} -		sb->s_flags |= MS_ACTIVE; +		if (!kobj_ns_current_may_mount(KOBJ_NS_TYPE_NET)) +			return ERR_PTR(-EPERM);  	} -	return dget(sb->s_root); +	ns = kobj_ns_grab_current(KOBJ_NS_TYPE_NET); +	root = kernfs_mount_ns(fs_type, flags, sysfs_root, ns); +	if (IS_ERR(root)) +		kobj_ns_drop(KOBJ_NS_TYPE_NET, ns); +	return root;  }  static void sysfs_kill_sb(struct super_block *sb)  { -	struct sysfs_super_info *info = sysfs_info(sb); -	/* Remove the superblock from fs_supers/s_instances -	 * so we can't find it, before freeing sysfs_super_info. -	 */ -	kill_anon_super(sb); -	free_sysfs_super_info(info); +	void *ns = (void *)kernfs_super_ns(sb); + +	kernfs_kill_sb(sb); +	kobj_ns_drop(KOBJ_NS_TYPE_NET, ns);  }  static struct file_system_type sysfs_fs_type = { @@ -165,48 +60,19 @@ static struct file_system_type sysfs_fs_type = {  int __init sysfs_init(void)  { -	int err = -ENOMEM; +	int err; -	sysfs_dir_cachep = kmem_cache_create("sysfs_dir_cache", -					      sizeof(struct sysfs_dirent), -					      0, 0, NULL); -	if (!sysfs_dir_cachep) -		goto out; +	sysfs_root = kernfs_create_root(NULL, NULL); +	if (IS_ERR(sysfs_root)) +		return PTR_ERR(sysfs_root); -	err = sysfs_inode_init(); -	if (err) -		goto out_err; +	sysfs_root_kn = sysfs_root->kn;  	err = register_filesystem(&sysfs_fs_type); -	if (!err) { -		sysfs_mnt = kern_mount(&sysfs_fs_type); -		if (IS_ERR(sysfs_mnt)) { -			printk(KERN_ERR "sysfs: could not mount!\n"); -			err = PTR_ERR(sysfs_mnt); -			sysfs_mnt = NULL; -			unregister_filesystem(&sysfs_fs_type); -			goto out_err; -		} -	} else -		goto out_err; -out: -	return err; -out_err: -	kmem_cache_destroy(sysfs_dir_cachep); -	sysfs_dir_cachep = NULL; -	goto out; -} - -#undef sysfs_get -struct sysfs_dirent *sysfs_get(struct sysfs_dirent *sd) -{ -	return __sysfs_get(sd); -} -EXPORT_SYMBOL_GPL(sysfs_get); +	if (err) { +		kernfs_destroy_root(sysfs_root); +		return err; +	} -#undef sysfs_put -void sysfs_put(struct sysfs_dirent *sd) -{ -	__sysfs_put(sd); +	return 0;  } -EXPORT_SYMBOL_GPL(sysfs_put); diff --git a/fs/sysfs/symlink.c b/fs/sysfs/symlink.c index 3ae3f1bf1a09..aecb15f84557 100644 --- a/fs/sysfs/symlink.c +++ b/fs/sysfs/symlink.c @@ -11,109 +11,73 @@   */  #include <linux/fs.h> -#include <linux/gfp.h> -#include <linux/mount.h>  #include <linux/module.h>  #include <linux/kobject.h> -#include <linux/namei.h>  #include <linux/mutex.h>  #include <linux/security.h>  #include "sysfs.h" -static int sysfs_do_create_link_sd(struct sysfs_dirent *parent_sd, -				   struct kobject *target, +static int sysfs_do_create_link_sd(struct kernfs_node *parent, +				   struct kobject *target_kobj,  				   const char *name, int warn)  { -	struct sysfs_dirent *target_sd = NULL; -	struct sysfs_dirent *sd = NULL; -	struct sysfs_addrm_cxt acxt; -	enum kobj_ns_type ns_type; -	int error; +	struct kernfs_node *kn, *target = NULL; -	BUG_ON(!name || !parent_sd); +	BUG_ON(!name || !parent);  	/* -	 * We don't own @target and it may be removed at any time. +	 * We don't own @target_kobj and it may be removed at any time.  	 * Synchronize using sysfs_symlink_target_lock.  See  	 * sysfs_remove_dir() for details.  	 */  	spin_lock(&sysfs_symlink_target_lock); -	if (target->sd) -		target_sd = sysfs_get(target->sd); +	if (target_kobj->sd) { +		target = target_kobj->sd; +		kernfs_get(target); +	}  	spin_unlock(&sysfs_symlink_target_lock); -	error = -ENOENT; -	if (!target_sd) -		goto out_put; - -	error = -ENOMEM; -	sd = sysfs_new_dirent(name, S_IFLNK|S_IRWXUGO, SYSFS_KOBJ_LINK); -	if (!sd) -		goto out_put; +	if (!target) +		return -ENOENT; -	ns_type = sysfs_ns_type(parent_sd); -	if (ns_type) -		sd->s_ns = target_sd->s_ns; -	sd->s_symlink.target_sd = target_sd; -	target_sd = NULL;	/* reference is now owned by the symlink */ - -	sysfs_addrm_start(&acxt); -	/* Symlinks must be between directories with the same ns_type */ -	if (!ns_type || -	    (ns_type == sysfs_ns_type(sd->s_symlink.target_sd->s_parent))) { -		if (warn) -			error = sysfs_add_one(&acxt, sd, parent_sd); -		else -			error = __sysfs_add_one(&acxt, sd, parent_sd); -	} else { -		error = -EINVAL; -		WARN(1, KERN_WARNING -			"sysfs: symlink across ns_types %s/%s -> %s/%s\n", -			parent_sd->s_name, -			sd->s_name, -			sd->s_symlink.target_sd->s_parent->s_name, -			sd->s_symlink.target_sd->s_name); -	} -	sysfs_addrm_finish(&acxt); +	kn = kernfs_create_link(parent, name, target); +	kernfs_put(target); -	if (error) -		goto out_put; +	if (!IS_ERR(kn)) +		return 0; -	return 0; - - out_put: -	sysfs_put(target_sd); -	sysfs_put(sd); -	return error; +	if (warn && PTR_ERR(kn) == -EEXIST) +		sysfs_warn_dup(parent, name); +	return PTR_ERR(kn);  }  /**   *	sysfs_create_link_sd - create symlink to a given object. - *	@sd:		directory we're creating the link in. + *	@kn:		directory we're creating the link in.   *	@target:	object we're pointing to.   *	@name:		name of the symlink.   */ -int sysfs_create_link_sd(struct sysfs_dirent *sd, struct kobject *target, +int sysfs_create_link_sd(struct kernfs_node *kn, struct kobject *target,  			 const char *name)  { -	return sysfs_do_create_link_sd(sd, target, name, 1); +	return sysfs_do_create_link_sd(kn, target, name, 1);  }  static int sysfs_do_create_link(struct kobject *kobj, struct kobject *target,  				const char *name, int warn)  { -	struct sysfs_dirent *parent_sd = NULL; +	struct kernfs_node *parent = NULL;  	if (!kobj) -		parent_sd = &sysfs_root; +		parent = sysfs_root_kn;  	else -		parent_sd = kobj->sd; +		parent = kobj->sd; -	if (!parent_sd) +	if (!parent)  		return -EFAULT; -	return sysfs_do_create_link_sd(parent_sd, target, name, warn); +	return sysfs_do_create_link_sd(parent, target, name, warn);  }  /** @@ -164,10 +128,10 @@ void sysfs_delete_link(struct kobject *kobj, struct kobject *targ,  	 * sysfs_remove_dir() for details.  	 */  	spin_lock(&sysfs_symlink_target_lock); -	if (targ->sd && sysfs_ns_type(kobj->sd)) -		ns = targ->sd->s_ns; +	if (targ->sd && kernfs_ns_enabled(kobj->sd)) +		ns = targ->sd->ns;  	spin_unlock(&sysfs_symlink_target_lock); -	sysfs_hash_and_remove(kobj->sd, name, ns); +	kernfs_remove_by_name_ns(kobj->sd, name, ns);  }  /** @@ -177,14 +141,14 @@ void sysfs_delete_link(struct kobject *kobj, struct kobject *targ,   */  void sysfs_remove_link(struct kobject *kobj, const char *name)  { -	struct sysfs_dirent *parent_sd = NULL; +	struct kernfs_node *parent = NULL;  	if (!kobj) -		parent_sd = &sysfs_root; +		parent = sysfs_root_kn;  	else -		parent_sd = kobj->sd; +		parent = kobj->sd; -	sysfs_hash_and_remove(parent_sd, name, NULL); +	kernfs_remove_by_name(parent, name);  }  EXPORT_SYMBOL_GPL(sysfs_remove_link); @@ -201,130 +165,33 @@ EXPORT_SYMBOL_GPL(sysfs_remove_link);  int sysfs_rename_link_ns(struct kobject *kobj, struct kobject *targ,  			 const char *old, const char *new, const void *new_ns)  { -	struct sysfs_dirent *parent_sd, *sd = NULL; +	struct kernfs_node *parent, *kn = NULL;  	const void *old_ns = NULL;  	int result;  	if (!kobj) -		parent_sd = &sysfs_root; +		parent = sysfs_root_kn;  	else -		parent_sd = kobj->sd; +		parent = kobj->sd;  	if (targ->sd) -		old_ns = targ->sd->s_ns; +		old_ns = targ->sd->ns;  	result = -ENOENT; -	sd = sysfs_get_dirent_ns(parent_sd, old, old_ns); -	if (!sd) +	kn = kernfs_find_and_get_ns(parent, old, old_ns); +	if (!kn)  		goto out;  	result = -EINVAL; -	if (sysfs_type(sd) != SYSFS_KOBJ_LINK) +	if (kernfs_type(kn) != KERNFS_LINK)  		goto out; -	if (sd->s_symlink.target_sd->s_dir.kobj != targ) +	if (kn->symlink.target_kn->priv != targ)  		goto out; -	result = sysfs_rename(sd, parent_sd, new, new_ns); +	result = kernfs_rename_ns(kn, parent, new, new_ns);  out: -	sysfs_put(sd); +	kernfs_put(kn);  	return result;  }  EXPORT_SYMBOL_GPL(sysfs_rename_link_ns); - -static int sysfs_get_target_path(struct sysfs_dirent *parent_sd, -				 struct sysfs_dirent *target_sd, char *path) -{ -	struct sysfs_dirent *base, *sd; -	char *s = path; -	int len = 0; - -	/* go up to the root, stop at the base */ -	base = parent_sd; -	while (base->s_parent) { -		sd = target_sd->s_parent; -		while (sd->s_parent && base != sd) -			sd = sd->s_parent; - -		if (base == sd) -			break; - -		strcpy(s, "../"); -		s += 3; -		base = base->s_parent; -	} - -	/* determine end of target string for reverse fillup */ -	sd = target_sd; -	while (sd->s_parent && sd != base) { -		len += strlen(sd->s_name) + 1; -		sd = sd->s_parent; -	} - -	/* check limits */ -	if (len < 2) -		return -EINVAL; -	len--; -	if ((s - path) + len > PATH_MAX) -		return -ENAMETOOLONG; - -	/* reverse fillup of target string from target to base */ -	sd = target_sd; -	while (sd->s_parent && sd != base) { -		int slen = strlen(sd->s_name); - -		len -= slen; -		strncpy(s + len, sd->s_name, slen); -		if (len) -			s[--len] = '/'; - -		sd = sd->s_parent; -	} - -	return 0; -} - -static int sysfs_getlink(struct dentry *dentry, char *path) -{ -	struct sysfs_dirent *sd = dentry->d_fsdata; -	struct sysfs_dirent *parent_sd = sd->s_parent; -	struct sysfs_dirent *target_sd = sd->s_symlink.target_sd; -	int error; - -	mutex_lock(&sysfs_mutex); -	error = sysfs_get_target_path(parent_sd, target_sd, path); -	mutex_unlock(&sysfs_mutex); - -	return error; -} - -static void *sysfs_follow_link(struct dentry *dentry, struct nameidata *nd) -{ -	int error = -ENOMEM; -	unsigned long page = get_zeroed_page(GFP_KERNEL); -	if (page) { -		error = sysfs_getlink(dentry, (char *) page); -		if (error < 0) -			free_page((unsigned long)page); -	} -	nd_set_link(nd, error ? ERR_PTR(error) : (char *)page); -	return NULL; -} - -static void sysfs_put_link(struct dentry *dentry, struct nameidata *nd, -			   void *cookie) -{ -	char *page = nd_get_link(nd); -	if (!IS_ERR(page)) -		free_page((unsigned long)page); -} - -const struct inode_operations sysfs_symlink_inode_operations = { -	.setxattr	= sysfs_setxattr, -	.readlink	= generic_readlink, -	.follow_link	= sysfs_follow_link, -	.put_link	= sysfs_put_link, -	.setattr	= sysfs_setattr, -	.getattr	= sysfs_getattr, -	.permission	= sysfs_permission, -}; diff --git a/fs/sysfs/sysfs.h b/fs/sysfs/sysfs.h index 0af09fbfb3f6..0e2f1cccb812 100644 --- a/fs/sysfs/sysfs.h +++ b/fs/sysfs/sysfs.h @@ -8,248 +8,36 @@   * This file is released under the GPLv2.   */ -#include <linux/lockdep.h> -#include <linux/kobject_ns.h> -#include <linux/fs.h> -#include <linux/rbtree.h> +#ifndef __SYSFS_INTERNAL_H +#define __SYSFS_INTERNAL_H -struct sysfs_open_dirent; - -/* type-specific structures for sysfs_dirent->s_* union members */ -struct sysfs_elem_dir { -	struct kobject		*kobj; - -	unsigned long		subdirs; -	/* children rbtree starts here and goes through sd->s_rb */ -	struct rb_root		children; -}; - -struct sysfs_elem_symlink { -	struct sysfs_dirent	*target_sd; -}; - -struct sysfs_elem_attr { -	union { -		struct attribute	*attr; -		struct bin_attribute	*bin_attr; -	}; -	struct sysfs_open_dirent *open; -}; - -struct sysfs_inode_attrs { -	struct iattr	ia_iattr; -	void		*ia_secdata; -	u32		ia_secdata_len; -}; - -/* - * sysfs_dirent - the building block of sysfs hierarchy.  Each and - * every sysfs node is represented by single sysfs_dirent. - * - * As long as s_count reference is held, the sysfs_dirent itself is - * accessible.  Dereferencing s_elem or any other outer entity - * requires s_active reference. - */ -struct sysfs_dirent { -	atomic_t		s_count; -	atomic_t		s_active; -#ifdef CONFIG_DEBUG_LOCK_ALLOC -	struct lockdep_map	dep_map; -#endif -	struct sysfs_dirent	*s_parent; -	const char		*s_name; - -	struct rb_node		s_rb; - -	union { -		struct completion	*completion; -		struct sysfs_dirent	*removed_list; -	} u; - -	const void		*s_ns; /* namespace tag */ -	unsigned int		s_hash; /* ns + name hash */ -	union { -		struct sysfs_elem_dir		s_dir; -		struct sysfs_elem_symlink	s_symlink; -		struct sysfs_elem_attr		s_attr; -	}; - -	unsigned short		s_flags; -	umode_t			s_mode; -	unsigned int		s_ino; -	struct sysfs_inode_attrs *s_iattr; -}; - -#define SD_DEACTIVATED_BIAS		INT_MIN - -#define SYSFS_TYPE_MASK			0x00ff -#define SYSFS_DIR			0x0001 -#define SYSFS_KOBJ_ATTR			0x0002 -#define SYSFS_KOBJ_BIN_ATTR		0x0004 -#define SYSFS_KOBJ_LINK			0x0008 -#define SYSFS_COPY_NAME			(SYSFS_DIR | SYSFS_KOBJ_LINK) -#define SYSFS_ACTIVE_REF		(SYSFS_KOBJ_ATTR | SYSFS_KOBJ_BIN_ATTR) - -/* identify any namespace tag on sysfs_dirents */ -#define SYSFS_NS_TYPE_MASK		0xf00 -#define SYSFS_NS_TYPE_SHIFT		8 - -#define SYSFS_FLAG_MASK			~(SYSFS_NS_TYPE_MASK|SYSFS_TYPE_MASK) -#define SYSFS_FLAG_REMOVED		0x02000 - -static inline unsigned int sysfs_type(struct sysfs_dirent *sd) -{ -	return sd->s_flags & SYSFS_TYPE_MASK; -} - -/* - * Return any namespace tags on this dirent. - * enum kobj_ns_type is defined in linux/kobject.h - */ -static inline enum kobj_ns_type sysfs_ns_type(struct sysfs_dirent *sd) -{ -	return (sd->s_flags & SYSFS_NS_TYPE_MASK) >> SYSFS_NS_TYPE_SHIFT; -} - -#ifdef CONFIG_DEBUG_LOCK_ALLOC - -#define sysfs_dirent_init_lockdep(sd)				\ -do {								\ -	struct attribute *attr = sd->s_attr.attr;		\ -	struct lock_class_key *key = attr->key;			\ -	if (!key)						\ -		key = &attr->skey;				\ -								\ -	lockdep_init_map(&sd->dep_map, "s_active", key, 0);	\ -} while (0) - -/* Test for attributes that want to ignore lockdep for read-locking */ -static inline bool sysfs_ignore_lockdep(struct sysfs_dirent *sd) -{ -	int type = sysfs_type(sd); - -	return (type == SYSFS_KOBJ_ATTR || type == SYSFS_KOBJ_BIN_ATTR) && -		sd->s_attr.attr->ignore_lockdep; -} - -#else - -#define sysfs_dirent_init_lockdep(sd) do {} while (0) - -static inline bool sysfs_ignore_lockdep(struct sysfs_dirent *sd) -{ -	return true; -} - -#endif - -/* - * Context structure to be used while adding/removing nodes. - */ -struct sysfs_addrm_cxt { -	struct sysfs_dirent	*removed; -}; +#include <linux/sysfs.h>  /*   * mount.c   */ - -/* - * Each sb is associated with a set of namespace tags (i.e. - * the network namespace of the task which mounted this sysfs - * instance). - */ -struct sysfs_super_info { -	void *ns[KOBJ_NS_TYPES]; -}; -#define sysfs_info(SB) ((struct sysfs_super_info *)(SB->s_fs_info)) -extern struct sysfs_dirent sysfs_root; -extern struct kmem_cache *sysfs_dir_cachep; +extern struct kernfs_node *sysfs_root_kn;  /*   * dir.c   */ -extern struct mutex sysfs_mutex;  extern spinlock_t sysfs_symlink_target_lock; -extern const struct dentry_operations sysfs_dentry_ops; - -extern const struct file_operations sysfs_dir_operations; -extern const struct inode_operations sysfs_dir_inode_operations; -struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd); -void sysfs_put_active(struct sysfs_dirent *sd); -void sysfs_addrm_start(struct sysfs_addrm_cxt *acxt); -void sysfs_warn_dup(struct sysfs_dirent *parent, const char *name); -int __sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, -		    struct sysfs_dirent *parent_sd); -int sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, -		  struct sysfs_dirent *parent_sd); -void sysfs_remove(struct sysfs_dirent *sd); -int sysfs_hash_and_remove(struct sysfs_dirent *dir_sd, const char *name, -			  const void *ns); -void sysfs_addrm_finish(struct sysfs_addrm_cxt *acxt); - -struct sysfs_dirent *sysfs_find_dirent(struct sysfs_dirent *parent_sd, -				       const unsigned char *name, -				       const void *ns); -struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type); - -void release_sysfs_dirent(struct sysfs_dirent *sd); - -int sysfs_create_subdir(struct kobject *kobj, const char *name, -			struct sysfs_dirent **p_sd); - -int sysfs_rename(struct sysfs_dirent *sd, struct sysfs_dirent *new_parent_sd, -		 const char *new_name, const void *new_ns); - -static inline struct sysfs_dirent *__sysfs_get(struct sysfs_dirent *sd) -{ -	if (sd) { -		WARN_ON(!atomic_read(&sd->s_count)); -		atomic_inc(&sd->s_count); -	} -	return sd; -} -#define sysfs_get(sd) __sysfs_get(sd) - -static inline void __sysfs_put(struct sysfs_dirent *sd) -{ -	if (sd && atomic_dec_and_test(&sd->s_count)) -		release_sysfs_dirent(sd); -} -#define sysfs_put(sd) __sysfs_put(sd) - -/* - * inode.c - */ -struct inode *sysfs_get_inode(struct super_block *sb, struct sysfs_dirent *sd); -void sysfs_evict_inode(struct inode *inode); -int sysfs_sd_setattr(struct sysfs_dirent *sd, struct iattr *iattr); -int sysfs_permission(struct inode *inode, int mask); -int sysfs_setattr(struct dentry *dentry, struct iattr *iattr); -int sysfs_getattr(struct vfsmount *mnt, struct dentry *dentry, -		  struct kstat *stat); -int sysfs_setxattr(struct dentry *dentry, const char *name, const void *value, -		   size_t size, int flags); -int sysfs_inode_init(void); +void sysfs_warn_dup(struct kernfs_node *parent, const char *name);  /*   * file.c   */ -extern const struct file_operations sysfs_file_operations; -extern const struct file_operations sysfs_bin_operations; - -int sysfs_add_file(struct sysfs_dirent *dir_sd, -		   const struct attribute *attr, int type); - -int sysfs_add_file_mode_ns(struct sysfs_dirent *dir_sd, -			   const struct attribute *attr, int type, +int sysfs_add_file(struct kernfs_node *parent, +		   const struct attribute *attr, bool is_bin); +int sysfs_add_file_mode_ns(struct kernfs_node *parent, +			   const struct attribute *attr, bool is_bin,  			   umode_t amode, const void *ns); -void sysfs_unmap_bin_file(struct sysfs_dirent *sd);  /*   * symlink.c   */ -extern const struct inode_operations sysfs_symlink_inode_operations; -int sysfs_create_link_sd(struct sysfs_dirent *sd, struct kobject *target, +int sysfs_create_link_sd(struct kernfs_node *kn, struct kobject *target,  			 const char *name); + +#endif	/* __SYSFS_INTERNAL_H */ |