sysfs: use rb-tree for name lookups
[linux-2.6.git] / fs / sysfs / dir.c
blob3e937da224d44fcceb5a1c6bdb12306b63c7ac9a
1 /*
2 * fs/sysfs/dir.c - sysfs core and dir operation implementation
4 * Copyright (c) 2001-3 Patrick Mochel
5 * Copyright (c) 2007 SUSE Linux Products GmbH
6 * Copyright (c) 2007 Tejun Heo <teheo@suse.de>
8 * This file is released under the GPLv2.
10 * Please see Documentation/filesystems/sysfs.txt for more information.
13 #undef DEBUG
15 #include <linux/fs.h>
16 #include <linux/mount.h>
17 #include <linux/module.h>
18 #include <linux/kobject.h>
19 #include <linux/namei.h>
20 #include <linux/idr.h>
21 #include <linux/completion.h>
22 #include <linux/mutex.h>
23 #include <linux/slab.h>
24 #include <linux/security.h>
25 #include "sysfs.h"
27 DEFINE_MUTEX(sysfs_mutex);
28 DEFINE_SPINLOCK(sysfs_assoc_lock);
30 static DEFINE_SPINLOCK(sysfs_ino_lock);
31 static DEFINE_IDA(sysfs_ino_ida);
33 /**
34 * sysfs_link_sibling - link sysfs_dirent into sibling list
35 * @sd: sysfs_dirent of interest
37 * Link @sd into its sibling list which starts from
38 * sd->s_parent->s_dir.children.
40 * Locking:
41 * mutex_lock(sysfs_mutex)
43 static void sysfs_link_sibling(struct sysfs_dirent *sd)
45 struct sysfs_dirent *parent_sd = sd->s_parent;
46 struct sysfs_dirent **pos;
48 struct rb_node **p;
49 struct rb_node *parent;
51 BUG_ON(sd->s_sibling);
53 if (sysfs_type(sd) == SYSFS_DIR)
54 parent_sd->s_dir.subdirs++;
56 /* Store directory entries in order by ino. This allows
57 * readdir to properly restart without having to add a
58 * cursor into the s_dir.children list.
60 for (pos = &parent_sd->s_dir.children; *pos; pos = &(*pos)->s_sibling) {
61 if (sd->s_ino < (*pos)->s_ino)
62 break;
64 sd->s_sibling = *pos;
65 *pos = sd;
67 p = &parent_sd->s_dir.name_tree.rb_node;
68 parent = NULL;
69 while (*p) {
70 int c;
71 parent = *p;
72 #define node rb_entry(parent, struct sysfs_dirent, name_node)
73 c = strcmp(sd->s_name, node->s_name);
74 if (c < 0) {
75 p = &node->name_node.rb_left;
76 } else {
77 p = &node->name_node.rb_right;
79 #undef node
81 rb_link_node(&sd->name_node, parent, p);
82 rb_insert_color(&sd->name_node, &parent_sd->s_dir.name_tree);
85 /**
86 * sysfs_unlink_sibling - unlink sysfs_dirent from sibling list
87 * @sd: sysfs_dirent of interest
89 * Unlink @sd from its sibling list which starts from
90 * sd->s_parent->s_dir.children.
92 * Locking:
93 * mutex_lock(sysfs_mutex)
95 static void sysfs_unlink_sibling(struct sysfs_dirent *sd)
97 struct sysfs_dirent **pos;
99 if (sysfs_type(sd) == SYSFS_DIR)
100 sd->s_parent->s_dir.subdirs--;
102 for (pos = &sd->s_parent->s_dir.children; *pos;
103 pos = &(*pos)->s_sibling) {
104 if (*pos == sd) {
105 *pos = sd->s_sibling;
106 sd->s_sibling = NULL;
107 break;
111 rb_erase(&sd->name_node, &sd->s_parent->s_dir.name_tree);
115 * sysfs_get_active - get an active reference to sysfs_dirent
116 * @sd: sysfs_dirent to get an active reference to
118 * Get an active reference of @sd. This function is noop if @sd
119 * is NULL.
121 * RETURNS:
122 * Pointer to @sd on success, NULL on failure.
124 struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd)
126 if (unlikely(!sd))
127 return NULL;
129 while (1) {
130 int v, t;
132 v = atomic_read(&sd->s_active);
133 if (unlikely(v < 0))
134 return NULL;
136 t = atomic_cmpxchg(&sd->s_active, v, v + 1);
137 if (likely(t == v)) {
138 rwsem_acquire_read(&sd->dep_map, 0, 1, _RET_IP_);
139 return sd;
141 if (t < 0)
142 return NULL;
144 cpu_relax();
149 * sysfs_put_active - put an active reference to sysfs_dirent
150 * @sd: sysfs_dirent to put an active reference to
152 * Put an active reference to @sd. This function is noop if @sd
153 * is NULL.
155 void sysfs_put_active(struct sysfs_dirent *sd)
157 struct completion *cmpl;
158 int v;
160 if (unlikely(!sd))
161 return;
163 rwsem_release(&sd->dep_map, 1, _RET_IP_);
164 v = atomic_dec_return(&sd->s_active);
165 if (likely(v != SD_DEACTIVATED_BIAS))
166 return;
168 /* atomic_dec_return() is a mb(), we'll always see the updated
169 * sd->s_sibling.
171 cmpl = (void *)sd->s_sibling;
172 complete(cmpl);
176 * sysfs_deactivate - deactivate sysfs_dirent
177 * @sd: sysfs_dirent to deactivate
179 * Deny new active references and drain existing ones.
181 static void sysfs_deactivate(struct sysfs_dirent *sd)
183 DECLARE_COMPLETION_ONSTACK(wait);
184 int v;
186 BUG_ON(sd->s_sibling || !(sd->s_flags & SYSFS_FLAG_REMOVED));
188 if (!(sysfs_type(sd) & SYSFS_ACTIVE_REF))
189 return;
191 sd->s_sibling = (void *)&wait;
193 rwsem_acquire(&sd->dep_map, 0, 0, _RET_IP_);
194 /* atomic_add_return() is a mb(), put_active() will always see
195 * the updated sd->s_sibling.
197 v = atomic_add_return(SD_DEACTIVATED_BIAS, &sd->s_active);
199 if (v != SD_DEACTIVATED_BIAS) {
200 lock_contended(&sd->dep_map, _RET_IP_);
201 wait_for_completion(&wait);
204 sd->s_sibling = NULL;
206 lock_acquired(&sd->dep_map, _RET_IP_);
207 rwsem_release(&sd->dep_map, 1, _RET_IP_);
210 static int sysfs_alloc_ino(ino_t *pino)
212 int ino, rc;
214 retry:
215 spin_lock(&sysfs_ino_lock);
216 rc = ida_get_new_above(&sysfs_ino_ida, 2, &ino);
217 spin_unlock(&sysfs_ino_lock);
219 if (rc == -EAGAIN) {
220 if (ida_pre_get(&sysfs_ino_ida, GFP_KERNEL))
221 goto retry;
222 rc = -ENOMEM;
225 *pino = ino;
226 return rc;
229 static void sysfs_free_ino(ino_t ino)
231 spin_lock(&sysfs_ino_lock);
232 ida_remove(&sysfs_ino_ida, ino);
233 spin_unlock(&sysfs_ino_lock);
236 void release_sysfs_dirent(struct sysfs_dirent * sd)
238 struct sysfs_dirent *parent_sd;
240 repeat:
241 /* Moving/renaming is always done while holding reference.
242 * sd->s_parent won't change beneath us.
244 parent_sd = sd->s_parent;
246 if (sysfs_type(sd) == SYSFS_KOBJ_LINK)
247 sysfs_put(sd->s_symlink.target_sd);
248 if (sysfs_type(sd) & SYSFS_COPY_NAME)
249 kfree(sd->s_name);
250 if (sd->s_iattr && sd->s_iattr->ia_secdata)
251 security_release_secctx(sd->s_iattr->ia_secdata,
252 sd->s_iattr->ia_secdata_len);
253 kfree(sd->s_iattr);
254 sysfs_free_ino(sd->s_ino);
255 kmem_cache_free(sysfs_dir_cachep, sd);
257 sd = parent_sd;
258 if (sd && atomic_dec_and_test(&sd->s_count))
259 goto repeat;
262 static int sysfs_dentry_delete(const struct dentry *dentry)
264 struct sysfs_dirent *sd = dentry->d_fsdata;
265 return !!(sd->s_flags & SYSFS_FLAG_REMOVED);
268 static int sysfs_dentry_revalidate(struct dentry *dentry, struct nameidata *nd)
270 struct sysfs_dirent *sd;
271 int is_dir;
273 if (nd->flags & LOOKUP_RCU)
274 return -ECHILD;
276 sd = dentry->d_fsdata;
277 mutex_lock(&sysfs_mutex);
279 /* The sysfs dirent has been deleted */
280 if (sd->s_flags & SYSFS_FLAG_REMOVED)
281 goto out_bad;
283 /* The sysfs dirent has been moved? */
284 if (dentry->d_parent->d_fsdata != sd->s_parent)
285 goto out_bad;
287 /* The sysfs dirent has been renamed */
288 if (strcmp(dentry->d_name.name, sd->s_name) != 0)
289 goto out_bad;
291 mutex_unlock(&sysfs_mutex);
292 out_valid:
293 return 1;
294 out_bad:
295 /* Remove the dentry from the dcache hashes.
296 * If this is a deleted dentry we use d_drop instead of d_delete
297 * so sysfs doesn't need to cope with negative dentries.
299 * If this is a dentry that has simply been renamed we
300 * use d_drop to remove it from the dcache lookup on its
301 * old parent. If this dentry persists later when a lookup
302 * is performed at its new name the dentry will be readded
303 * to the dcache hashes.
305 is_dir = (sysfs_type(sd) == SYSFS_DIR);
306 mutex_unlock(&sysfs_mutex);
307 if (is_dir) {
308 /* If we have submounts we must allow the vfs caches
309 * to lie about the state of the filesystem to prevent
310 * leaks and other nasty things.
312 if (have_submounts(dentry))
313 goto out_valid;
314 shrink_dcache_parent(dentry);
316 d_drop(dentry);
317 return 0;
320 static void sysfs_dentry_iput(struct dentry *dentry, struct inode *inode)
322 struct sysfs_dirent * sd = dentry->d_fsdata;
324 sysfs_put(sd);
325 iput(inode);
328 static const struct dentry_operations sysfs_dentry_ops = {
329 .d_revalidate = sysfs_dentry_revalidate,
330 .d_delete = sysfs_dentry_delete,
331 .d_iput = sysfs_dentry_iput,
334 struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type)
336 char *dup_name = NULL;
337 struct sysfs_dirent *sd;
339 if (type & SYSFS_COPY_NAME) {
340 name = dup_name = kstrdup(name, GFP_KERNEL);
341 if (!name)
342 return NULL;
345 sd = kmem_cache_zalloc(sysfs_dir_cachep, GFP_KERNEL);
346 if (!sd)
347 goto err_out1;
349 if (sysfs_alloc_ino(&sd->s_ino))
350 goto err_out2;
352 atomic_set(&sd->s_count, 1);
353 atomic_set(&sd->s_active, 0);
355 sd->s_name = name;
356 sd->s_mode = mode;
357 sd->s_flags = type;
359 return sd;
361 err_out2:
362 kmem_cache_free(sysfs_dir_cachep, sd);
363 err_out1:
364 kfree(dup_name);
365 return NULL;
369 * sysfs_addrm_start - prepare for sysfs_dirent add/remove
370 * @acxt: pointer to sysfs_addrm_cxt to be used
371 * @parent_sd: parent sysfs_dirent
373 * This function is called when the caller is about to add or
374 * remove sysfs_dirent under @parent_sd. This function acquires
375 * sysfs_mutex. @acxt is used to keep and pass context to
376 * other addrm functions.
378 * LOCKING:
379 * Kernel thread context (may sleep). sysfs_mutex is locked on
380 * return.
382 void sysfs_addrm_start(struct sysfs_addrm_cxt *acxt,
383 struct sysfs_dirent *parent_sd)
385 memset(acxt, 0, sizeof(*acxt));
386 acxt->parent_sd = parent_sd;
388 mutex_lock(&sysfs_mutex);
392 * __sysfs_add_one - add sysfs_dirent to parent without warning
393 * @acxt: addrm context to use
394 * @sd: sysfs_dirent to be added
396 * Get @acxt->parent_sd and set sd->s_parent to it and increment
397 * nlink of parent inode if @sd is a directory and link into the
398 * children list of the parent.
400 * This function should be called between calls to
401 * sysfs_addrm_start() and sysfs_addrm_finish() and should be
402 * passed the same @acxt as passed to sysfs_addrm_start().
404 * LOCKING:
405 * Determined by sysfs_addrm_start().
407 * RETURNS:
408 * 0 on success, -EEXIST if entry with the given name already
409 * exists.
411 int __sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd)
413 struct sysfs_inode_attrs *ps_iattr;
415 if (sysfs_find_dirent(acxt->parent_sd, sd->s_ns, sd->s_name))
416 return -EEXIST;
418 sd->s_parent = sysfs_get(acxt->parent_sd);
420 sysfs_link_sibling(sd);
422 /* Update timestamps on the parent */
423 ps_iattr = acxt->parent_sd->s_iattr;
424 if (ps_iattr) {
425 struct iattr *ps_iattrs = &ps_iattr->ia_iattr;
426 ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME;
429 return 0;
433 * sysfs_pathname - return full path to sysfs dirent
434 * @sd: sysfs_dirent whose path we want
435 * @path: caller allocated buffer
437 * Gives the name "/" to the sysfs_root entry; any path returned
438 * is relative to wherever sysfs is mounted.
440 * XXX: does no error checking on @path size
442 static char *sysfs_pathname(struct sysfs_dirent *sd, char *path)
444 if (sd->s_parent) {
445 sysfs_pathname(sd->s_parent, path);
446 strcat(path, "/");
448 strcat(path, sd->s_name);
449 return path;
453 * sysfs_add_one - add sysfs_dirent to parent
454 * @acxt: addrm context to use
455 * @sd: sysfs_dirent to be added
457 * Get @acxt->parent_sd and set sd->s_parent to it and increment
458 * nlink of parent inode if @sd is a directory and link into the
459 * children list of the parent.
461 * This function should be called between calls to
462 * sysfs_addrm_start() and sysfs_addrm_finish() and should be
463 * passed the same @acxt as passed to sysfs_addrm_start().
465 * LOCKING:
466 * Determined by sysfs_addrm_start().
468 * RETURNS:
469 * 0 on success, -EEXIST if entry with the given name already
470 * exists.
472 int sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd)
474 int ret;
476 ret = __sysfs_add_one(acxt, sd);
477 if (ret == -EEXIST) {
478 char *path = kzalloc(PATH_MAX, GFP_KERNEL);
479 WARN(1, KERN_WARNING
480 "sysfs: cannot create duplicate filename '%s'\n",
481 (path == NULL) ? sd->s_name :
482 strcat(strcat(sysfs_pathname(acxt->parent_sd, path), "/"),
483 sd->s_name));
484 kfree(path);
487 return ret;
491 * sysfs_remove_one - remove sysfs_dirent from parent
492 * @acxt: addrm context to use
493 * @sd: sysfs_dirent to be removed
495 * Mark @sd removed and drop nlink of parent inode if @sd is a
496 * directory. @sd is unlinked from the children list.
498 * This function should be called between calls to
499 * sysfs_addrm_start() and sysfs_addrm_finish() and should be
500 * passed the same @acxt as passed to sysfs_addrm_start().
502 * LOCKING:
503 * Determined by sysfs_addrm_start().
505 void sysfs_remove_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd)
507 struct sysfs_inode_attrs *ps_iattr;
509 BUG_ON(sd->s_flags & SYSFS_FLAG_REMOVED);
511 sysfs_unlink_sibling(sd);
513 /* Update timestamps on the parent */
514 ps_iattr = acxt->parent_sd->s_iattr;
515 if (ps_iattr) {
516 struct iattr *ps_iattrs = &ps_iattr->ia_iattr;
517 ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME;
520 sd->s_flags |= SYSFS_FLAG_REMOVED;
521 sd->s_sibling = acxt->removed;
522 acxt->removed = sd;
526 * sysfs_addrm_finish - finish up sysfs_dirent add/remove
527 * @acxt: addrm context to finish up
529 * Finish up sysfs_dirent add/remove. Resources acquired by
530 * sysfs_addrm_start() are released and removed sysfs_dirents are
531 * cleaned up.
533 * LOCKING:
534 * sysfs_mutex is released.
536 void sysfs_addrm_finish(struct sysfs_addrm_cxt *acxt)
538 /* release resources acquired by sysfs_addrm_start() */
539 mutex_unlock(&sysfs_mutex);
541 /* kill removed sysfs_dirents */
542 while (acxt->removed) {
543 struct sysfs_dirent *sd = acxt->removed;
545 acxt->removed = sd->s_sibling;
546 sd->s_sibling = NULL;
548 sysfs_deactivate(sd);
549 unmap_bin_file(sd);
550 sysfs_put(sd);
555 * sysfs_find_dirent - find sysfs_dirent with the given name
556 * @parent_sd: sysfs_dirent to search under
557 * @name: name to look for
559 * Look for sysfs_dirent with name @name under @parent_sd.
561 * LOCKING:
562 * mutex_lock(sysfs_mutex)
564 * RETURNS:
565 * Pointer to sysfs_dirent if found, NULL if not.
567 struct sysfs_dirent *sysfs_find_dirent(struct sysfs_dirent *parent_sd,
568 const void *ns,
569 const unsigned char *name)
571 struct rb_node *p = parent_sd->s_dir.name_tree.rb_node;
572 struct sysfs_dirent *found = NULL;
574 while (p) {
575 int c;
576 #define node rb_entry(p, struct sysfs_dirent, name_node)
577 c = strcmp(name, node->s_name);
578 if (c < 0) {
579 p = node->name_node.rb_left;
580 } else if (c > 0) {
581 p = node->name_node.rb_right;
582 } else {
583 found = node;
584 p = node->name_node.rb_left;
586 #undef node
589 if (found && ns) {
590 while (found->s_ns && found->s_ns != ns) {
591 p = rb_next(&found->name_node);
592 if (!p)
593 return NULL;
594 found = rb_entry(p, struct sysfs_dirent, name_node);
595 if (strcmp(name, found->s_name))
596 return NULL;
600 return found;
604 * sysfs_get_dirent - find and get sysfs_dirent with the given name
605 * @parent_sd: sysfs_dirent to search under
606 * @name: name to look for
608 * Look for sysfs_dirent with name @name under @parent_sd and get
609 * it if found.
611 * LOCKING:
612 * Kernel thread context (may sleep). Grabs sysfs_mutex.
614 * RETURNS:
615 * Pointer to sysfs_dirent if found, NULL if not.
617 struct sysfs_dirent *sysfs_get_dirent(struct sysfs_dirent *parent_sd,
618 const void *ns,
619 const unsigned char *name)
621 struct sysfs_dirent *sd;
623 mutex_lock(&sysfs_mutex);
624 sd = sysfs_find_dirent(parent_sd, ns, name);
625 sysfs_get(sd);
626 mutex_unlock(&sysfs_mutex);
628 return sd;
630 EXPORT_SYMBOL_GPL(sysfs_get_dirent);
632 static int create_dir(struct kobject *kobj, struct sysfs_dirent *parent_sd,
633 enum kobj_ns_type type, const void *ns, const char *name,
634 struct sysfs_dirent **p_sd)
636 umode_t mode = S_IFDIR| S_IRWXU | S_IRUGO | S_IXUGO;
637 struct sysfs_addrm_cxt acxt;
638 struct sysfs_dirent *sd;
639 int rc;
641 /* allocate */
642 sd = sysfs_new_dirent(name, mode, SYSFS_DIR);
643 if (!sd)
644 return -ENOMEM;
646 sd->s_flags |= (type << SYSFS_NS_TYPE_SHIFT);
647 sd->s_ns = ns;
648 sd->s_dir.kobj = kobj;
650 /* link in */
651 sysfs_addrm_start(&acxt, parent_sd);
652 rc = sysfs_add_one(&acxt, sd);
653 sysfs_addrm_finish(&acxt);
655 if (rc == 0)
656 *p_sd = sd;
657 else
658 sysfs_put(sd);
660 return rc;
663 int sysfs_create_subdir(struct kobject *kobj, const char *name,
664 struct sysfs_dirent **p_sd)
666 return create_dir(kobj, kobj->sd,
667 KOBJ_NS_TYPE_NONE, NULL, name, p_sd);
671 * sysfs_read_ns_type: return associated ns_type
672 * @kobj: the kobject being queried
674 * Each kobject can be tagged with exactly one namespace type
675 * (i.e. network or user). Return the ns_type associated with
676 * this object if any
678 static enum kobj_ns_type sysfs_read_ns_type(struct kobject *kobj)
680 const struct kobj_ns_type_operations *ops;
681 enum kobj_ns_type type;
683 ops = kobj_child_ns_ops(kobj);
684 if (!ops)
685 return KOBJ_NS_TYPE_NONE;
687 type = ops->type;
688 BUG_ON(type <= KOBJ_NS_TYPE_NONE);
689 BUG_ON(type >= KOBJ_NS_TYPES);
690 BUG_ON(!kobj_ns_type_registered(type));
692 return type;
696 * sysfs_create_dir - create a directory for an object.
697 * @kobj: object we're creating directory for.
699 int sysfs_create_dir(struct kobject * kobj)
701 enum kobj_ns_type type;
702 struct sysfs_dirent *parent_sd, *sd;
703 const void *ns = NULL;
704 int error = 0;
706 BUG_ON(!kobj);
708 if (kobj->parent)
709 parent_sd = kobj->parent->sd;
710 else
711 parent_sd = &sysfs_root;
713 if (sysfs_ns_type(parent_sd))
714 ns = kobj->ktype->namespace(kobj);
715 type = sysfs_read_ns_type(kobj);
717 error = create_dir(kobj, parent_sd, type, ns, kobject_name(kobj), &sd);
718 if (!error)
719 kobj->sd = sd;
720 return error;
723 static struct dentry * sysfs_lookup(struct inode *dir, struct dentry *dentry,
724 struct nameidata *nd)
726 struct dentry *ret = NULL;
727 struct dentry *parent = dentry->d_parent;
728 struct sysfs_dirent *parent_sd = parent->d_fsdata;
729 struct sysfs_dirent *sd;
730 struct inode *inode;
731 enum kobj_ns_type type;
732 const void *ns;
734 mutex_lock(&sysfs_mutex);
736 type = sysfs_ns_type(parent_sd);
737 ns = sysfs_info(dir->i_sb)->ns[type];
739 sd = sysfs_find_dirent(parent_sd, ns, dentry->d_name.name);
741 /* no such entry */
742 if (!sd) {
743 ret = ERR_PTR(-ENOENT);
744 goto out_unlock;
747 /* attach dentry and inode */
748 inode = sysfs_get_inode(dir->i_sb, sd);
749 if (!inode) {
750 ret = ERR_PTR(-ENOMEM);
751 goto out_unlock;
754 /* instantiate and hash dentry */
755 ret = d_find_alias(inode);
756 if (!ret) {
757 d_set_d_op(dentry, &sysfs_dentry_ops);
758 dentry->d_fsdata = sysfs_get(sd);
759 d_add(dentry, inode);
760 } else {
761 d_move(ret, dentry);
762 iput(inode);
765 out_unlock:
766 mutex_unlock(&sysfs_mutex);
767 return ret;
770 const struct inode_operations sysfs_dir_inode_operations = {
771 .lookup = sysfs_lookup,
772 .permission = sysfs_permission,
773 .setattr = sysfs_setattr,
774 .getattr = sysfs_getattr,
775 .setxattr = sysfs_setxattr,
778 static void remove_dir(struct sysfs_dirent *sd)
780 struct sysfs_addrm_cxt acxt;
782 sysfs_addrm_start(&acxt, sd->s_parent);
783 sysfs_remove_one(&acxt, sd);
784 sysfs_addrm_finish(&acxt);
/* Remove the subdirectory entry @sd; thin wrapper around remove_dir(). */
void sysfs_remove_subdir(struct sysfs_dirent *sd)
{
	remove_dir(sd);
}
793 static void __sysfs_remove_dir(struct sysfs_dirent *dir_sd)
795 struct sysfs_addrm_cxt acxt;
796 struct sysfs_dirent **pos;
798 if (!dir_sd)
799 return;
801 pr_debug("sysfs %s: removing dir\n", dir_sd->s_name);
802 sysfs_addrm_start(&acxt, dir_sd);
803 pos = &dir_sd->s_dir.children;
804 while (*pos) {
805 struct sysfs_dirent *sd = *pos;
807 if (sysfs_type(sd) != SYSFS_DIR)
808 sysfs_remove_one(&acxt, sd);
809 else
810 pos = &(*pos)->s_sibling;
812 sysfs_addrm_finish(&acxt);
814 remove_dir(dir_sd);
818 * sysfs_remove_dir - remove an object's directory.
819 * @kobj: object.
821 * The only thing special about this is that we remove any files in
822 * the directory before we remove the directory, and we've inlined
823 * what used to be sysfs_rmdir() below, instead of calling separately.
826 void sysfs_remove_dir(struct kobject * kobj)
828 struct sysfs_dirent *sd = kobj->sd;
830 spin_lock(&sysfs_assoc_lock);
831 kobj->sd = NULL;
832 spin_unlock(&sysfs_assoc_lock);
834 __sysfs_remove_dir(sd);
837 int sysfs_rename(struct sysfs_dirent *sd,
838 struct sysfs_dirent *new_parent_sd, const void *new_ns,
839 const char *new_name)
841 const char *dup_name = NULL;
842 int error;
844 mutex_lock(&sysfs_mutex);
846 error = 0;
847 if ((sd->s_parent == new_parent_sd) && (sd->s_ns == new_ns) &&
848 (strcmp(sd->s_name, new_name) == 0))
849 goto out; /* nothing to rename */
851 error = -EEXIST;
852 if (sysfs_find_dirent(new_parent_sd, new_ns, new_name))
853 goto out;
855 /* rename sysfs_dirent */
856 if (strcmp(sd->s_name, new_name) != 0) {
857 error = -ENOMEM;
858 new_name = dup_name = kstrdup(new_name, GFP_KERNEL);
859 if (!new_name)
860 goto out;
862 dup_name = sd->s_name;
863 sd->s_name = new_name;
866 /* Remove from old parent's list and insert into new parent's list. */
867 if (sd->s_parent != new_parent_sd) {
868 sysfs_unlink_sibling(sd);
869 sysfs_get(new_parent_sd);
870 sysfs_put(sd->s_parent);
871 sd->s_parent = new_parent_sd;
872 sysfs_link_sibling(sd);
874 sd->s_ns = new_ns;
876 error = 0;
877 out:
878 mutex_unlock(&sysfs_mutex);
879 kfree(dup_name);
880 return error;
883 int sysfs_rename_dir(struct kobject *kobj, const char *new_name)
885 struct sysfs_dirent *parent_sd = kobj->sd->s_parent;
886 const void *new_ns = NULL;
888 if (sysfs_ns_type(parent_sd))
889 new_ns = kobj->ktype->namespace(kobj);
891 return sysfs_rename(kobj->sd, parent_sd, new_ns, new_name);
894 int sysfs_move_dir(struct kobject *kobj, struct kobject *new_parent_kobj)
896 struct sysfs_dirent *sd = kobj->sd;
897 struct sysfs_dirent *new_parent_sd;
898 const void *new_ns = NULL;
900 BUG_ON(!sd->s_parent);
901 if (sysfs_ns_type(sd->s_parent))
902 new_ns = kobj->ktype->namespace(kobj);
903 new_parent_sd = new_parent_kobj && new_parent_kobj->sd ?
904 new_parent_kobj->sd : &sysfs_root;
906 return sysfs_rename(sd, new_parent_sd, new_ns, sd->s_name);
909 /* Relationship between s_mode and the DT_xxx types */
910 static inline unsigned char dt_type(struct sysfs_dirent *sd)
912 return (sd->s_mode >> 12) & 15;
915 static int sysfs_dir_release(struct inode *inode, struct file *filp)
917 sysfs_put(filp->private_data);
918 return 0;
921 static struct sysfs_dirent *sysfs_dir_pos(const void *ns,
922 struct sysfs_dirent *parent_sd, ino_t ino, struct sysfs_dirent *pos)
924 if (pos) {
925 int valid = !(pos->s_flags & SYSFS_FLAG_REMOVED) &&
926 pos->s_parent == parent_sd &&
927 ino == pos->s_ino;
928 sysfs_put(pos);
929 if (!valid)
930 pos = NULL;
932 if (!pos && (ino > 1) && (ino < INT_MAX)) {
933 pos = parent_sd->s_dir.children;
934 while (pos && (ino > pos->s_ino))
935 pos = pos->s_sibling;
937 while (pos && pos->s_ns && pos->s_ns != ns)
938 pos = pos->s_sibling;
939 return pos;
942 static struct sysfs_dirent *sysfs_dir_next_pos(const void *ns,
943 struct sysfs_dirent *parent_sd, ino_t ino, struct sysfs_dirent *pos)
945 pos = sysfs_dir_pos(ns, parent_sd, ino, pos);
946 if (pos)
947 pos = pos->s_sibling;
948 while (pos && pos->s_ns && pos->s_ns != ns)
949 pos = pos->s_sibling;
950 return pos;
953 static int sysfs_readdir(struct file * filp, void * dirent, filldir_t filldir)
955 struct dentry *dentry = filp->f_path.dentry;
956 struct sysfs_dirent * parent_sd = dentry->d_fsdata;
957 struct sysfs_dirent *pos = filp->private_data;
958 enum kobj_ns_type type;
959 const void *ns;
960 ino_t ino;
962 type = sysfs_ns_type(parent_sd);
963 ns = sysfs_info(dentry->d_sb)->ns[type];
965 if (filp->f_pos == 0) {
966 ino = parent_sd->s_ino;
967 if (filldir(dirent, ".", 1, filp->f_pos, ino, DT_DIR) == 0)
968 filp->f_pos++;
970 if (filp->f_pos == 1) {
971 if (parent_sd->s_parent)
972 ino = parent_sd->s_parent->s_ino;
973 else
974 ino = parent_sd->s_ino;
975 if (filldir(dirent, "..", 2, filp->f_pos, ino, DT_DIR) == 0)
976 filp->f_pos++;
978 mutex_lock(&sysfs_mutex);
979 for (pos = sysfs_dir_pos(ns, parent_sd, filp->f_pos, pos);
980 pos;
981 pos = sysfs_dir_next_pos(ns, parent_sd, filp->f_pos, pos)) {
982 const char * name;
983 unsigned int type;
984 int len, ret;
986 name = pos->s_name;
987 len = strlen(name);
988 ino = pos->s_ino;
989 type = dt_type(pos);
990 filp->f_pos = ino;
991 filp->private_data = sysfs_get(pos);
993 mutex_unlock(&sysfs_mutex);
994 ret = filldir(dirent, name, len, filp->f_pos, ino, type);
995 mutex_lock(&sysfs_mutex);
996 if (ret < 0)
997 break;
999 mutex_unlock(&sysfs_mutex);
1000 if ((filp->f_pos > 1) && !pos) { /* EOF */
1001 filp->f_pos = INT_MAX;
1002 filp->private_data = NULL;
1004 return 0;
1008 const struct file_operations sysfs_dir_operations = {
1009 .read = generic_read_dir,
1010 .readdir = sysfs_readdir,
1011 .release = sysfs_dir_release,
1012 .llseek = generic_file_llseek,