blob: e565ec096ae997e16369ec7a698d1a43ae1edce3 [file] [log] [blame]
Tejun Heob8441ed2013-11-24 09:54:58 -05001/*
2 * fs/kernfs/dir.c - kernfs directory implementation
3 *
4 * Copyright (c) 2001-3 Patrick Mochel
5 * Copyright (c) 2007 SUSE Linux Products GmbH
6 * Copyright (c) 2007, 2013 Tejun Heo <tj@kernel.org>
7 *
8 * This file is released under the GPLv2.
9 */
Tejun Heofd7b9f72013-11-28 14:54:33 -050010
Tejun Heoea1c4722014-01-10 08:57:19 -050011#include <linux/sched.h>
Tejun Heofd7b9f72013-11-28 14:54:33 -050012#include <linux/fs.h>
13#include <linux/namei.h>
14#include <linux/idr.h>
15#include <linux/slab.h>
16#include <linux/security.h>
17#include <linux/hash.h>
18
19#include "kernfs-internal.h"
20
/*
 * Global mutex of this file.  The sibling-rbtree helpers below document
 * that they must be called with it held.
 */
DEFINE_MUTEX(kernfs_mutex);

/* Turn a pointer to the ->rb member embedded in a kernfs_node into the node. */
#define rb_to_kn(rbnode) rb_entry((rbnode), struct kernfs_node, rb)
Tejun Heofd7b9f72013-11-28 14:54:33 -050024
/*
 * Tell whether lockdep annotations should be applied to @kn.  Without
 * CONFIG_DEBUG_LOCK_ALLOC the answer is always false; otherwise it is
 * whether KERNFS_LOCKDEP is set in @kn->flags.
 */
static bool kernfs_lockdep(struct kernfs_node *kn)
{
#ifndef CONFIG_DEBUG_LOCK_ALLOC
	return false;
#else
	return kn->flags & KERNFS_LOCKDEP;
#endif
}
33
/**
 *	kernfs_name_hash
 *	@name: Null terminated string to hash
 *	@ns:   Namespace tag to hash
 *
 *	Returns 31 bit hash of ns + name (so it fits in an off_t ).
 *
 *	The values 0, 1 and INT_MAX are reserved and never returned: a
 *	computed hash of 0 or 1 is shifted up by two and a computed hash of
 *	INT_MAX is clamped to INT_MAX - 1.
 */
static unsigned int kernfs_name_hash(const char *name, const void *ns)
{
	unsigned long hash = init_name_hash();
	unsigned int len = strlen(name);

	while (len--)
		hash = partial_name_hash(*name++, hash);

	/* fold the namespace tag in and trim the result to 31 bits */
	hash = (end_name_hash(hash) ^ hash_ptr((void *)ns, 31));
	hash &= 0x7fffffffU;

	/* Reserve hash numbers 0, 1 and INT_MAX for magic directory entries */
	if (hash < 2)
		hash += 2;
	if (hash >= INT_MAX)
		hash = INT_MAX - 1;
	return hash;
}
56
Tejun Heoc637b8a2013-12-11 14:11:58 -050057static int kernfs_name_compare(unsigned int hash, const char *name,
58 const void *ns, const struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -050059{
Tejun Heoadc5e8b2013-12-11 14:11:54 -050060 if (hash != kn->hash)
61 return hash - kn->hash;
62 if (ns != kn->ns)
63 return ns - kn->ns;
64 return strcmp(name, kn->name);
Tejun Heofd7b9f72013-11-28 14:54:33 -050065}
66
Tejun Heoc637b8a2013-12-11 14:11:58 -050067static int kernfs_sd_compare(const struct kernfs_node *left,
68 const struct kernfs_node *right)
Tejun Heofd7b9f72013-11-28 14:54:33 -050069{
Tejun Heoc637b8a2013-12-11 14:11:58 -050070 return kernfs_name_compare(left->hash, left->name, left->ns, right);
Tejun Heofd7b9f72013-11-28 14:54:33 -050071}
72
73/**
Tejun Heoc637b8a2013-12-11 14:11:58 -050074 * kernfs_link_sibling - link kernfs_node into sibling rbtree
Tejun Heo324a56e2013-12-11 14:11:53 -050075 * @kn: kernfs_node of interest
Tejun Heofd7b9f72013-11-28 14:54:33 -050076 *
Tejun Heo324a56e2013-12-11 14:11:53 -050077 * Link @kn into its sibling rbtree which starts from
Tejun Heoadc5e8b2013-12-11 14:11:54 -050078 * @kn->parent->dir.children.
Tejun Heofd7b9f72013-11-28 14:54:33 -050079 *
80 * Locking:
Tejun Heoa797bfc2013-12-11 14:11:57 -050081 * mutex_lock(kernfs_mutex)
Tejun Heofd7b9f72013-11-28 14:54:33 -050082 *
83 * RETURNS:
84 * 0 on susccess -EEXIST on failure.
85 */
Tejun Heoc637b8a2013-12-11 14:11:58 -050086static int kernfs_link_sibling(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -050087{
Tejun Heoadc5e8b2013-12-11 14:11:54 -050088 struct rb_node **node = &kn->parent->dir.children.rb_node;
Tejun Heofd7b9f72013-11-28 14:54:33 -050089 struct rb_node *parent = NULL;
90
Tejun Heodf23fc32013-12-11 14:11:56 -050091 if (kernfs_type(kn) == KERNFS_DIR)
Tejun Heoadc5e8b2013-12-11 14:11:54 -050092 kn->parent->dir.subdirs++;
Tejun Heofd7b9f72013-11-28 14:54:33 -050093
94 while (*node) {
Tejun Heo324a56e2013-12-11 14:11:53 -050095 struct kernfs_node *pos;
Tejun Heofd7b9f72013-11-28 14:54:33 -050096 int result;
97
Tejun Heo324a56e2013-12-11 14:11:53 -050098 pos = rb_to_kn(*node);
Tejun Heofd7b9f72013-11-28 14:54:33 -050099 parent = *node;
Tejun Heoc637b8a2013-12-11 14:11:58 -0500100 result = kernfs_sd_compare(kn, pos);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500101 if (result < 0)
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500102 node = &pos->rb.rb_left;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500103 else if (result > 0)
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500104 node = &pos->rb.rb_right;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500105 else
106 return -EEXIST;
107 }
108 /* add new node and rebalance the tree */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500109 rb_link_node(&kn->rb, parent, node);
110 rb_insert_color(&kn->rb, &kn->parent->dir.children);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500111 return 0;
112}
113
114/**
Tejun Heoc637b8a2013-12-11 14:11:58 -0500115 * kernfs_unlink_sibling - unlink kernfs_node from sibling rbtree
Tejun Heo324a56e2013-12-11 14:11:53 -0500116 * @kn: kernfs_node of interest
Tejun Heofd7b9f72013-11-28 14:54:33 -0500117 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500118 * Unlink @kn from its sibling rbtree which starts from
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500119 * kn->parent->dir.children.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500120 *
121 * Locking:
Tejun Heoa797bfc2013-12-11 14:11:57 -0500122 * mutex_lock(kernfs_mutex)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500123 */
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800124static void kernfs_unlink_sibling(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500125{
Tejun Heodf23fc32013-12-11 14:11:56 -0500126 if (kernfs_type(kn) == KERNFS_DIR)
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500127 kn->parent->dir.subdirs--;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500128
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500129 rb_erase(&kn->rb, &kn->parent->dir.children);
Tejun Heoae343722014-01-10 08:57:21 -0500130 RB_CLEAR_NODE(&kn->rb);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500131}
132
133/**
Tejun Heoc637b8a2013-12-11 14:11:58 -0500134 * kernfs_get_active - get an active reference to kernfs_node
Tejun Heo324a56e2013-12-11 14:11:53 -0500135 * @kn: kernfs_node to get an active reference to
Tejun Heofd7b9f72013-11-28 14:54:33 -0500136 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500137 * Get an active reference of @kn. This function is noop if @kn
Tejun Heofd7b9f72013-11-28 14:54:33 -0500138 * is NULL.
139 *
140 * RETURNS:
Tejun Heo324a56e2013-12-11 14:11:53 -0500141 * Pointer to @kn on success, NULL on failure.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500142 */
Tejun Heoc637b8a2013-12-11 14:11:58 -0500143struct kernfs_node *kernfs_get_active(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500144{
Tejun Heo324a56e2013-12-11 14:11:53 -0500145 if (unlikely(!kn))
Tejun Heofd7b9f72013-11-28 14:54:33 -0500146 return NULL;
147
Greg Kroah-Hartmanf4b3e632014-01-13 14:13:39 -0800148 if (!atomic_inc_unless_negative(&kn->active))
149 return NULL;
150
Tejun Heoa69d0012014-01-10 08:57:20 -0500151 if (kernfs_lockdep(kn))
Tejun Heo324a56e2013-12-11 14:11:53 -0500152 rwsem_acquire_read(&kn->dep_map, 0, 1, _RET_IP_);
Greg Kroah-Hartmanf4b3e632014-01-13 14:13:39 -0800153 return kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500154}
155
156/**
Tejun Heoc637b8a2013-12-11 14:11:58 -0500157 * kernfs_put_active - put an active reference to kernfs_node
Tejun Heo324a56e2013-12-11 14:11:53 -0500158 * @kn: kernfs_node to put an active reference to
Tejun Heofd7b9f72013-11-28 14:54:33 -0500159 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500160 * Put an active reference to @kn. This function is noop if @kn
Tejun Heofd7b9f72013-11-28 14:54:33 -0500161 * is NULL.
162 */
Tejun Heoc637b8a2013-12-11 14:11:58 -0500163void kernfs_put_active(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500164{
Tejun Heoea1c4722014-01-10 08:57:19 -0500165 struct kernfs_root *root = kernfs_root(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500166 int v;
167
Tejun Heo324a56e2013-12-11 14:11:53 -0500168 if (unlikely(!kn))
Tejun Heofd7b9f72013-11-28 14:54:33 -0500169 return;
170
Tejun Heoa69d0012014-01-10 08:57:20 -0500171 if (kernfs_lockdep(kn))
Tejun Heo324a56e2013-12-11 14:11:53 -0500172 rwsem_release(&kn->dep_map, 1, _RET_IP_);
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500173 v = atomic_dec_return(&kn->active);
Tejun Heodf23fc32013-12-11 14:11:56 -0500174 if (likely(v != KN_DEACTIVATED_BIAS))
Tejun Heofd7b9f72013-11-28 14:54:33 -0500175 return;
176
Tejun Heoea1c4722014-01-10 08:57:19 -0500177 wake_up_all(&root->deactivate_waitq);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500178}
179
180/**
Tejun Heoae343722014-01-10 08:57:21 -0500181 * kernfs_drain - drain kernfs_node
182 * @kn: kernfs_node to drain
Tejun Heofd7b9f72013-11-28 14:54:33 -0500183 *
Tejun Heo45a140e2014-01-10 08:57:22 -0500184 * Drain existing usages of @kn. Mutiple removers may invoke this function
185 * concurrently on @kn and all will return after draining is complete.
186 * Returns %true if drain is performed and kernfs_mutex was temporarily
187 * released. %false if @kn was already drained and no operation was
188 * necessary.
189 *
190 * The caller is responsible for ensuring @kn stays pinned while this
191 * function is in progress even if it gets removed by someone else.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500192 */
Tejun Heo45a140e2014-01-10 08:57:22 -0500193static bool kernfs_drain(struct kernfs_node *kn)
194 __releases(&kernfs_mutex) __acquires(&kernfs_mutex)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500195{
Tejun Heoea1c4722014-01-10 08:57:19 -0500196 struct kernfs_root *root = kernfs_root(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500197
Tejun Heo45a140e2014-01-10 08:57:22 -0500198 lockdep_assert_held(&kernfs_mutex);
Tejun Heoae343722014-01-10 08:57:21 -0500199 WARN_ON_ONCE(atomic_read(&kn->active) >= 0);
Tejun Heoea1c4722014-01-10 08:57:19 -0500200
Tejun Heo45a140e2014-01-10 08:57:22 -0500201 /*
202 * We want to go through the active ref lockdep annotation at least
203 * once for all node removals, but the lockdep annotation can't be
204 * nested inside kernfs_mutex and deactivation can't make forward
205 * progress if we keep dropping the mutex. Use JUST_ACTIVATED to
206 * force the slow path once for each deactivation if lockdep is
207 * enabled.
208 */
209 if ((!kernfs_lockdep(kn) || !(kn->flags & KERNFS_JUST_DEACTIVATED)) &&
210 atomic_read(&kn->active) == KN_DEACTIVATED_BIAS)
211 return false;
212
213 kn->flags &= ~KERNFS_JUST_DEACTIVATED;
214 mutex_unlock(&kernfs_mutex);
215
Tejun Heoa69d0012014-01-10 08:57:20 -0500216 if (kernfs_lockdep(kn)) {
217 rwsem_acquire(&kn->dep_map, 0, 0, _RET_IP_);
218 if (atomic_read(&kn->active) != KN_DEACTIVATED_BIAS)
219 lock_contended(&kn->dep_map, _RET_IP_);
220 }
Tejun Heoea1c4722014-01-10 08:57:19 -0500221
222 wait_event(root->deactivate_waitq,
223 atomic_read(&kn->active) == KN_DEACTIVATED_BIAS);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500224
Tejun Heoa69d0012014-01-10 08:57:20 -0500225 if (kernfs_lockdep(kn)) {
226 lock_acquired(&kn->dep_map, _RET_IP_);
227 rwsem_release(&kn->dep_map, 1, _RET_IP_);
228 }
Tejun Heo45a140e2014-01-10 08:57:22 -0500229
230 mutex_lock(&kernfs_mutex);
231 return true;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500232}
233
Tejun Heofd7b9f72013-11-28 14:54:33 -0500234/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500235 * kernfs_get - get a reference count on a kernfs_node
236 * @kn: the target kernfs_node
Tejun Heofd7b9f72013-11-28 14:54:33 -0500237 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500238void kernfs_get(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500239{
Tejun Heo324a56e2013-12-11 14:11:53 -0500240 if (kn) {
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500241 WARN_ON(!atomic_read(&kn->count));
242 atomic_inc(&kn->count);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500243 }
244}
245EXPORT_SYMBOL_GPL(kernfs_get);
246
247/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500248 * kernfs_put - put a reference count on a kernfs_node
249 * @kn: the target kernfs_node
Tejun Heofd7b9f72013-11-28 14:54:33 -0500250 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500251 * Put a reference count of @kn and destroy it if it reached zero.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500252 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500253void kernfs_put(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500254{
Tejun Heo324a56e2013-12-11 14:11:53 -0500255 struct kernfs_node *parent;
Tejun Heoba7443b2013-11-28 14:54:40 -0500256 struct kernfs_root *root;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500257
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500258 if (!kn || !atomic_dec_and_test(&kn->count))
Tejun Heofd7b9f72013-11-28 14:54:33 -0500259 return;
Tejun Heo324a56e2013-12-11 14:11:53 -0500260 root = kernfs_root(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500261 repeat:
Tejun Heoae343722014-01-10 08:57:21 -0500262 /*
263 * Moving/renaming is always done while holding reference.
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500264 * kn->parent won't change beneath us.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500265 */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500266 parent = kn->parent;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500267
Tejun Heoae343722014-01-10 08:57:21 -0500268 WARN_ONCE(atomic_read(&kn->active) != KN_DEACTIVATED_BIAS,
269 "kernfs_put: %s/%s: released with incorrect active_ref %d\n",
270 parent ? parent->name : "", kn->name, atomic_read(&kn->active));
Tejun Heofd7b9f72013-11-28 14:54:33 -0500271
Tejun Heodf23fc32013-12-11 14:11:56 -0500272 if (kernfs_type(kn) == KERNFS_LINK)
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500273 kernfs_put(kn->symlink.target_kn);
Tejun Heo2063d602013-12-11 16:02:57 -0500274 if (!(kn->flags & KERNFS_STATIC_NAME))
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500275 kfree(kn->name);
276 if (kn->iattr) {
277 if (kn->iattr->ia_secdata)
278 security_release_secctx(kn->iattr->ia_secdata,
279 kn->iattr->ia_secdata_len);
280 simple_xattrs_free(&kn->iattr->xattrs);
Tejun Heo23223922013-11-23 17:40:02 -0500281 }
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500282 kfree(kn->iattr);
283 ida_simple_remove(&root->ino_ida, kn->ino);
Tejun Heoa797bfc2013-12-11 14:11:57 -0500284 kmem_cache_free(kernfs_node_cache, kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500285
Tejun Heo324a56e2013-12-11 14:11:53 -0500286 kn = parent;
287 if (kn) {
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500288 if (atomic_dec_and_test(&kn->count))
Tejun Heoba7443b2013-11-28 14:54:40 -0500289 goto repeat;
290 } else {
Tejun Heo324a56e2013-12-11 14:11:53 -0500291 /* just released the root kn, free @root too */
Tejun Heobc755552013-11-28 14:54:41 -0500292 ida_destroy(&root->ino_ida);
Tejun Heoba7443b2013-11-28 14:54:40 -0500293 kfree(root);
294 }
Tejun Heofd7b9f72013-11-28 14:54:33 -0500295}
296EXPORT_SYMBOL_GPL(kernfs_put);
297
Tejun Heoc637b8a2013-12-11 14:11:58 -0500298static int kernfs_dop_revalidate(struct dentry *dentry, unsigned int flags)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500299{
Tejun Heo324a56e2013-12-11 14:11:53 -0500300 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500301
302 if (flags & LOOKUP_RCU)
303 return -ECHILD;
304
Tejun Heo19bbb922013-12-11 16:02:59 -0500305 /* Always perform fresh lookup for negatives */
306 if (!dentry->d_inode)
307 goto out_bad_unlocked;
308
Tejun Heo324a56e2013-12-11 14:11:53 -0500309 kn = dentry->d_fsdata;
Tejun Heoa797bfc2013-12-11 14:11:57 -0500310 mutex_lock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500311
Tejun Heoae343722014-01-10 08:57:21 -0500312 /* Force fresh lookup if removed */
313 if (kn->parent && RB_EMPTY_NODE(&kn->rb))
Tejun Heofd7b9f72013-11-28 14:54:33 -0500314 goto out_bad;
315
Tejun Heoc637b8a2013-12-11 14:11:58 -0500316 /* The kernfs node has been moved? */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500317 if (dentry->d_parent->d_fsdata != kn->parent)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500318 goto out_bad;
319
Tejun Heoc637b8a2013-12-11 14:11:58 -0500320 /* The kernfs node has been renamed */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500321 if (strcmp(dentry->d_name.name, kn->name) != 0)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500322 goto out_bad;
323
Tejun Heoc637b8a2013-12-11 14:11:58 -0500324 /* The kernfs node has been moved to a different namespace */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500325 if (kn->parent && kernfs_ns_enabled(kn->parent) &&
Tejun Heoc525aad2013-12-11 14:11:55 -0500326 kernfs_info(dentry->d_sb)->ns != kn->ns)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500327 goto out_bad;
328
Tejun Heoa797bfc2013-12-11 14:11:57 -0500329 mutex_unlock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500330out_valid:
331 return 1;
332out_bad:
Tejun Heoa797bfc2013-12-11 14:11:57 -0500333 mutex_unlock(&kernfs_mutex);
Tejun Heo19bbb922013-12-11 16:02:59 -0500334out_bad_unlocked:
335 /*
336 * @dentry doesn't match the underlying kernfs node, drop the
337 * dentry and force lookup. If we have submounts we must allow the
338 * vfs caches to lie about the state of the filesystem to prevent
339 * leaks and other nasty things, so use check_submounts_and_drop()
340 * instead of d_drop().
Tejun Heofd7b9f72013-11-28 14:54:33 -0500341 */
342 if (check_submounts_and_drop(dentry) != 0)
343 goto out_valid;
344
345 return 0;
346}
347
Tejun Heoc637b8a2013-12-11 14:11:58 -0500348static void kernfs_dop_release(struct dentry *dentry)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500349{
350 kernfs_put(dentry->d_fsdata);
351}
352
Tejun Heoa797bfc2013-12-11 14:11:57 -0500353const struct dentry_operations kernfs_dops = {
Tejun Heoc637b8a2013-12-11 14:11:58 -0500354 .d_revalidate = kernfs_dop_revalidate,
Tejun Heoc637b8a2013-12-11 14:11:58 -0500355 .d_release = kernfs_dop_release,
Tejun Heofd7b9f72013-11-28 14:54:33 -0500356};
357
Tejun Heoc637b8a2013-12-11 14:11:58 -0500358struct kernfs_node *kernfs_new_node(struct kernfs_root *root, const char *name,
Tejun Heo2063d602013-12-11 16:02:57 -0500359 umode_t mode, unsigned flags)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500360{
361 char *dup_name = NULL;
Tejun Heo324a56e2013-12-11 14:11:53 -0500362 struct kernfs_node *kn;
Tejun Heobc755552013-11-28 14:54:41 -0500363 int ret;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500364
Tejun Heo2063d602013-12-11 16:02:57 -0500365 if (!(flags & KERNFS_STATIC_NAME)) {
Tejun Heofd7b9f72013-11-28 14:54:33 -0500366 name = dup_name = kstrdup(name, GFP_KERNEL);
367 if (!name)
368 return NULL;
369 }
370
Tejun Heoa797bfc2013-12-11 14:11:57 -0500371 kn = kmem_cache_zalloc(kernfs_node_cache, GFP_KERNEL);
Tejun Heo324a56e2013-12-11 14:11:53 -0500372 if (!kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500373 goto err_out1;
374
Tejun Heobc755552013-11-28 14:54:41 -0500375 ret = ida_simple_get(&root->ino_ida, 1, 0, GFP_KERNEL);
376 if (ret < 0)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500377 goto err_out2;
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500378 kn->ino = ret;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500379
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500380 atomic_set(&kn->count, 1);
Tejun Heoae343722014-01-10 08:57:21 -0500381 atomic_set(&kn->active, KN_DEACTIVATED_BIAS);
382 RB_CLEAR_NODE(&kn->rb);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500383
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500384 kn->name = name;
385 kn->mode = mode;
Tejun Heoae343722014-01-10 08:57:21 -0500386 kn->flags = flags;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500387
Tejun Heo324a56e2013-12-11 14:11:53 -0500388 return kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500389
390 err_out2:
Tejun Heoa797bfc2013-12-11 14:11:57 -0500391 kmem_cache_free(kernfs_node_cache, kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500392 err_out1:
393 kfree(dup_name);
394 return NULL;
395}
396
397/**
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800398 * kernfs_addrm_start - prepare for kernfs_node add/remove
399 * @acxt: pointer to kernfs_addrm_cxt to be used
400 *
401 * This function is called when the caller is about to add or remove
402 * kernfs_node. This function acquires kernfs_mutex. @acxt is used
403 * to keep and pass context to other addrm functions.
404 *
405 * LOCKING:
406 * Kernel thread context (may sleep). kernfs_mutex is locked on
407 * return.
408 */
409void kernfs_addrm_start(struct kernfs_addrm_cxt *acxt)
410 __acquires(kernfs_mutex)
411{
412 memset(acxt, 0, sizeof(*acxt));
413
414 mutex_lock(&kernfs_mutex);
415}
416
417/**
Tejun Heoc637b8a2013-12-11 14:11:58 -0500418 * kernfs_add_one - add kernfs_node to parent without warning
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800419 * @acxt: addrm context to use
Tejun Heo324a56e2013-12-11 14:11:53 -0500420 * @kn: kernfs_node to be added
421 * @parent: the parent kernfs_node to add @kn to
Tejun Heofd7b9f72013-11-28 14:54:33 -0500422 *
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500423 * Get @parent and set @kn->parent to it and increment nlink of the
424 * parent inode if @kn is a directory and link into the children list
425 * of the parent.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500426 *
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800427 * This function should be called between calls to
428 * kernfs_addrm_start() and kernfs_addrm_finish() and should be passed
429 * the same @acxt as passed to kernfs_addrm_start().
430 *
431 * LOCKING:
432 * Determined by kernfs_addrm_start().
433 *
Tejun Heofd7b9f72013-11-28 14:54:33 -0500434 * RETURNS:
435 * 0 on success, -EEXIST if entry with the given name already
436 * exists.
437 */
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800438int kernfs_add_one(struct kernfs_addrm_cxt *acxt, struct kernfs_node *kn,
439 struct kernfs_node *parent)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500440{
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800441 bool has_ns = kernfs_ns_enabled(parent);
Tejun Heoc525aad2013-12-11 14:11:55 -0500442 struct kernfs_iattrs *ps_iattr;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500443 int ret;
444
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800445 WARN_ON_ONCE(atomic_read(&parent->active) < 0);
Tejun Heoae343722014-01-10 08:57:21 -0500446
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800447 if (has_ns != (bool)kn->ns) {
448 WARN(1, KERN_WARNING "kernfs: ns %s in '%s' for '%s'\n",
449 has_ns ? "required" : "invalid", parent->name, kn->name);
450 return -EINVAL;
451 }
Tejun Heofd7b9f72013-11-28 14:54:33 -0500452
Tejun Heodf23fc32013-12-11 14:11:56 -0500453 if (kernfs_type(parent) != KERNFS_DIR)
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800454 return -EINVAL;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500455
Tejun Heoc637b8a2013-12-11 14:11:58 -0500456 kn->hash = kernfs_name_hash(kn->name, kn->ns);
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500457 kn->parent = parent;
Tejun Heo324a56e2013-12-11 14:11:53 -0500458 kernfs_get(parent);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500459
Tejun Heoc637b8a2013-12-11 14:11:58 -0500460 ret = kernfs_link_sibling(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500461 if (ret)
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800462 return ret;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500463
464 /* Update timestamps on the parent */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500465 ps_iattr = parent->iattr;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500466 if (ps_iattr) {
467 struct iattr *ps_iattrs = &ps_iattr->ia_iattr;
468 ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME;
469 }
470
471 /* Mark the entry added into directory tree */
Tejun Heoae343722014-01-10 08:57:21 -0500472 atomic_sub(KN_DEACTIVATED_BIAS, &kn->active);
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800473 return 0;
474}
475
476/**
477 * kernfs_addrm_finish - finish up kernfs_node add/remove
478 * @acxt: addrm context to finish up
479 *
480 * Finish up kernfs_node add/remove. Resources acquired by
481 * kernfs_addrm_start() are released and removed kernfs_nodes are
482 * cleaned up.
483 *
484 * LOCKING:
485 * kernfs_mutex is released.
486 */
487void kernfs_addrm_finish(struct kernfs_addrm_cxt *acxt)
488 __releases(kernfs_mutex)
489{
490 /* release resources acquired by kernfs_addrm_start() */
Tejun Heoa797bfc2013-12-11 14:11:57 -0500491 mutex_unlock(&kernfs_mutex);
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800492
493 /* kill removed kernfs_nodes */
494 while (acxt->removed) {
495 struct kernfs_node *kn = acxt->removed;
496
497 acxt->removed = kn->u.removed_list;
498
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800499 kernfs_unmap_bin_file(kn);
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800500 kernfs_put(kn);
501 }
Tejun Heofd7b9f72013-11-28 14:54:33 -0500502}
503
504/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500505 * kernfs_find_ns - find kernfs_node with the given name
506 * @parent: kernfs_node to search under
Tejun Heofd7b9f72013-11-28 14:54:33 -0500507 * @name: name to look for
508 * @ns: the namespace tag to use
509 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500510 * Look for kernfs_node with name @name under @parent. Returns pointer to
511 * the found kernfs_node on success, %NULL on failure.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500512 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500513static struct kernfs_node *kernfs_find_ns(struct kernfs_node *parent,
514 const unsigned char *name,
515 const void *ns)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500516{
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500517 struct rb_node *node = parent->dir.children.rb_node;
Tejun Heoac9bba02013-11-29 17:19:09 -0500518 bool has_ns = kernfs_ns_enabled(parent);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500519 unsigned int hash;
520
Tejun Heoa797bfc2013-12-11 14:11:57 -0500521 lockdep_assert_held(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500522
523 if (has_ns != (bool)ns) {
Tejun Heoc637b8a2013-12-11 14:11:58 -0500524 WARN(1, KERN_WARNING "kernfs: ns %s in '%s' for '%s'\n",
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500525 has_ns ? "required" : "invalid", parent->name, name);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500526 return NULL;
527 }
528
Tejun Heoc637b8a2013-12-11 14:11:58 -0500529 hash = kernfs_name_hash(name, ns);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500530 while (node) {
Tejun Heo324a56e2013-12-11 14:11:53 -0500531 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500532 int result;
533
Tejun Heo324a56e2013-12-11 14:11:53 -0500534 kn = rb_to_kn(node);
Tejun Heoc637b8a2013-12-11 14:11:58 -0500535 result = kernfs_name_compare(hash, name, ns, kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500536 if (result < 0)
537 node = node->rb_left;
538 else if (result > 0)
539 node = node->rb_right;
540 else
Tejun Heo324a56e2013-12-11 14:11:53 -0500541 return kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500542 }
543 return NULL;
544}
545
546/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500547 * kernfs_find_and_get_ns - find and get kernfs_node with the given name
548 * @parent: kernfs_node to search under
Tejun Heofd7b9f72013-11-28 14:54:33 -0500549 * @name: name to look for
550 * @ns: the namespace tag to use
551 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500552 * Look for kernfs_node with name @name under @parent and get a reference
Tejun Heofd7b9f72013-11-28 14:54:33 -0500553 * if found. This function may sleep and returns pointer to the found
Tejun Heo324a56e2013-12-11 14:11:53 -0500554 * kernfs_node on success, %NULL on failure.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500555 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500556struct kernfs_node *kernfs_find_and_get_ns(struct kernfs_node *parent,
557 const char *name, const void *ns)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500558{
Tejun Heo324a56e2013-12-11 14:11:53 -0500559 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500560
Tejun Heoa797bfc2013-12-11 14:11:57 -0500561 mutex_lock(&kernfs_mutex);
Tejun Heo324a56e2013-12-11 14:11:53 -0500562 kn = kernfs_find_ns(parent, name, ns);
563 kernfs_get(kn);
Tejun Heoa797bfc2013-12-11 14:11:57 -0500564 mutex_unlock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500565
Tejun Heo324a56e2013-12-11 14:11:53 -0500566 return kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500567}
568EXPORT_SYMBOL_GPL(kernfs_find_and_get_ns);
569
570/**
Tejun Heoba7443b2013-11-28 14:54:40 -0500571 * kernfs_create_root - create a new kernfs hierarchy
Tejun Heo80b9bbe2013-12-11 16:03:00 -0500572 * @kdops: optional directory syscall operations for the hierarchy
Tejun Heoba7443b2013-11-28 14:54:40 -0500573 * @priv: opaque data associated with the new directory
574 *
575 * Returns the root of the new hierarchy on success, ERR_PTR() value on
576 * failure.
577 */
Tejun Heo80b9bbe2013-12-11 16:03:00 -0500578struct kernfs_root *kernfs_create_root(struct kernfs_dir_ops *kdops, void *priv)
Tejun Heoba7443b2013-11-28 14:54:40 -0500579{
580 struct kernfs_root *root;
Tejun Heo324a56e2013-12-11 14:11:53 -0500581 struct kernfs_node *kn;
Tejun Heoba7443b2013-11-28 14:54:40 -0500582
583 root = kzalloc(sizeof(*root), GFP_KERNEL);
584 if (!root)
585 return ERR_PTR(-ENOMEM);
586
Tejun Heobc755552013-11-28 14:54:41 -0500587 ida_init(&root->ino_ida);
588
Tejun Heoc637b8a2013-12-11 14:11:58 -0500589 kn = kernfs_new_node(root, "", S_IFDIR | S_IRUGO | S_IXUGO, KERNFS_DIR);
Tejun Heo324a56e2013-12-11 14:11:53 -0500590 if (!kn) {
Tejun Heobc755552013-11-28 14:54:41 -0500591 ida_destroy(&root->ino_ida);
Tejun Heoba7443b2013-11-28 14:54:40 -0500592 kfree(root);
593 return ERR_PTR(-ENOMEM);
594 }
595
Tejun Heoae343722014-01-10 08:57:21 -0500596 atomic_sub(KN_DEACTIVATED_BIAS, &kn->active);
Tejun Heo324a56e2013-12-11 14:11:53 -0500597 kn->priv = priv;
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500598 kn->dir.root = root;
Tejun Heoba7443b2013-11-28 14:54:40 -0500599
Tejun Heo80b9bbe2013-12-11 16:03:00 -0500600 root->dir_ops = kdops;
Tejun Heo324a56e2013-12-11 14:11:53 -0500601 root->kn = kn;
Tejun Heoea1c4722014-01-10 08:57:19 -0500602 init_waitqueue_head(&root->deactivate_waitq);
Tejun Heoba7443b2013-11-28 14:54:40 -0500603
604 return root;
605}
606
607/**
608 * kernfs_destroy_root - destroy a kernfs hierarchy
609 * @root: root of the hierarchy to destroy
610 *
611 * Destroy the hierarchy anchored at @root by removing all existing
612 * directories and destroying @root.
613 */
614void kernfs_destroy_root(struct kernfs_root *root)
615{
Tejun Heo324a56e2013-12-11 14:11:53 -0500616 kernfs_remove(root->kn); /* will also free @root */
Tejun Heoba7443b2013-11-28 14:54:40 -0500617}
618
619/**
Tejun Heofd7b9f72013-11-28 14:54:33 -0500620 * kernfs_create_dir_ns - create a directory
621 * @parent: parent in which to create a new directory
622 * @name: name of the new directory
Tejun Heobb8b9d02013-12-11 16:02:55 -0500623 * @mode: mode of the new directory
Tejun Heofd7b9f72013-11-28 14:54:33 -0500624 * @priv: opaque data associated with the new directory
625 * @ns: optional namespace tag of the directory
626 *
627 * Returns the created node on success, ERR_PTR() value on failure.
628 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500629struct kernfs_node *kernfs_create_dir_ns(struct kernfs_node *parent,
Tejun Heobb8b9d02013-12-11 16:02:55 -0500630 const char *name, umode_t mode,
631 void *priv, const void *ns)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500632{
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800633 struct kernfs_addrm_cxt acxt;
Tejun Heo324a56e2013-12-11 14:11:53 -0500634 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500635 int rc;
636
637 /* allocate */
Tejun Heobb8b9d02013-12-11 16:02:55 -0500638 kn = kernfs_new_node(kernfs_root(parent), name, mode | S_IFDIR,
639 KERNFS_DIR);
Tejun Heo324a56e2013-12-11 14:11:53 -0500640 if (!kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500641 return ERR_PTR(-ENOMEM);
642
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500643 kn->dir.root = parent->dir.root;
644 kn->ns = ns;
Tejun Heo324a56e2013-12-11 14:11:53 -0500645 kn->priv = priv;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500646
647 /* link in */
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800648 rc = -ENOENT;
649 if (kernfs_get_active(parent)) {
650 kernfs_addrm_start(&acxt);
651 rc = kernfs_add_one(&acxt, kn, parent);
652 kernfs_addrm_finish(&acxt);
653 kernfs_put_active(parent);
654 }
655
Tejun Heofd7b9f72013-11-28 14:54:33 -0500656 if (!rc)
Tejun Heo324a56e2013-12-11 14:11:53 -0500657 return kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500658
Tejun Heo324a56e2013-12-11 14:11:53 -0500659 kernfs_put(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500660 return ERR_PTR(rc);
661}
662
Tejun Heoc637b8a2013-12-11 14:11:58 -0500663static struct dentry *kernfs_iop_lookup(struct inode *dir,
664 struct dentry *dentry,
665 unsigned int flags)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500666{
Tejun Heo19bbb922013-12-11 16:02:59 -0500667 struct dentry *ret;
Tejun Heo324a56e2013-12-11 14:11:53 -0500668 struct kernfs_node *parent = dentry->d_parent->d_fsdata;
669 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500670 struct inode *inode;
671 const void *ns = NULL;
672
Tejun Heoa797bfc2013-12-11 14:11:57 -0500673 mutex_lock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500674
Tejun Heo324a56e2013-12-11 14:11:53 -0500675 if (kernfs_ns_enabled(parent))
Tejun Heoc525aad2013-12-11 14:11:55 -0500676 ns = kernfs_info(dir->i_sb)->ns;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500677
Tejun Heo324a56e2013-12-11 14:11:53 -0500678 kn = kernfs_find_ns(parent, dentry->d_name.name, ns);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500679
680 /* no such entry */
Tejun Heo324a56e2013-12-11 14:11:53 -0500681 if (!kn) {
Tejun Heo19bbb922013-12-11 16:02:59 -0500682 ret = NULL;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500683 goto out_unlock;
684 }
Tejun Heo324a56e2013-12-11 14:11:53 -0500685 kernfs_get(kn);
686 dentry->d_fsdata = kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500687
688 /* attach dentry and inode */
Tejun Heoc637b8a2013-12-11 14:11:58 -0500689 inode = kernfs_get_inode(dir->i_sb, kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500690 if (!inode) {
691 ret = ERR_PTR(-ENOMEM);
692 goto out_unlock;
693 }
694
695 /* instantiate and hash dentry */
696 ret = d_materialise_unique(dentry, inode);
697 out_unlock:
Tejun Heoa797bfc2013-12-11 14:11:57 -0500698 mutex_unlock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500699 return ret;
700}
701
Tejun Heo80b9bbe2013-12-11 16:03:00 -0500702static int kernfs_iop_mkdir(struct inode *dir, struct dentry *dentry,
703 umode_t mode)
704{
705 struct kernfs_node *parent = dir->i_private;
706 struct kernfs_dir_ops *kdops = kernfs_root(parent)->dir_ops;
707
708 if (!kdops || !kdops->mkdir)
709 return -EPERM;
710
711 return kdops->mkdir(parent, dentry->d_name.name, mode);
712}
713
714static int kernfs_iop_rmdir(struct inode *dir, struct dentry *dentry)
715{
716 struct kernfs_node *kn = dentry->d_fsdata;
717 struct kernfs_dir_ops *kdops = kernfs_root(kn)->dir_ops;
718
719 if (!kdops || !kdops->rmdir)
720 return -EPERM;
721
722 return kdops->rmdir(kn);
723}
724
725static int kernfs_iop_rename(struct inode *old_dir, struct dentry *old_dentry,
726 struct inode *new_dir, struct dentry *new_dentry)
727{
728 struct kernfs_node *kn = old_dentry->d_fsdata;
729 struct kernfs_node *new_parent = new_dir->i_private;
730 struct kernfs_dir_ops *kdops = kernfs_root(kn)->dir_ops;
731
732 if (!kdops || !kdops->rename)
733 return -EPERM;
734
735 return kdops->rename(kn, new_parent, new_dentry->d_name.name);
736}
737
Tejun Heoa797bfc2013-12-11 14:11:57 -0500738const struct inode_operations kernfs_dir_iops = {
Tejun Heoc637b8a2013-12-11 14:11:58 -0500739 .lookup = kernfs_iop_lookup,
740 .permission = kernfs_iop_permission,
741 .setattr = kernfs_iop_setattr,
742 .getattr = kernfs_iop_getattr,
743 .setxattr = kernfs_iop_setxattr,
744 .removexattr = kernfs_iop_removexattr,
745 .getxattr = kernfs_iop_getxattr,
746 .listxattr = kernfs_iop_listxattr,
Tejun Heo80b9bbe2013-12-11 16:03:00 -0500747
748 .mkdir = kernfs_iop_mkdir,
749 .rmdir = kernfs_iop_rmdir,
750 .rename = kernfs_iop_rename,
Tejun Heofd7b9f72013-11-28 14:54:33 -0500751};
752
Tejun Heoc637b8a2013-12-11 14:11:58 -0500753static struct kernfs_node *kernfs_leftmost_descendant(struct kernfs_node *pos)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500754{
Tejun Heo324a56e2013-12-11 14:11:53 -0500755 struct kernfs_node *last;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500756
757 while (true) {
758 struct rb_node *rbn;
759
760 last = pos;
761
Tejun Heodf23fc32013-12-11 14:11:56 -0500762 if (kernfs_type(pos) != KERNFS_DIR)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500763 break;
764
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500765 rbn = rb_first(&pos->dir.children);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500766 if (!rbn)
767 break;
768
Tejun Heo324a56e2013-12-11 14:11:53 -0500769 pos = rb_to_kn(rbn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500770 }
771
772 return last;
773}
774
775/**
Tejun Heoc637b8a2013-12-11 14:11:58 -0500776 * kernfs_next_descendant_post - find the next descendant for post-order walk
Tejun Heofd7b9f72013-11-28 14:54:33 -0500777 * @pos: the current position (%NULL to initiate traversal)
Tejun Heo324a56e2013-12-11 14:11:53 -0500778 * @root: kernfs_node whose descendants to walk
Tejun Heofd7b9f72013-11-28 14:54:33 -0500779 *
780 * Find the next descendant to visit for post-order traversal of @root's
781 * descendants. @root is included in the iteration and the last node to be
782 * visited.
783 */
Tejun Heoc637b8a2013-12-11 14:11:58 -0500784static struct kernfs_node *kernfs_next_descendant_post(struct kernfs_node *pos,
785 struct kernfs_node *root)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500786{
787 struct rb_node *rbn;
788
Tejun Heoa797bfc2013-12-11 14:11:57 -0500789 lockdep_assert_held(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500790
791 /* if first iteration, visit leftmost descendant which may be root */
792 if (!pos)
Tejun Heoc637b8a2013-12-11 14:11:58 -0500793 return kernfs_leftmost_descendant(root);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500794
795 /* if we visited @root, we're done */
796 if (pos == root)
797 return NULL;
798
799 /* if there's an unvisited sibling, visit its leftmost descendant */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500800 rbn = rb_next(&pos->rb);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500801 if (rbn)
Tejun Heoc637b8a2013-12-11 14:11:58 -0500802 return kernfs_leftmost_descendant(rb_to_kn(rbn));
Tejun Heofd7b9f72013-11-28 14:54:33 -0500803
804 /* no sibling left, visit parent */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500805 return pos->parent;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500806}
807
Tejun Heo45a140e2014-01-10 08:57:22 -0500808static void __kernfs_deactivate(struct kernfs_node *kn)
809{
810 struct kernfs_node *pos;
811
812 lockdep_assert_held(&kernfs_mutex);
813
814 /* prevent any new usage under @kn by deactivating all nodes */
815 pos = NULL;
816 while ((pos = kernfs_next_descendant_post(pos, kn))) {
Greg Kroah-Hartman9b0925a2014-01-13 14:09:38 -0800817 if (atomic_read(&pos->active) >= 0) {
Tejun Heo45a140e2014-01-10 08:57:22 -0500818 atomic_add(KN_DEACTIVATED_BIAS, &pos->active);
819 pos->flags |= KERNFS_JUST_DEACTIVATED;
820 }
821 }
822
823 /*
824 * Drain the subtree. If kernfs_drain() blocked to drain, which is
825 * indicated by %true return, it temporarily released kernfs_mutex
826 * and the rbtree might have been modified inbetween breaking our
827 * future walk. Restart the walk after each %true return.
828 */
829 pos = NULL;
830 while ((pos = kernfs_next_descendant_post(pos, kn))) {
831 bool drained;
832
833 kernfs_get(pos);
834 drained = kernfs_drain(pos);
835 kernfs_put(pos);
836 if (drained)
837 pos = NULL;
838 }
839}
840
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800841static void __kernfs_remove(struct kernfs_addrm_cxt *acxt,
842 struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500843{
Tejun Heo45a140e2014-01-10 08:57:22 -0500844 struct kernfs_node *pos;
845
846 lockdep_assert_held(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500847
Greg Kroah-Hartmance9b4992014-01-13 13:50:31 -0800848 if (!kn)
849 return;
850
Tejun Heoc637b8a2013-12-11 14:11:58 -0500851 pr_debug("kernfs %s: removing\n", kn->name);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500852
Tejun Heo45a140e2014-01-10 08:57:22 -0500853 __kernfs_deactivate(kn);
854
855 /* unlink the subtree node-by-node */
Tejun Heofd7b9f72013-11-28 14:54:33 -0500856 do {
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800857 struct kernfs_iattrs *ps_iattr;
858
Tejun Heo45a140e2014-01-10 08:57:22 -0500859 pos = kernfs_leftmost_descendant(kn);
860
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800861 if (pos->parent) {
862 kernfs_unlink_sibling(pos);
Tejun Heo45a140e2014-01-10 08:57:22 -0500863
864 /* update timestamps on the parent */
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800865 ps_iattr = pos->parent->iattr;
Tejun Heo45a140e2014-01-10 08:57:22 -0500866 if (ps_iattr) {
867 ps_iattr->ia_iattr.ia_ctime = CURRENT_TIME;
868 ps_iattr->ia_iattr.ia_mtime = CURRENT_TIME;
869 }
870 }
871
Greg Kroah-Hartman55f6e302014-01-13 14:27:16 -0800872 pos->u.removed_list = acxt->removed;
873 acxt->removed = pos;
Tejun Heo45a140e2014-01-10 08:57:22 -0500874 } while (pos != kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500875}
876
877/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500878 * kernfs_remove - remove a kernfs_node recursively
879 * @kn: the kernfs_node to remove
Tejun Heofd7b9f72013-11-28 14:54:33 -0500880 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500881 * Remove @kn along with all its subdirectories and files.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500882 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500883void kernfs_remove(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500884{
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800885 struct kernfs_addrm_cxt acxt;
886
887 kernfs_addrm_start(&acxt);
888 __kernfs_remove(&acxt, kn);
889 kernfs_addrm_finish(&acxt);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500890}
891
892/**
Tejun Heo324a56e2013-12-11 14:11:53 -0500893 * kernfs_remove_by_name_ns - find a kernfs_node by name and remove it
894 * @parent: parent of the target
895 * @name: name of the kernfs_node to remove
896 * @ns: namespace tag of the kernfs_node to remove
Tejun Heofd7b9f72013-11-28 14:54:33 -0500897 *
Tejun Heo324a56e2013-12-11 14:11:53 -0500898 * Look for the kernfs_node with @name and @ns under @parent and remove it.
899 * Returns 0 on success, -ENOENT if such entry doesn't exist.
Tejun Heofd7b9f72013-11-28 14:54:33 -0500900 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500901int kernfs_remove_by_name_ns(struct kernfs_node *parent, const char *name,
Tejun Heofd7b9f72013-11-28 14:54:33 -0500902 const void *ns)
903{
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800904 struct kernfs_addrm_cxt acxt;
Tejun Heo324a56e2013-12-11 14:11:53 -0500905 struct kernfs_node *kn;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500906
Tejun Heo324a56e2013-12-11 14:11:53 -0500907 if (!parent) {
Tejun Heoc637b8a2013-12-11 14:11:58 -0500908 WARN(1, KERN_WARNING "kernfs: can not remove '%s', no directory\n",
Tejun Heofd7b9f72013-11-28 14:54:33 -0500909 name);
910 return -ENOENT;
911 }
912
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800913 kernfs_addrm_start(&acxt);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500914
Tejun Heo324a56e2013-12-11 14:11:53 -0500915 kn = kernfs_find_ns(parent, name, ns);
916 if (kn)
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800917 __kernfs_remove(&acxt, kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500918
Greg Kroah-Hartman7653fe92014-01-13 14:20:56 -0800919 kernfs_addrm_finish(&acxt);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500920
Tejun Heo324a56e2013-12-11 14:11:53 -0500921 if (kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500922 return 0;
923 else
924 return -ENOENT;
925}
926
927/**
928 * kernfs_rename_ns - move and rename a kernfs_node
Tejun Heo324a56e2013-12-11 14:11:53 -0500929 * @kn: target node
Tejun Heofd7b9f72013-11-28 14:54:33 -0500930 * @new_parent: new parent to put @sd under
931 * @new_name: new name
932 * @new_ns: new namespace tag
933 */
Tejun Heo324a56e2013-12-11 14:11:53 -0500934int kernfs_rename_ns(struct kernfs_node *kn, struct kernfs_node *new_parent,
Tejun Heofd7b9f72013-11-28 14:54:33 -0500935 const char *new_name, const void *new_ns)
936{
937 int error;
938
Tejun Heod0ae3d42013-12-11 16:02:56 -0500939 error = -ENOENT;
Tejun Heoae343722014-01-10 08:57:21 -0500940 if (!kernfs_get_active(new_parent))
Tejun Heod0ae3d42013-12-11 16:02:56 -0500941 goto out;
Tejun Heoae343722014-01-10 08:57:21 -0500942 if (!kernfs_get_active(kn))
943 goto out_put_new_parent;
944
945 mutex_lock(&kernfs_mutex);
Tejun Heod0ae3d42013-12-11 16:02:56 -0500946
Tejun Heofd7b9f72013-11-28 14:54:33 -0500947 error = 0;
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500948 if ((kn->parent == new_parent) && (kn->ns == new_ns) &&
949 (strcmp(kn->name, new_name) == 0))
Tejun Heoae343722014-01-10 08:57:21 -0500950 goto out_unlock; /* nothing to rename */
Tejun Heofd7b9f72013-11-28 14:54:33 -0500951
952 error = -EEXIST;
953 if (kernfs_find_ns(new_parent, new_name, new_ns))
Tejun Heoae343722014-01-10 08:57:21 -0500954 goto out_unlock;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500955
Tejun Heo324a56e2013-12-11 14:11:53 -0500956 /* rename kernfs_node */
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500957 if (strcmp(kn->name, new_name) != 0) {
Tejun Heofd7b9f72013-11-28 14:54:33 -0500958 error = -ENOMEM;
959 new_name = kstrdup(new_name, GFP_KERNEL);
960 if (!new_name)
Tejun Heoae343722014-01-10 08:57:21 -0500961 goto out_unlock;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500962
Tejun Heo47a52e92013-12-11 16:02:58 -0500963 if (kn->flags & KERNFS_STATIC_NAME)
964 kn->flags &= ~KERNFS_STATIC_NAME;
965 else
966 kfree(kn->name);
967
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500968 kn->name = new_name;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500969 }
970
971 /*
972 * Move to the appropriate place in the appropriate directories rbtree.
973 */
Tejun Heoc637b8a2013-12-11 14:11:58 -0500974 kernfs_unlink_sibling(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500975 kernfs_get(new_parent);
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500976 kernfs_put(kn->parent);
977 kn->ns = new_ns;
Tejun Heoc637b8a2013-12-11 14:11:58 -0500978 kn->hash = kernfs_name_hash(kn->name, kn->ns);
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500979 kn->parent = new_parent;
Tejun Heoc637b8a2013-12-11 14:11:58 -0500980 kernfs_link_sibling(kn);
Tejun Heofd7b9f72013-11-28 14:54:33 -0500981
982 error = 0;
Tejun Heoae343722014-01-10 08:57:21 -0500983out_unlock:
Tejun Heoa797bfc2013-12-11 14:11:57 -0500984 mutex_unlock(&kernfs_mutex);
Tejun Heoae343722014-01-10 08:57:21 -0500985 kernfs_put_active(kn);
986out_put_new_parent:
987 kernfs_put_active(new_parent);
988out:
Tejun Heofd7b9f72013-11-28 14:54:33 -0500989 return error;
990}
991
Tejun Heofd7b9f72013-11-28 14:54:33 -0500992/* Relationship between s_mode and the DT_xxx types */
Tejun Heo324a56e2013-12-11 14:11:53 -0500993static inline unsigned char dt_type(struct kernfs_node *kn)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500994{
Tejun Heoadc5e8b2013-12-11 14:11:54 -0500995 return (kn->mode >> 12) & 15;
Tejun Heofd7b9f72013-11-28 14:54:33 -0500996}
997
Tejun Heoc637b8a2013-12-11 14:11:58 -0500998static int kernfs_dir_fop_release(struct inode *inode, struct file *filp)
Tejun Heofd7b9f72013-11-28 14:54:33 -0500999{
1000 kernfs_put(filp->private_data);
1001 return 0;
1002}
1003
Tejun Heoc637b8a2013-12-11 14:11:58 -05001004static struct kernfs_node *kernfs_dir_pos(const void *ns,
Tejun Heo324a56e2013-12-11 14:11:53 -05001005 struct kernfs_node *parent, loff_t hash, struct kernfs_node *pos)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001006{
1007 if (pos) {
Tejun Heoae343722014-01-10 08:57:21 -05001008 int valid = pos->parent == parent && hash == pos->hash;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001009 kernfs_put(pos);
1010 if (!valid)
1011 pos = NULL;
1012 }
1013 if (!pos && (hash > 1) && (hash < INT_MAX)) {
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001014 struct rb_node *node = parent->dir.children.rb_node;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001015 while (node) {
Tejun Heo324a56e2013-12-11 14:11:53 -05001016 pos = rb_to_kn(node);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001017
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001018 if (hash < pos->hash)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001019 node = node->rb_left;
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001020 else if (hash > pos->hash)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001021 node = node->rb_right;
1022 else
1023 break;
1024 }
1025 }
1026 /* Skip over entries in the wrong namespace */
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001027 while (pos && pos->ns != ns) {
1028 struct rb_node *node = rb_next(&pos->rb);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001029 if (!node)
1030 pos = NULL;
1031 else
Tejun Heo324a56e2013-12-11 14:11:53 -05001032 pos = rb_to_kn(node);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001033 }
1034 return pos;
1035}
1036
Tejun Heoc637b8a2013-12-11 14:11:58 -05001037static struct kernfs_node *kernfs_dir_next_pos(const void *ns,
Tejun Heo324a56e2013-12-11 14:11:53 -05001038 struct kernfs_node *parent, ino_t ino, struct kernfs_node *pos)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001039{
Tejun Heoc637b8a2013-12-11 14:11:58 -05001040 pos = kernfs_dir_pos(ns, parent, ino, pos);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001041 if (pos)
1042 do {
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001043 struct rb_node *node = rb_next(&pos->rb);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001044 if (!node)
1045 pos = NULL;
1046 else
Tejun Heo324a56e2013-12-11 14:11:53 -05001047 pos = rb_to_kn(node);
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001048 } while (pos && pos->ns != ns);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001049 return pos;
1050}
1051
Tejun Heoc637b8a2013-12-11 14:11:58 -05001052static int kernfs_fop_readdir(struct file *file, struct dir_context *ctx)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001053{
1054 struct dentry *dentry = file->f_path.dentry;
Tejun Heo324a56e2013-12-11 14:11:53 -05001055 struct kernfs_node *parent = dentry->d_fsdata;
1056 struct kernfs_node *pos = file->private_data;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001057 const void *ns = NULL;
1058
1059 if (!dir_emit_dots(file, ctx))
1060 return 0;
Tejun Heoa797bfc2013-12-11 14:11:57 -05001061 mutex_lock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001062
Tejun Heo324a56e2013-12-11 14:11:53 -05001063 if (kernfs_ns_enabled(parent))
Tejun Heoc525aad2013-12-11 14:11:55 -05001064 ns = kernfs_info(dentry->d_sb)->ns;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001065
Tejun Heoc637b8a2013-12-11 14:11:58 -05001066 for (pos = kernfs_dir_pos(ns, parent, ctx->pos, pos);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001067 pos;
Tejun Heoc637b8a2013-12-11 14:11:58 -05001068 pos = kernfs_dir_next_pos(ns, parent, ctx->pos, pos)) {
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001069 const char *name = pos->name;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001070 unsigned int type = dt_type(pos);
1071 int len = strlen(name);
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001072 ino_t ino = pos->ino;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001073
Tejun Heoadc5e8b2013-12-11 14:11:54 -05001074 ctx->pos = pos->hash;
Tejun Heofd7b9f72013-11-28 14:54:33 -05001075 file->private_data = pos;
1076 kernfs_get(pos);
1077
Tejun Heoa797bfc2013-12-11 14:11:57 -05001078 mutex_unlock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001079 if (!dir_emit(ctx, name, len, ino, type))
1080 return 0;
Tejun Heoa797bfc2013-12-11 14:11:57 -05001081 mutex_lock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001082 }
Tejun Heoa797bfc2013-12-11 14:11:57 -05001083 mutex_unlock(&kernfs_mutex);
Tejun Heofd7b9f72013-11-28 14:54:33 -05001084 file->private_data = NULL;
1085 ctx->pos = INT_MAX;
1086 return 0;
1087}
1088
Tejun Heoc637b8a2013-12-11 14:11:58 -05001089static loff_t kernfs_dir_fop_llseek(struct file *file, loff_t offset,
1090 int whence)
Tejun Heofd7b9f72013-11-28 14:54:33 -05001091{
1092 struct inode *inode = file_inode(file);
1093 loff_t ret;
1094
1095 mutex_lock(&inode->i_mutex);
1096 ret = generic_file_llseek(file, offset, whence);
1097 mutex_unlock(&inode->i_mutex);
1098
1099 return ret;
1100}
1101
Tejun Heoa797bfc2013-12-11 14:11:57 -05001102const struct file_operations kernfs_dir_fops = {
Tejun Heofd7b9f72013-11-28 14:54:33 -05001103 .read = generic_read_dir,
Tejun Heoc637b8a2013-12-11 14:11:58 -05001104 .iterate = kernfs_fop_readdir,
1105 .release = kernfs_dir_fop_release,
1106 .llseek = kernfs_dir_fop_llseek,
Tejun Heofd7b9f72013-11-28 14:54:33 -05001107};