Revert "kernfs: implement kernfs_{de|re}activate[_self]()"
[deliverable/linux.git] / fs / kernfs / dir.c
CommitLineData
b8441ed2
TH
1/*
2 * fs/kernfs/dir.c - kernfs directory implementation
3 *
4 * Copyright (c) 2001-3 Patrick Mochel
5 * Copyright (c) 2007 SUSE Linux Products GmbH
6 * Copyright (c) 2007, 2013 Tejun Heo <tj@kernel.org>
7 *
8 * This file is released under the GPLv2.
9 */
fd7b9f7b 10
ea1c472d 11#include <linux/sched.h>
fd7b9f7b
TH
12#include <linux/fs.h>
13#include <linux/namei.h>
14#include <linux/idr.h>
15#include <linux/slab.h>
16#include <linux/security.h>
17#include <linux/hash.h>
18
19#include "kernfs-internal.h"
20
a797bfc3 21DEFINE_MUTEX(kernfs_mutex);
fd7b9f7b 22
adc5e8b5 23#define rb_to_kn(X) rb_entry((X), struct kernfs_node, rb)
fd7b9f7b 24
a69d001c
TH
25static bool kernfs_lockdep(struct kernfs_node *kn)
26{
27#ifdef CONFIG_DEBUG_LOCK_ALLOC
28 return kn->flags & KERNFS_LOCKDEP;
29#else
30 return false;
31#endif
32}
33
fd7b9f7b 34/**
c637b8ac 35 * kernfs_name_hash
fd7b9f7b
TH
36 * @name: Null terminated string to hash
37 * @ns: Namespace tag to hash
38 *
39 * Returns 31 bit hash of ns + name (so it fits in an off_t )
40 */
c637b8ac 41static unsigned int kernfs_name_hash(const char *name, const void *ns)
fd7b9f7b
TH
42{
43 unsigned long hash = init_name_hash();
44 unsigned int len = strlen(name);
45 while (len--)
46 hash = partial_name_hash(*name++, hash);
47 hash = (end_name_hash(hash) ^ hash_ptr((void *)ns, 31));
48 hash &= 0x7fffffffU;
49 /* Reserve hash numbers 0, 1 and INT_MAX for magic directory entries */
50 if (hash < 1)
51 hash += 2;
52 if (hash >= INT_MAX)
53 hash = INT_MAX - 1;
54 return hash;
55}
56
c637b8ac
TH
57static int kernfs_name_compare(unsigned int hash, const char *name,
58 const void *ns, const struct kernfs_node *kn)
fd7b9f7b 59{
adc5e8b5
TH
60 if (hash != kn->hash)
61 return hash - kn->hash;
62 if (ns != kn->ns)
63 return ns - kn->ns;
64 return strcmp(name, kn->name);
fd7b9f7b
TH
65}
66
c637b8ac
TH
67static int kernfs_sd_compare(const struct kernfs_node *left,
68 const struct kernfs_node *right)
fd7b9f7b 69{
c637b8ac 70 return kernfs_name_compare(left->hash, left->name, left->ns, right);
fd7b9f7b
TH
71}
72
73/**
c637b8ac 74 * kernfs_link_sibling - link kernfs_node into sibling rbtree
324a56e1 75 * @kn: kernfs_node of interest
fd7b9f7b 76 *
324a56e1 77 * Link @kn into its sibling rbtree which starts from
adc5e8b5 78 * @kn->parent->dir.children.
fd7b9f7b
TH
79 *
80 * Locking:
a797bfc3 81 * mutex_lock(kernfs_mutex)
fd7b9f7b
TH
82 *
83 * RETURNS:
84 * 0 on susccess -EEXIST on failure.
85 */
c637b8ac 86static int kernfs_link_sibling(struct kernfs_node *kn)
fd7b9f7b 87{
adc5e8b5 88 struct rb_node **node = &kn->parent->dir.children.rb_node;
fd7b9f7b
TH
89 struct rb_node *parent = NULL;
90
df23fc39 91 if (kernfs_type(kn) == KERNFS_DIR)
adc5e8b5 92 kn->parent->dir.subdirs++;
fd7b9f7b
TH
93
94 while (*node) {
324a56e1 95 struct kernfs_node *pos;
fd7b9f7b
TH
96 int result;
97
324a56e1 98 pos = rb_to_kn(*node);
fd7b9f7b 99 parent = *node;
c637b8ac 100 result = kernfs_sd_compare(kn, pos);
fd7b9f7b 101 if (result < 0)
adc5e8b5 102 node = &pos->rb.rb_left;
fd7b9f7b 103 else if (result > 0)
adc5e8b5 104 node = &pos->rb.rb_right;
fd7b9f7b
TH
105 else
106 return -EEXIST;
107 }
108 /* add new node and rebalance the tree */
adc5e8b5
TH
109 rb_link_node(&kn->rb, parent, node);
110 rb_insert_color(&kn->rb, &kn->parent->dir.children);
fd7b9f7b
TH
111 return 0;
112}
113
114/**
c637b8ac 115 * kernfs_unlink_sibling - unlink kernfs_node from sibling rbtree
324a56e1 116 * @kn: kernfs_node of interest
fd7b9f7b 117 *
324a56e1 118 * Unlink @kn from its sibling rbtree which starts from
adc5e8b5 119 * kn->parent->dir.children.
fd7b9f7b
TH
120 *
121 * Locking:
a797bfc3 122 * mutex_lock(kernfs_mutex)
fd7b9f7b 123 */
f601f9a2 124static bool kernfs_unlink_sibling(struct kernfs_node *kn)
fd7b9f7b 125{
f601f9a2
TH
126 if (RB_EMPTY_NODE(&kn->rb))
127 return false;
128
df23fc39 129 if (kernfs_type(kn) == KERNFS_DIR)
adc5e8b5 130 kn->parent->dir.subdirs--;
fd7b9f7b 131
adc5e8b5 132 rb_erase(&kn->rb, &kn->parent->dir.children);
ae34372e 133 RB_CLEAR_NODE(&kn->rb);
f601f9a2 134 return true;
fd7b9f7b
TH
135}
136
137/**
c637b8ac 138 * kernfs_get_active - get an active reference to kernfs_node
324a56e1 139 * @kn: kernfs_node to get an active reference to
fd7b9f7b 140 *
324a56e1 141 * Get an active reference of @kn. This function is noop if @kn
fd7b9f7b
TH
142 * is NULL.
143 *
144 * RETURNS:
324a56e1 145 * Pointer to @kn on success, NULL on failure.
fd7b9f7b 146 */
c637b8ac 147struct kernfs_node *kernfs_get_active(struct kernfs_node *kn)
fd7b9f7b 148{
324a56e1 149 if (unlikely(!kn))
fd7b9f7b
TH
150 return NULL;
151
a69d001c 152 if (kernfs_lockdep(kn))
324a56e1 153 rwsem_acquire_read(&kn->dep_map, 0, 1, _RET_IP_);
895a068a
TH
154
155 /*
156 * Try to obtain an active ref. If @kn is deactivated, we block
157 * till either it's reactivated or killed.
158 */
159 do {
160 if (atomic_inc_unless_negative(&kn->active))
161 return kn;
162
163 wait_event(kernfs_root(kn)->deactivate_waitq,
164 atomic_read(&kn->active) >= 0 ||
165 RB_EMPTY_NODE(&kn->rb));
166 } while (!RB_EMPTY_NODE(&kn->rb));
167
168 if (kernfs_lockdep(kn))
169 rwsem_release(&kn->dep_map, 1, _RET_IP_);
170 return NULL;
fd7b9f7b
TH
171}
172
173/**
c637b8ac 174 * kernfs_put_active - put an active reference to kernfs_node
324a56e1 175 * @kn: kernfs_node to put an active reference to
fd7b9f7b 176 *
324a56e1 177 * Put an active reference to @kn. This function is noop if @kn
fd7b9f7b
TH
178 * is NULL.
179 */
c637b8ac 180void kernfs_put_active(struct kernfs_node *kn)
fd7b9f7b 181{
ea1c472d 182 struct kernfs_root *root = kernfs_root(kn);
fd7b9f7b
TH
183 int v;
184
324a56e1 185 if (unlikely(!kn))
fd7b9f7b
TH
186 return;
187
a69d001c 188 if (kernfs_lockdep(kn))
324a56e1 189 rwsem_release(&kn->dep_map, 1, _RET_IP_);
adc5e8b5 190 v = atomic_dec_return(&kn->active);
df23fc39 191 if (likely(v != KN_DEACTIVATED_BIAS))
fd7b9f7b
TH
192 return;
193
ea1c472d 194 wake_up_all(&root->deactivate_waitq);
fd7b9f7b
TH
195}
196
197/**
ae34372e
TH
198 * kernfs_drain - drain kernfs_node
199 * @kn: kernfs_node to drain
fd7b9f7b 200 *
45a140e5
TH
201 * Drain existing usages of @kn. Mutiple removers may invoke this function
202 * concurrently on @kn and all will return after draining is complete.
203 * Returns %true if drain is performed and kernfs_mutex was temporarily
204 * released. %false if @kn was already drained and no operation was
205 * necessary.
206 *
207 * The caller is responsible for ensuring @kn stays pinned while this
208 * function is in progress even if it gets removed by someone else.
fd7b9f7b 209 */
45a140e5
TH
210static bool kernfs_drain(struct kernfs_node *kn)
211 __releases(&kernfs_mutex) __acquires(&kernfs_mutex)
fd7b9f7b 212{
ea1c472d 213 struct kernfs_root *root = kernfs_root(kn);
fd7b9f7b 214
45a140e5 215 lockdep_assert_held(&kernfs_mutex);
ae34372e 216 WARN_ON_ONCE(atomic_read(&kn->active) >= 0);
ea1c472d 217
45a140e5
TH
218 /*
219 * We want to go through the active ref lockdep annotation at least
220 * once for all node removals, but the lockdep annotation can't be
221 * nested inside kernfs_mutex and deactivation can't make forward
222 * progress if we keep dropping the mutex. Use JUST_ACTIVATED to
223 * force the slow path once for each deactivation if lockdep is
224 * enabled.
225 */
226 if ((!kernfs_lockdep(kn) || !(kn->flags & KERNFS_JUST_DEACTIVATED)) &&
227 atomic_read(&kn->active) == KN_DEACTIVATED_BIAS)
228 return false;
229
230 kn->flags &= ~KERNFS_JUST_DEACTIVATED;
231 mutex_unlock(&kernfs_mutex);
232
a69d001c
TH
233 if (kernfs_lockdep(kn)) {
234 rwsem_acquire(&kn->dep_map, 0, 0, _RET_IP_);
235 if (atomic_read(&kn->active) != KN_DEACTIVATED_BIAS)
236 lock_contended(&kn->dep_map, _RET_IP_);
237 }
ea1c472d
TH
238
239 wait_event(root->deactivate_waitq,
240 atomic_read(&kn->active) == KN_DEACTIVATED_BIAS);
fd7b9f7b 241
a69d001c
TH
242 if (kernfs_lockdep(kn)) {
243 lock_acquired(&kn->dep_map, _RET_IP_);
244 rwsem_release(&kn->dep_map, 1, _RET_IP_);
245 }
45a140e5
TH
246
247 mutex_lock(&kernfs_mutex);
248 return true;
fd7b9f7b
TH
249}
250
fd7b9f7b 251/**
324a56e1
TH
252 * kernfs_get - get a reference count on a kernfs_node
253 * @kn: the target kernfs_node
fd7b9f7b 254 */
324a56e1 255void kernfs_get(struct kernfs_node *kn)
fd7b9f7b 256{
324a56e1 257 if (kn) {
adc5e8b5
TH
258 WARN_ON(!atomic_read(&kn->count));
259 atomic_inc(&kn->count);
fd7b9f7b
TH
260 }
261}
262EXPORT_SYMBOL_GPL(kernfs_get);
263
264/**
324a56e1
TH
265 * kernfs_put - put a reference count on a kernfs_node
266 * @kn: the target kernfs_node
fd7b9f7b 267 *
324a56e1 268 * Put a reference count of @kn and destroy it if it reached zero.
fd7b9f7b 269 */
324a56e1 270void kernfs_put(struct kernfs_node *kn)
fd7b9f7b 271{
324a56e1 272 struct kernfs_node *parent;
ba7443bc 273 struct kernfs_root *root;
fd7b9f7b 274
adc5e8b5 275 if (!kn || !atomic_dec_and_test(&kn->count))
fd7b9f7b 276 return;
324a56e1 277 root = kernfs_root(kn);
fd7b9f7b 278 repeat:
ae34372e
TH
279 /*
280 * Moving/renaming is always done while holding reference.
adc5e8b5 281 * kn->parent won't change beneath us.
fd7b9f7b 282 */
adc5e8b5 283 parent = kn->parent;
fd7b9f7b 284
ae34372e
TH
285 WARN_ONCE(atomic_read(&kn->active) != KN_DEACTIVATED_BIAS,
286 "kernfs_put: %s/%s: released with incorrect active_ref %d\n",
287 parent ? parent->name : "", kn->name, atomic_read(&kn->active));
324a56e1 288
df23fc39 289 if (kernfs_type(kn) == KERNFS_LINK)
adc5e8b5 290 kernfs_put(kn->symlink.target_kn);
2063d608 291 if (!(kn->flags & KERNFS_STATIC_NAME))
adc5e8b5
TH
292 kfree(kn->name);
293 if (kn->iattr) {
294 if (kn->iattr->ia_secdata)
295 security_release_secctx(kn->iattr->ia_secdata,
296 kn->iattr->ia_secdata_len);
297 simple_xattrs_free(&kn->iattr->xattrs);
2322392b 298 }
adc5e8b5
TH
299 kfree(kn->iattr);
300 ida_simple_remove(&root->ino_ida, kn->ino);
a797bfc3 301 kmem_cache_free(kernfs_node_cache, kn);
fd7b9f7b 302
324a56e1
TH
303 kn = parent;
304 if (kn) {
adc5e8b5 305 if (atomic_dec_and_test(&kn->count))
ba7443bc
TH
306 goto repeat;
307 } else {
324a56e1 308 /* just released the root kn, free @root too */
bc755553 309 ida_destroy(&root->ino_ida);
ba7443bc
TH
310 kfree(root);
311 }
fd7b9f7b
TH
312}
313EXPORT_SYMBOL_GPL(kernfs_put);
314
c637b8ac 315static int kernfs_dop_revalidate(struct dentry *dentry, unsigned int flags)
fd7b9f7b 316{
324a56e1 317 struct kernfs_node *kn;
fd7b9f7b
TH
318
319 if (flags & LOOKUP_RCU)
320 return -ECHILD;
321
19bbb926
TH
322 /* Always perform fresh lookup for negatives */
323 if (!dentry->d_inode)
324 goto out_bad_unlocked;
325
324a56e1 326 kn = dentry->d_fsdata;
a797bfc3 327 mutex_lock(&kernfs_mutex);
fd7b9f7b 328
ae34372e
TH
329 /* Force fresh lookup if removed */
330 if (kn->parent && RB_EMPTY_NODE(&kn->rb))
fd7b9f7b
TH
331 goto out_bad;
332
c637b8ac 333 /* The kernfs node has been moved? */
adc5e8b5 334 if (dentry->d_parent->d_fsdata != kn->parent)
fd7b9f7b
TH
335 goto out_bad;
336
c637b8ac 337 /* The kernfs node has been renamed */
adc5e8b5 338 if (strcmp(dentry->d_name.name, kn->name) != 0)
fd7b9f7b
TH
339 goto out_bad;
340
c637b8ac 341 /* The kernfs node has been moved to a different namespace */
adc5e8b5 342 if (kn->parent && kernfs_ns_enabled(kn->parent) &&
c525aadd 343 kernfs_info(dentry->d_sb)->ns != kn->ns)
fd7b9f7b
TH
344 goto out_bad;
345
a797bfc3 346 mutex_unlock(&kernfs_mutex);
fd7b9f7b
TH
347out_valid:
348 return 1;
349out_bad:
a797bfc3 350 mutex_unlock(&kernfs_mutex);
19bbb926
TH
351out_bad_unlocked:
352 /*
353 * @dentry doesn't match the underlying kernfs node, drop the
354 * dentry and force lookup. If we have submounts we must allow the
355 * vfs caches to lie about the state of the filesystem to prevent
356 * leaks and other nasty things, so use check_submounts_and_drop()
357 * instead of d_drop().
fd7b9f7b
TH
358 */
359 if (check_submounts_and_drop(dentry) != 0)
360 goto out_valid;
361
362 return 0;
363}
364
c637b8ac 365static void kernfs_dop_release(struct dentry *dentry)
fd7b9f7b
TH
366{
367 kernfs_put(dentry->d_fsdata);
368}
369
a797bfc3 370const struct dentry_operations kernfs_dops = {
c637b8ac 371 .d_revalidate = kernfs_dop_revalidate,
c637b8ac 372 .d_release = kernfs_dop_release,
fd7b9f7b
TH
373};
374
c637b8ac 375struct kernfs_node *kernfs_new_node(struct kernfs_root *root, const char *name,
2063d608 376 umode_t mode, unsigned flags)
fd7b9f7b
TH
377{
378 char *dup_name = NULL;
324a56e1 379 struct kernfs_node *kn;
bc755553 380 int ret;
fd7b9f7b 381
2063d608 382 if (!(flags & KERNFS_STATIC_NAME)) {
fd7b9f7b
TH
383 name = dup_name = kstrdup(name, GFP_KERNEL);
384 if (!name)
385 return NULL;
386 }
387
a797bfc3 388 kn = kmem_cache_zalloc(kernfs_node_cache, GFP_KERNEL);
324a56e1 389 if (!kn)
fd7b9f7b
TH
390 goto err_out1;
391
bc755553
TH
392 ret = ida_simple_get(&root->ino_ida, 1, 0, GFP_KERNEL);
393 if (ret < 0)
fd7b9f7b 394 goto err_out2;
adc5e8b5 395 kn->ino = ret;
fd7b9f7b 396
adc5e8b5 397 atomic_set(&kn->count, 1);
ae34372e
TH
398 atomic_set(&kn->active, KN_DEACTIVATED_BIAS);
399 RB_CLEAR_NODE(&kn->rb);
fd7b9f7b 400
adc5e8b5
TH
401 kn->name = name;
402 kn->mode = mode;
ae34372e 403 kn->flags = flags;
fd7b9f7b 404
324a56e1 405 return kn;
fd7b9f7b
TH
406
407 err_out2:
a797bfc3 408 kmem_cache_free(kernfs_node_cache, kn);
fd7b9f7b
TH
409 err_out1:
410 kfree(dup_name);
411 return NULL;
412}
413
fd7b9f7b 414/**
c637b8ac 415 * kernfs_add_one - add kernfs_node to parent without warning
324a56e1
TH
416 * @kn: kernfs_node to be added
417 * @parent: the parent kernfs_node to add @kn to
fd7b9f7b 418 *
adc5e8b5
TH
419 * Get @parent and set @kn->parent to it and increment nlink of the
420 * parent inode if @kn is a directory and link into the children list
421 * of the parent.
fd7b9f7b 422 *
fd7b9f7b
TH
423 * RETURNS:
424 * 0 on success, -EEXIST if entry with the given name already
425 * exists.
426 */
99177a34 427int kernfs_add_one(struct kernfs_node *kn, struct kernfs_node *parent)
fd7b9f7b 428{
c525aadd 429 struct kernfs_iattrs *ps_iattr;
99177a34 430 bool has_ns;
fd7b9f7b
TH
431 int ret;
432
99177a34
TH
433 if (!kernfs_get_active(parent))
434 return -ENOENT;
ae34372e 435
99177a34
TH
436 mutex_lock(&kernfs_mutex);
437
438 ret = -EINVAL;
439 has_ns = kernfs_ns_enabled(parent);
440 if (WARN(has_ns != (bool)kn->ns, KERN_WARNING "kernfs: ns %s in '%s' for '%s'\n",
441 has_ns ? "required" : "invalid", parent->name, kn->name))
442 goto out_unlock;
fd7b9f7b 443
df23fc39 444 if (kernfs_type(parent) != KERNFS_DIR)
99177a34 445 goto out_unlock;
fd7b9f7b 446
c637b8ac 447 kn->hash = kernfs_name_hash(kn->name, kn->ns);
adc5e8b5 448 kn->parent = parent;
324a56e1 449 kernfs_get(parent);
fd7b9f7b 450
c637b8ac 451 ret = kernfs_link_sibling(kn);
fd7b9f7b 452 if (ret)
99177a34 453 goto out_unlock;
fd7b9f7b
TH
454
455 /* Update timestamps on the parent */
adc5e8b5 456 ps_iattr = parent->iattr;
fd7b9f7b
TH
457 if (ps_iattr) {
458 struct iattr *ps_iattrs = &ps_iattr->ia_iattr;
459 ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME;
460 }
461
462 /* Mark the entry added into directory tree */
ae34372e 463 atomic_sub(KN_DEACTIVATED_BIAS, &kn->active);
99177a34
TH
464 ret = 0;
465out_unlock:
a797bfc3 466 mutex_unlock(&kernfs_mutex);
99177a34
TH
467 kernfs_put_active(parent);
468 return ret;
fd7b9f7b
TH
469}
470
471/**
324a56e1
TH
472 * kernfs_find_ns - find kernfs_node with the given name
473 * @parent: kernfs_node to search under
fd7b9f7b
TH
474 * @name: name to look for
475 * @ns: the namespace tag to use
476 *
324a56e1
TH
477 * Look for kernfs_node with name @name under @parent. Returns pointer to
478 * the found kernfs_node on success, %NULL on failure.
fd7b9f7b 479 */
324a56e1
TH
480static struct kernfs_node *kernfs_find_ns(struct kernfs_node *parent,
481 const unsigned char *name,
482 const void *ns)
fd7b9f7b 483{
adc5e8b5 484 struct rb_node *node = parent->dir.children.rb_node;
ac9bba03 485 bool has_ns = kernfs_ns_enabled(parent);
fd7b9f7b
TH
486 unsigned int hash;
487
a797bfc3 488 lockdep_assert_held(&kernfs_mutex);
fd7b9f7b
TH
489
490 if (has_ns != (bool)ns) {
c637b8ac 491 WARN(1, KERN_WARNING "kernfs: ns %s in '%s' for '%s'\n",
adc5e8b5 492 has_ns ? "required" : "invalid", parent->name, name);
fd7b9f7b
TH
493 return NULL;
494 }
495
c637b8ac 496 hash = kernfs_name_hash(name, ns);
fd7b9f7b 497 while (node) {
324a56e1 498 struct kernfs_node *kn;
fd7b9f7b
TH
499 int result;
500
324a56e1 501 kn = rb_to_kn(node);
c637b8ac 502 result = kernfs_name_compare(hash, name, ns, kn);
fd7b9f7b
TH
503 if (result < 0)
504 node = node->rb_left;
505 else if (result > 0)
506 node = node->rb_right;
507 else
324a56e1 508 return kn;
fd7b9f7b
TH
509 }
510 return NULL;
511}
512
513/**
324a56e1
TH
514 * kernfs_find_and_get_ns - find and get kernfs_node with the given name
515 * @parent: kernfs_node to search under
fd7b9f7b
TH
516 * @name: name to look for
517 * @ns: the namespace tag to use
518 *
324a56e1 519 * Look for kernfs_node with name @name under @parent and get a reference
fd7b9f7b 520 * if found. This function may sleep and returns pointer to the found
324a56e1 521 * kernfs_node on success, %NULL on failure.
fd7b9f7b 522 */
324a56e1
TH
523struct kernfs_node *kernfs_find_and_get_ns(struct kernfs_node *parent,
524 const char *name, const void *ns)
fd7b9f7b 525{
324a56e1 526 struct kernfs_node *kn;
fd7b9f7b 527
a797bfc3 528 mutex_lock(&kernfs_mutex);
324a56e1
TH
529 kn = kernfs_find_ns(parent, name, ns);
530 kernfs_get(kn);
a797bfc3 531 mutex_unlock(&kernfs_mutex);
fd7b9f7b 532
324a56e1 533 return kn;
fd7b9f7b
TH
534}
535EXPORT_SYMBOL_GPL(kernfs_find_and_get_ns);
536
ba7443bc
TH
537/**
538 * kernfs_create_root - create a new kernfs hierarchy
80b9bbef 539 * @kdops: optional directory syscall operations for the hierarchy
ba7443bc
TH
540 * @priv: opaque data associated with the new directory
541 *
542 * Returns the root of the new hierarchy on success, ERR_PTR() value on
543 * failure.
544 */
80b9bbef 545struct kernfs_root *kernfs_create_root(struct kernfs_dir_ops *kdops, void *priv)
ba7443bc
TH
546{
547 struct kernfs_root *root;
324a56e1 548 struct kernfs_node *kn;
ba7443bc
TH
549
550 root = kzalloc(sizeof(*root), GFP_KERNEL);
551 if (!root)
552 return ERR_PTR(-ENOMEM);
553
bc755553
TH
554 ida_init(&root->ino_ida);
555
c637b8ac 556 kn = kernfs_new_node(root, "", S_IFDIR | S_IRUGO | S_IXUGO, KERNFS_DIR);
324a56e1 557 if (!kn) {
bc755553 558 ida_destroy(&root->ino_ida);
ba7443bc
TH
559 kfree(root);
560 return ERR_PTR(-ENOMEM);
561 }
562
ae34372e 563 atomic_sub(KN_DEACTIVATED_BIAS, &kn->active);
324a56e1 564 kn->priv = priv;
adc5e8b5 565 kn->dir.root = root;
ba7443bc 566
80b9bbef 567 root->dir_ops = kdops;
324a56e1 568 root->kn = kn;
ea1c472d 569 init_waitqueue_head(&root->deactivate_waitq);
ba7443bc
TH
570
571 return root;
572}
573
574/**
575 * kernfs_destroy_root - destroy a kernfs hierarchy
576 * @root: root of the hierarchy to destroy
577 *
578 * Destroy the hierarchy anchored at @root by removing all existing
579 * directories and destroying @root.
580 */
581void kernfs_destroy_root(struct kernfs_root *root)
582{
324a56e1 583 kernfs_remove(root->kn); /* will also free @root */
ba7443bc
TH
584}
585
fd7b9f7b
TH
586/**
587 * kernfs_create_dir_ns - create a directory
588 * @parent: parent in which to create a new directory
589 * @name: name of the new directory
bb8b9d09 590 * @mode: mode of the new directory
fd7b9f7b
TH
591 * @priv: opaque data associated with the new directory
592 * @ns: optional namespace tag of the directory
593 *
594 * Returns the created node on success, ERR_PTR() value on failure.
595 */
324a56e1 596struct kernfs_node *kernfs_create_dir_ns(struct kernfs_node *parent,
bb8b9d09
TH
597 const char *name, umode_t mode,
598 void *priv, const void *ns)
fd7b9f7b 599{
324a56e1 600 struct kernfs_node *kn;
fd7b9f7b
TH
601 int rc;
602
603 /* allocate */
bb8b9d09
TH
604 kn = kernfs_new_node(kernfs_root(parent), name, mode | S_IFDIR,
605 KERNFS_DIR);
324a56e1 606 if (!kn)
fd7b9f7b
TH
607 return ERR_PTR(-ENOMEM);
608
adc5e8b5
TH
609 kn->dir.root = parent->dir.root;
610 kn->ns = ns;
324a56e1 611 kn->priv = priv;
fd7b9f7b
TH
612
613 /* link in */
99177a34 614 rc = kernfs_add_one(kn, parent);
fd7b9f7b 615 if (!rc)
324a56e1 616 return kn;
fd7b9f7b 617
324a56e1 618 kernfs_put(kn);
fd7b9f7b
TH
619 return ERR_PTR(rc);
620}
621
c637b8ac
TH
622static struct dentry *kernfs_iop_lookup(struct inode *dir,
623 struct dentry *dentry,
624 unsigned int flags)
fd7b9f7b 625{
19bbb926 626 struct dentry *ret;
324a56e1
TH
627 struct kernfs_node *parent = dentry->d_parent->d_fsdata;
628 struct kernfs_node *kn;
fd7b9f7b
TH
629 struct inode *inode;
630 const void *ns = NULL;
631
a797bfc3 632 mutex_lock(&kernfs_mutex);
fd7b9f7b 633
324a56e1 634 if (kernfs_ns_enabled(parent))
c525aadd 635 ns = kernfs_info(dir->i_sb)->ns;
fd7b9f7b 636
324a56e1 637 kn = kernfs_find_ns(parent, dentry->d_name.name, ns);
fd7b9f7b
TH
638
639 /* no such entry */
324a56e1 640 if (!kn) {
19bbb926 641 ret = NULL;
fd7b9f7b
TH
642 goto out_unlock;
643 }
324a56e1
TH
644 kernfs_get(kn);
645 dentry->d_fsdata = kn;
fd7b9f7b
TH
646
647 /* attach dentry and inode */
c637b8ac 648 inode = kernfs_get_inode(dir->i_sb, kn);
fd7b9f7b
TH
649 if (!inode) {
650 ret = ERR_PTR(-ENOMEM);
651 goto out_unlock;
652 }
653
654 /* instantiate and hash dentry */
655 ret = d_materialise_unique(dentry, inode);
656 out_unlock:
a797bfc3 657 mutex_unlock(&kernfs_mutex);
fd7b9f7b
TH
658 return ret;
659}
660
80b9bbef
TH
661static int kernfs_iop_mkdir(struct inode *dir, struct dentry *dentry,
662 umode_t mode)
663{
664 struct kernfs_node *parent = dir->i_private;
665 struct kernfs_dir_ops *kdops = kernfs_root(parent)->dir_ops;
666
667 if (!kdops || !kdops->mkdir)
668 return -EPERM;
669
670 return kdops->mkdir(parent, dentry->d_name.name, mode);
671}
672
673static int kernfs_iop_rmdir(struct inode *dir, struct dentry *dentry)
674{
675 struct kernfs_node *kn = dentry->d_fsdata;
676 struct kernfs_dir_ops *kdops = kernfs_root(kn)->dir_ops;
677
678 if (!kdops || !kdops->rmdir)
679 return -EPERM;
680
681 return kdops->rmdir(kn);
682}
683
684static int kernfs_iop_rename(struct inode *old_dir, struct dentry *old_dentry,
685 struct inode *new_dir, struct dentry *new_dentry)
686{
687 struct kernfs_node *kn = old_dentry->d_fsdata;
688 struct kernfs_node *new_parent = new_dir->i_private;
689 struct kernfs_dir_ops *kdops = kernfs_root(kn)->dir_ops;
690
691 if (!kdops || !kdops->rename)
692 return -EPERM;
693
694 return kdops->rename(kn, new_parent, new_dentry->d_name.name);
695}
696
a797bfc3 697const struct inode_operations kernfs_dir_iops = {
c637b8ac
TH
698 .lookup = kernfs_iop_lookup,
699 .permission = kernfs_iop_permission,
700 .setattr = kernfs_iop_setattr,
701 .getattr = kernfs_iop_getattr,
702 .setxattr = kernfs_iop_setxattr,
703 .removexattr = kernfs_iop_removexattr,
704 .getxattr = kernfs_iop_getxattr,
705 .listxattr = kernfs_iop_listxattr,
80b9bbef
TH
706
707 .mkdir = kernfs_iop_mkdir,
708 .rmdir = kernfs_iop_rmdir,
709 .rename = kernfs_iop_rename,
fd7b9f7b
TH
710};
711
c637b8ac 712static struct kernfs_node *kernfs_leftmost_descendant(struct kernfs_node *pos)
fd7b9f7b 713{
324a56e1 714 struct kernfs_node *last;
fd7b9f7b
TH
715
716 while (true) {
717 struct rb_node *rbn;
718
719 last = pos;
720
df23fc39 721 if (kernfs_type(pos) != KERNFS_DIR)
fd7b9f7b
TH
722 break;
723
adc5e8b5 724 rbn = rb_first(&pos->dir.children);
fd7b9f7b
TH
725 if (!rbn)
726 break;
727
324a56e1 728 pos = rb_to_kn(rbn);
fd7b9f7b
TH
729 }
730
731 return last;
732}
733
734/**
c637b8ac 735 * kernfs_next_descendant_post - find the next descendant for post-order walk
fd7b9f7b 736 * @pos: the current position (%NULL to initiate traversal)
324a56e1 737 * @root: kernfs_node whose descendants to walk
fd7b9f7b
TH
738 *
739 * Find the next descendant to visit for post-order traversal of @root's
740 * descendants. @root is included in the iteration and the last node to be
741 * visited.
742 */
c637b8ac
TH
743static struct kernfs_node *kernfs_next_descendant_post(struct kernfs_node *pos,
744 struct kernfs_node *root)
fd7b9f7b
TH
745{
746 struct rb_node *rbn;
747
a797bfc3 748 lockdep_assert_held(&kernfs_mutex);
fd7b9f7b
TH
749
750 /* if first iteration, visit leftmost descendant which may be root */
751 if (!pos)
c637b8ac 752 return kernfs_leftmost_descendant(root);
fd7b9f7b
TH
753
754 /* if we visited @root, we're done */
755 if (pos == root)
756 return NULL;
757
758 /* if there's an unvisited sibling, visit its leftmost descendant */
adc5e8b5 759 rbn = rb_next(&pos->rb);
fd7b9f7b 760 if (rbn)
c637b8ac 761 return kernfs_leftmost_descendant(rb_to_kn(rbn));
fd7b9f7b
TH
762
763 /* no sibling left, visit parent */
adc5e8b5 764 return pos->parent;
fd7b9f7b
TH
765}
766
45a140e5
TH
767static void __kernfs_deactivate(struct kernfs_node *kn)
768{
769 struct kernfs_node *pos;
770
771 lockdep_assert_held(&kernfs_mutex);
772
773 /* prevent any new usage under @kn by deactivating all nodes */
774 pos = NULL;
775 while ((pos = kernfs_next_descendant_post(pos, kn))) {
9b0925a6 776 if (atomic_read(&pos->active) >= 0) {
45a140e5
TH
777 atomic_add(KN_DEACTIVATED_BIAS, &pos->active);
778 pos->flags |= KERNFS_JUST_DEACTIVATED;
779 }
780 }
781
782 /*
783 * Drain the subtree. If kernfs_drain() blocked to drain, which is
784 * indicated by %true return, it temporarily released kernfs_mutex
785 * and the rbtree might have been modified inbetween breaking our
786 * future walk. Restart the walk after each %true return.
787 */
788 pos = NULL;
789 while ((pos = kernfs_next_descendant_post(pos, kn))) {
790 bool drained;
791
792 kernfs_get(pos);
793 drained = kernfs_drain(pos);
794 kernfs_put(pos);
795 if (drained)
796 pos = NULL;
797 }
798}
799
99177a34 800static void __kernfs_remove(struct kernfs_node *kn)
fd7b9f7b 801{
895a068a 802 struct kernfs_root *root = kernfs_root(kn);
45a140e5
TH
803 struct kernfs_node *pos;
804
805 lockdep_assert_held(&kernfs_mutex);
fd7b9f7b 806
ce9b499c
GKH
807 if (!kn)
808 return;
809
c637b8ac 810 pr_debug("kernfs %s: removing\n", kn->name);
fd7b9f7b 811
45a140e5
TH
812 __kernfs_deactivate(kn);
813
814 /* unlink the subtree node-by-node */
fd7b9f7b 815 do {
45a140e5
TH
816 pos = kernfs_leftmost_descendant(kn);
817
f601f9a2
TH
818 /*
819 * We're gonna release kernfs_mutex to unmap bin files,
820 * Make sure @pos doesn't go away inbetween.
821 */
822 kernfs_get(pos);
823
824 /*
825 * This must be come before unlinking; otherwise, when
826 * there are multiple removers, some may finish before
827 * unmapping is complete.
828 */
829 if (pos->flags & KERNFS_HAS_MMAP) {
830 mutex_unlock(&kernfs_mutex);
831 kernfs_unmap_file(pos);
832 mutex_lock(&kernfs_mutex);
833 }
834
835 /*
836 * kernfs_unlink_sibling() succeeds once per node. Use it
837 * to decide who's responsible for cleanups.
838 */
839 if (!pos->parent || kernfs_unlink_sibling(pos)) {
840 struct kernfs_iattrs *ps_iattr =
841 pos->parent ? pos->parent->iattr : NULL;
45a140e5
TH
842
843 /* update timestamps on the parent */
45a140e5
TH
844 if (ps_iattr) {
845 ps_iattr->ia_iattr.ia_ctime = CURRENT_TIME;
846 ps_iattr->ia_iattr.ia_mtime = CURRENT_TIME;
847 }
f601f9a2 848
99177a34 849 kernfs_put(pos);
45a140e5
TH
850 }
851
f601f9a2 852 kernfs_put(pos);
45a140e5 853 } while (pos != kn);
895a068a
TH
854
855 /* some nodes killed, kick get_active waiters */
856 wake_up_all(&root->deactivate_waitq);
fd7b9f7b
TH
857}
858
859/**
324a56e1
TH
860 * kernfs_remove - remove a kernfs_node recursively
861 * @kn: the kernfs_node to remove
fd7b9f7b 862 *
324a56e1 863 * Remove @kn along with all its subdirectories and files.
fd7b9f7b 864 */
324a56e1 865void kernfs_remove(struct kernfs_node *kn)
fd7b9f7b 866{
99177a34
TH
867 mutex_lock(&kernfs_mutex);
868 __kernfs_remove(kn);
869 mutex_unlock(&kernfs_mutex);
fd7b9f7b
TH
870}
871
872/**
324a56e1
TH
873 * kernfs_remove_by_name_ns - find a kernfs_node by name and remove it
874 * @parent: parent of the target
875 * @name: name of the kernfs_node to remove
876 * @ns: namespace tag of the kernfs_node to remove
fd7b9f7b 877 *
324a56e1
TH
878 * Look for the kernfs_node with @name and @ns under @parent and remove it.
879 * Returns 0 on success, -ENOENT if such entry doesn't exist.
fd7b9f7b 880 */
324a56e1 881int kernfs_remove_by_name_ns(struct kernfs_node *parent, const char *name,
fd7b9f7b
TH
882 const void *ns)
883{
324a56e1 884 struct kernfs_node *kn;
fd7b9f7b 885
324a56e1 886 if (!parent) {
c637b8ac 887 WARN(1, KERN_WARNING "kernfs: can not remove '%s', no directory\n",
fd7b9f7b
TH
888 name);
889 return -ENOENT;
890 }
891
99177a34 892 mutex_lock(&kernfs_mutex);
fd7b9f7b 893
324a56e1
TH
894 kn = kernfs_find_ns(parent, name, ns);
895 if (kn)
99177a34 896 __kernfs_remove(kn);
fd7b9f7b 897
99177a34 898 mutex_unlock(&kernfs_mutex);
fd7b9f7b 899
324a56e1 900 if (kn)
fd7b9f7b
TH
901 return 0;
902 else
903 return -ENOENT;
904}
905
906/**
907 * kernfs_rename_ns - move and rename a kernfs_node
324a56e1 908 * @kn: target node
fd7b9f7b
TH
909 * @new_parent: new parent to put @sd under
910 * @new_name: new name
911 * @new_ns: new namespace tag
912 */
324a56e1 913int kernfs_rename_ns(struct kernfs_node *kn, struct kernfs_node *new_parent,
fd7b9f7b
TH
914 const char *new_name, const void *new_ns)
915{
916 int error;
917
d0ae3d43 918 error = -ENOENT;
ae34372e 919 if (!kernfs_get_active(new_parent))
d0ae3d43 920 goto out;
ae34372e
TH
921 if (!kernfs_get_active(kn))
922 goto out_put_new_parent;
923
924 mutex_lock(&kernfs_mutex);
d0ae3d43 925
fd7b9f7b 926 error = 0;
adc5e8b5
TH
927 if ((kn->parent == new_parent) && (kn->ns == new_ns) &&
928 (strcmp(kn->name, new_name) == 0))
ae34372e 929 goto out_unlock; /* nothing to rename */
fd7b9f7b
TH
930
931 error = -EEXIST;
932 if (kernfs_find_ns(new_parent, new_name, new_ns))
ae34372e 933 goto out_unlock;
fd7b9f7b 934
324a56e1 935 /* rename kernfs_node */
adc5e8b5 936 if (strcmp(kn->name, new_name) != 0) {
fd7b9f7b
TH
937 error = -ENOMEM;
938 new_name = kstrdup(new_name, GFP_KERNEL);
939 if (!new_name)
ae34372e 940 goto out_unlock;
fd7b9f7b 941
47a52e91
TH
942 if (kn->flags & KERNFS_STATIC_NAME)
943 kn->flags &= ~KERNFS_STATIC_NAME;
944 else
945 kfree(kn->name);
946
adc5e8b5 947 kn->name = new_name;
fd7b9f7b
TH
948 }
949
950 /*
951 * Move to the appropriate place in the appropriate directories rbtree.
952 */
c637b8ac 953 kernfs_unlink_sibling(kn);
fd7b9f7b 954 kernfs_get(new_parent);
adc5e8b5
TH
955 kernfs_put(kn->parent);
956 kn->ns = new_ns;
c637b8ac 957 kn->hash = kernfs_name_hash(kn->name, kn->ns);
adc5e8b5 958 kn->parent = new_parent;
c637b8ac 959 kernfs_link_sibling(kn);
fd7b9f7b
TH
960
961 error = 0;
ae34372e 962out_unlock:
a797bfc3 963 mutex_unlock(&kernfs_mutex);
ae34372e
TH
964 kernfs_put_active(kn);
965out_put_new_parent:
966 kernfs_put_active(new_parent);
967out:
fd7b9f7b
TH
968 return error;
969}
970
fd7b9f7b 971/* Relationship between s_mode and the DT_xxx types */
324a56e1 972static inline unsigned char dt_type(struct kernfs_node *kn)
fd7b9f7b 973{
adc5e8b5 974 return (kn->mode >> 12) & 15;
fd7b9f7b
TH
975}
976
c637b8ac 977static int kernfs_dir_fop_release(struct inode *inode, struct file *filp)
fd7b9f7b
TH
978{
979 kernfs_put(filp->private_data);
980 return 0;
981}
982
c637b8ac 983static struct kernfs_node *kernfs_dir_pos(const void *ns,
324a56e1 984 struct kernfs_node *parent, loff_t hash, struct kernfs_node *pos)
fd7b9f7b
TH
985{
986 if (pos) {
ae34372e 987 int valid = pos->parent == parent && hash == pos->hash;
fd7b9f7b
TH
988 kernfs_put(pos);
989 if (!valid)
990 pos = NULL;
991 }
992 if (!pos && (hash > 1) && (hash < INT_MAX)) {
adc5e8b5 993 struct rb_node *node = parent->dir.children.rb_node;
fd7b9f7b 994 while (node) {
324a56e1 995 pos = rb_to_kn(node);
fd7b9f7b 996
adc5e8b5 997 if (hash < pos->hash)
fd7b9f7b 998 node = node->rb_left;
adc5e8b5 999 else if (hash > pos->hash)
fd7b9f7b
TH
1000 node = node->rb_right;
1001 else
1002 break;
1003 }
1004 }
1005 /* Skip over entries in the wrong namespace */
adc5e8b5
TH
1006 while (pos && pos->ns != ns) {
1007 struct rb_node *node = rb_next(&pos->rb);
fd7b9f7b
TH
1008 if (!node)
1009 pos = NULL;
1010 else
324a56e1 1011 pos = rb_to_kn(node);
fd7b9f7b
TH
1012 }
1013 return pos;
1014}
1015
c637b8ac 1016static struct kernfs_node *kernfs_dir_next_pos(const void *ns,
324a56e1 1017 struct kernfs_node *parent, ino_t ino, struct kernfs_node *pos)
fd7b9f7b 1018{
c637b8ac 1019 pos = kernfs_dir_pos(ns, parent, ino, pos);
fd7b9f7b
TH
1020 if (pos)
1021 do {
adc5e8b5 1022 struct rb_node *node = rb_next(&pos->rb);
fd7b9f7b
TH
1023 if (!node)
1024 pos = NULL;
1025 else
324a56e1 1026 pos = rb_to_kn(node);
adc5e8b5 1027 } while (pos && pos->ns != ns);
fd7b9f7b
TH
1028 return pos;
1029}
1030
c637b8ac 1031static int kernfs_fop_readdir(struct file *file, struct dir_context *ctx)
fd7b9f7b
TH
1032{
1033 struct dentry *dentry = file->f_path.dentry;
324a56e1
TH
1034 struct kernfs_node *parent = dentry->d_fsdata;
1035 struct kernfs_node *pos = file->private_data;
fd7b9f7b
TH
1036 const void *ns = NULL;
1037
1038 if (!dir_emit_dots(file, ctx))
1039 return 0;
a797bfc3 1040 mutex_lock(&kernfs_mutex);
fd7b9f7b 1041
324a56e1 1042 if (kernfs_ns_enabled(parent))
c525aadd 1043 ns = kernfs_info(dentry->d_sb)->ns;
fd7b9f7b 1044
c637b8ac 1045 for (pos = kernfs_dir_pos(ns, parent, ctx->pos, pos);
fd7b9f7b 1046 pos;
c637b8ac 1047 pos = kernfs_dir_next_pos(ns, parent, ctx->pos, pos)) {
adc5e8b5 1048 const char *name = pos->name;
fd7b9f7b
TH
1049 unsigned int type = dt_type(pos);
1050 int len = strlen(name);
adc5e8b5 1051 ino_t ino = pos->ino;
fd7b9f7b 1052
adc5e8b5 1053 ctx->pos = pos->hash;
fd7b9f7b
TH
1054 file->private_data = pos;
1055 kernfs_get(pos);
1056
a797bfc3 1057 mutex_unlock(&kernfs_mutex);
fd7b9f7b
TH
1058 if (!dir_emit(ctx, name, len, ino, type))
1059 return 0;
a797bfc3 1060 mutex_lock(&kernfs_mutex);
fd7b9f7b 1061 }
a797bfc3 1062 mutex_unlock(&kernfs_mutex);
fd7b9f7b
TH
1063 file->private_data = NULL;
1064 ctx->pos = INT_MAX;
1065 return 0;
1066}
1067
c637b8ac
TH
1068static loff_t kernfs_dir_fop_llseek(struct file *file, loff_t offset,
1069 int whence)
fd7b9f7b
TH
1070{
1071 struct inode *inode = file_inode(file);
1072 loff_t ret;
1073
1074 mutex_lock(&inode->i_mutex);
1075 ret = generic_file_llseek(file, offset, whence);
1076 mutex_unlock(&inode->i_mutex);
1077
1078 return ret;
1079}
1080
a797bfc3 1081const struct file_operations kernfs_dir_fops = {
fd7b9f7b 1082 .read = generic_read_dir,
c637b8ac
TH
1083 .iterate = kernfs_fop_readdir,
1084 .release = kernfs_dir_fop_release,
1085 .llseek = kernfs_dir_fop_llseek,
fd7b9f7b 1086};
This page took 0.176622 seconds and 5 git commands to generate.