Commit | Line | Data |
---|---|---|
d7e09d03 PT |
1 | /* |
2 | * GPL HEADER START | |
3 | * | |
4 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. | |
5 | * | |
6 | * This program is free software; you can redistribute it and/or modify | |
7 | * it under the terms of the GNU General Public License version 2 only, | |
8 | * as published by the Free Software Foundation. | |
9 | * | |
10 | * This program is distributed in the hope that it will be useful, but | |
11 | * WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
13 | * General Public License version 2 for more details (a copy is included | |
14 | * in the LICENSE file that accompanied this code). | |
15 | * | |
16 | * You should have received a copy of the GNU General Public License | |
17 | * version 2 along with this program; If not, see | |
18 | * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf | |
19 | * | |
20 | * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, | |
21 | * CA 95054 USA or visit www.sun.com if you need additional information or | |
22 | * have any questions. | |
23 | * | |
24 | * GPL HEADER END | |
25 | */ | |
26 | /* | |
27 | * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved. | |
28 | * Use is subject to license terms. | |
29 | * | |
30 | * Copyright (c) 2011, 2012, Intel Corporation. | |
31 | */ | |
32 | /* | |
33 | * This file is part of Lustre, http://www.lustre.org/ | |
34 | * Lustre is a trademark of Sun Microsystems, Inc. | |
35 | */ | |
36 | ||
37 | #include <linux/fs.h> | |
38 | #include <linux/sched.h> | |
39 | #include <linux/mm.h> | |
40 | #include <linux/quotaops.h> | |
41 | #include <linux/highmem.h> | |
42 | #include <linux/pagemap.h> | |
43 | #include <linux/security.h> | |
44 | ||
45 | #define DEBUG_SUBSYSTEM S_LLITE | |
46 | ||
47 | #include <obd_support.h> | |
48 | #include <lustre_fid.h> | |
49 | #include <lustre_lite.h> | |
50 | #include <lustre_dlm.h> | |
51 | #include <lustre_ver.h> | |
52 | #include "llite_internal.h" | |
53 | ||
54 | static int ll_create_it(struct inode *, struct dentry *, | |
55 | int, struct lookup_intent *); | |
56 | ||
/*
 * Report whether something is mounted on the named child.
 *
 * If the caller already has the child dentry (@dchild) it is queried
 * directly; otherwise the child is looked up by @name under @dparent.
 * A mounted child always has a dentry, so a failed lookup means
 * "not mounted".  Returns the d_mountpoint() result, or 0.
 */
static int ll_d_mountpoint(struct dentry *dparent, struct dentry *dchild,
			   struct qstr *name)
{
	struct dentry *found;
	int mounted;

	if (unlikely(dchild))
		return d_mountpoint(dchild);

	if (!dparent)
		return 0;

	found = d_lookup(dparent, name);
	if (!found)
		return 0;

	mounted = d_mountpoint(found);
	dput(found);	/* pairs with the successful d_lookup() above */

	return mounted;
}
77 | ||
78 | int ll_unlock(__u32 mode, struct lustre_handle *lockh) | |
79 | { | |
80 | ENTRY; | |
81 | ||
82 | ldlm_lock_decref(lockh, mode); | |
83 | ||
84 | RETURN(0); | |
85 | } | |
86 | ||
87 | ||
88 | /* called from iget5_locked->find_inode() under inode_lock spinlock */ | |
89 | static int ll_test_inode(struct inode *inode, void *opaque) | |
90 | { | |
91 | struct ll_inode_info *lli = ll_i2info(inode); | |
92 | struct lustre_md *md = opaque; | |
93 | ||
94 | if (unlikely(!(md->body->valid & OBD_MD_FLID))) { | |
95 | CERROR("MDS body missing FID\n"); | |
96 | return 0; | |
97 | } | |
98 | ||
99 | if (!lu_fid_eq(&lli->lli_fid, &md->body->fid1)) | |
100 | return 0; | |
101 | ||
102 | return 1; | |
103 | } | |
104 | ||
105 | static int ll_set_inode(struct inode *inode, void *opaque) | |
106 | { | |
107 | struct ll_inode_info *lli = ll_i2info(inode); | |
108 | struct mdt_body *body = ((struct lustre_md *)opaque)->body; | |
109 | ||
110 | if (unlikely(!(body->valid & OBD_MD_FLID))) { | |
111 | CERROR("MDS body missing FID\n"); | |
112 | return -EINVAL; | |
113 | } | |
114 | ||
115 | lli->lli_fid = body->fid1; | |
116 | if (unlikely(!(body->valid & OBD_MD_FLTYPE))) { | |
117 | CERROR("Can not initialize inode "DFID" without object type: " | |
118 | "valid = "LPX64"\n", PFID(&lli->lli_fid), body->valid); | |
119 | return -EINVAL; | |
120 | } | |
121 | ||
122 | inode->i_mode = (inode->i_mode & ~S_IFMT) | (body->mode & S_IFMT); | |
123 | if (unlikely(inode->i_mode == 0)) { | |
124 | CERROR("Invalid inode "DFID" type\n", PFID(&lli->lli_fid)); | |
125 | return -EINVAL; | |
126 | } | |
127 | ||
128 | ll_lli_init(lli); | |
129 | ||
130 | return 0; | |
131 | } | |
132 | ||
133 | ||
134 | /* | |
135 | * Get an inode by inode number (already instantiated by the intent lookup). | |
136 | * Returns inode or NULL | |
137 | */ | |
138 | struct inode *ll_iget(struct super_block *sb, ino_t hash, | |
139 | struct lustre_md *md) | |
140 | { | |
141 | struct inode *inode; | |
142 | ENTRY; | |
143 | ||
144 | LASSERT(hash != 0); | |
145 | inode = iget5_locked(sb, hash, ll_test_inode, ll_set_inode, md); | |
146 | ||
147 | if (inode) { | |
148 | if (inode->i_state & I_NEW) { | |
149 | int rc = 0; | |
150 | ||
151 | ll_read_inode2(inode, md); | |
152 | if (S_ISREG(inode->i_mode) && | |
153 | ll_i2info(inode)->lli_clob == NULL) { | |
154 | CDEBUG(D_INODE, | |
155 | "%s: apply lsm %p to inode "DFID".\n", | |
156 | ll_get_fsname(sb, NULL, 0), md->lsm, | |
157 | PFID(ll_inode2fid(inode))); | |
158 | rc = cl_file_inode_init(inode, md); | |
159 | } | |
160 | if (rc != 0) { | |
161 | make_bad_inode(inode); | |
162 | unlock_new_inode(inode); | |
163 | iput(inode); | |
164 | inode = ERR_PTR(rc); | |
165 | } else | |
166 | unlock_new_inode(inode); | |
167 | } else if (!(inode->i_state & (I_FREEING | I_CLEAR))) | |
168 | ll_update_inode(inode, md); | |
169 | CDEBUG(D_VFSTRACE, "got inode: %p for "DFID"\n", | |
170 | inode, PFID(&md->body->fid1)); | |
171 | } | |
172 | RETURN(inode); | |
173 | } | |
174 | ||
175 | static void ll_invalidate_negative_children(struct inode *dir) | |
176 | { | |
177 | struct dentry *dentry, *tmp_subdir; | |
178 | struct ll_d_hlist_node *p; | |
179 | ||
180 | ll_lock_dcache(dir); | |
181 | ll_d_hlist_for_each_entry(dentry, p, &dir->i_dentry, d_alias) { | |
182 | spin_lock(&dentry->d_lock); | |
183 | if (!list_empty(&dentry->d_subdirs)) { | |
184 | struct dentry *child; | |
185 | ||
186 | list_for_each_entry_safe(child, tmp_subdir, | |
187 | &dentry->d_subdirs, | |
188 | d_u.d_child) { | |
189 | if (child->d_inode == NULL) | |
190 | d_lustre_invalidate(child); | |
191 | } | |
192 | } | |
193 | spin_unlock(&dentry->d_lock); | |
194 | } | |
195 | ll_unlock_dcache(dir); | |
196 | } | |
197 | ||
198 | int ll_md_blocking_ast(struct ldlm_lock *lock, struct ldlm_lock_desc *desc, | |
199 | void *data, int flag) | |
200 | { | |
201 | int rc; | |
202 | struct lustre_handle lockh; | |
203 | ENTRY; | |
204 | ||
205 | switch (flag) { | |
206 | case LDLM_CB_BLOCKING: | |
207 | ldlm_lock2handle(lock, &lockh); | |
208 | rc = ldlm_cli_cancel(&lockh, LCF_ASYNC); | |
209 | if (rc < 0) { | |
210 | CDEBUG(D_INODE, "ldlm_cli_cancel: %d\n", rc); | |
211 | RETURN(rc); | |
212 | } | |
213 | break; | |
214 | case LDLM_CB_CANCELING: { | |
215 | struct inode *inode = ll_inode_from_resource_lock(lock); | |
216 | struct ll_inode_info *lli; | |
217 | __u64 bits = lock->l_policy_data.l_inodebits.bits; | |
218 | struct lu_fid *fid; | |
219 | ldlm_mode_t mode = lock->l_req_mode; | |
220 | ||
221 | /* Inode is set to lock->l_resource->lr_lvb_inode | |
222 | * for mdc - bug 24555 */ | |
223 | LASSERT(lock->l_ast_data == NULL); | |
224 | ||
225 | /* Invalidate all dentries associated with this inode */ | |
226 | if (inode == NULL) | |
227 | break; | |
228 | ||
229 | LASSERT(lock->l_flags & LDLM_FL_CANCELING); | |
230 | /* For OPEN locks we differentiate between lock modes | |
231 | * LCK_CR, LCK_CW, LCK_PR - bug 22891 */ | |
232 | if (bits & (MDS_INODELOCK_LOOKUP | MDS_INODELOCK_UPDATE | | |
233 | MDS_INODELOCK_LAYOUT | MDS_INODELOCK_PERM)) | |
234 | ll_have_md_lock(inode, &bits, LCK_MINMODE); | |
235 | ||
236 | if (bits & MDS_INODELOCK_OPEN) | |
237 | ll_have_md_lock(inode, &bits, mode); | |
238 | ||
239 | fid = ll_inode2fid(inode); | |
240 | if (lock->l_resource->lr_name.name[0] != fid_seq(fid) || | |
241 | lock->l_resource->lr_name.name[1] != fid_oid(fid) || | |
242 | lock->l_resource->lr_name.name[2] != fid_ver(fid)) { | |
243 | LDLM_ERROR(lock, "data mismatch with object " | |
244 | DFID" (%p)", PFID(fid), inode); | |
245 | } | |
246 | ||
247 | if (bits & MDS_INODELOCK_OPEN) { | |
248 | int flags = 0; | |
249 | switch (lock->l_req_mode) { | |
250 | case LCK_CW: | |
251 | flags = FMODE_WRITE; | |
252 | break; | |
253 | case LCK_PR: | |
254 | flags = FMODE_EXEC; | |
255 | break; | |
256 | case LCK_CR: | |
257 | flags = FMODE_READ; | |
258 | break; | |
259 | default: | |
260 | CERROR("Unexpected lock mode for OPEN lock " | |
261 | "%d, inode %ld\n", lock->l_req_mode, | |
262 | inode->i_ino); | |
263 | } | |
264 | ll_md_real_close(inode, flags); | |
265 | } | |
266 | ||
267 | lli = ll_i2info(inode); | |
268 | if (bits & MDS_INODELOCK_LAYOUT) { | |
269 | struct cl_object_conf conf = { { 0 } }; | |
270 | ||
271 | conf.coc_opc = OBJECT_CONF_INVALIDATE; | |
272 | conf.coc_inode = inode; | |
273 | rc = ll_layout_conf(inode, &conf); | |
274 | if (rc) | |
275 | CDEBUG(D_INODE, "invaliding layout %d.\n", rc); | |
276 | } | |
277 | ||
278 | if (bits & MDS_INODELOCK_UPDATE) | |
279 | lli->lli_flags &= ~LLIF_MDS_SIZE_LOCK; | |
280 | ||
281 | if (S_ISDIR(inode->i_mode) && | |
282 | (bits & MDS_INODELOCK_UPDATE)) { | |
283 | CDEBUG(D_INODE, "invalidating inode %lu\n", | |
284 | inode->i_ino); | |
285 | truncate_inode_pages(inode->i_mapping, 0); | |
286 | ll_invalidate_negative_children(inode); | |
287 | } | |
288 | ||
289 | if (inode->i_sb->s_root && | |
290 | inode != inode->i_sb->s_root->d_inode && | |
291 | (bits & (MDS_INODELOCK_LOOKUP | MDS_INODELOCK_PERM))) | |
292 | ll_invalidate_aliases(inode); | |
293 | iput(inode); | |
294 | break; | |
295 | } | |
296 | default: | |
297 | LBUG(); | |
298 | } | |
299 | ||
300 | RETURN(0); | |
301 | } | |
302 | ||
303 | __u32 ll_i2suppgid(struct inode *i) | |
304 | { | |
305 | if (current_is_in_group(i->i_gid)) | |
306 | return (__u32)i->i_gid; | |
307 | else | |
308 | return (__u32)(-1); | |
309 | } | |
310 | ||
311 | /* Pack the required supplementary groups into the supplied groups array. | |
312 | * If we don't need to use the groups from the target inode(s) then we | |
313 | * instead pack one or more groups from the user's supplementary group | |
314 | * array in case it might be useful. Not needed if doing an MDS-side upcall. */ | |
315 | void ll_i2gids(__u32 *suppgids, struct inode *i1, struct inode *i2) | |
316 | { | |
317 | #if 0 | |
318 | int i; | |
319 | #endif | |
320 | ||
321 | LASSERT(i1 != NULL); | |
322 | LASSERT(suppgids != NULL); | |
323 | ||
324 | suppgids[0] = ll_i2suppgid(i1); | |
325 | ||
326 | if (i2) | |
327 | suppgids[1] = ll_i2suppgid(i2); | |
328 | else | |
329 | suppgids[1] = -1; | |
330 | ||
331 | #if 0 | |
332 | for (i = 0; i < current_ngroups; i++) { | |
333 | if (suppgids[0] == -1) { | |
334 | if (current_groups[i] != suppgids[1]) | |
335 | suppgids[0] = current_groups[i]; | |
336 | continue; | |
337 | } | |
338 | if (suppgids[1] == -1) { | |
339 | if (current_groups[i] != suppgids[0]) | |
340 | suppgids[1] = current_groups[i]; | |
341 | continue; | |
342 | } | |
343 | break; | |
344 | } | |
345 | #endif | |
346 | } | |
347 | ||
348 | /* | |
349 | * try to reuse three types of dentry: | |
350 | * 1. unhashed alias, this one is unhashed by d_invalidate (but it may be valid | |
351 | * by concurrent .revalidate). | |
352 | * 2. INVALID alias (common case for no valid ldlm lock held, but this flag may | |
353 | * be cleared by others calling d_lustre_revalidate). | |
354 | * 3. DISCONNECTED alias. | |
355 | */ | |
356 | static struct dentry *ll_find_alias(struct inode *inode, struct dentry *dentry) | |
357 | { | |
358 | struct dentry *alias, *discon_alias, *invalid_alias; | |
359 | struct ll_d_hlist_node *p; | |
360 | ||
361 | if (ll_d_hlist_empty(&inode->i_dentry)) | |
362 | return NULL; | |
363 | ||
364 | discon_alias = invalid_alias = NULL; | |
365 | ||
366 | ll_lock_dcache(inode); | |
367 | ll_d_hlist_for_each_entry(alias, p, &inode->i_dentry, d_alias) { | |
368 | LASSERT(alias != dentry); | |
369 | ||
370 | spin_lock(&alias->d_lock); | |
371 | if (alias->d_flags & DCACHE_DISCONNECTED) | |
372 | /* LASSERT(last_discon == NULL); LU-405, bz 20055 */ | |
373 | discon_alias = alias; | |
374 | else if (alias->d_parent == dentry->d_parent && | |
375 | alias->d_name.hash == dentry->d_name.hash && | |
376 | alias->d_name.len == dentry->d_name.len && | |
377 | memcmp(alias->d_name.name, dentry->d_name.name, | |
378 | dentry->d_name.len) == 0) | |
379 | invalid_alias = alias; | |
380 | spin_unlock(&alias->d_lock); | |
381 | ||
382 | if (invalid_alias) | |
383 | break; | |
384 | } | |
385 | alias = invalid_alias ?: discon_alias ?: NULL; | |
386 | if (alias) { | |
387 | spin_lock(&alias->d_lock); | |
388 | dget_dlock(alias); | |
389 | spin_unlock(&alias->d_lock); | |
390 | } | |
391 | ll_unlock_dcache(inode); | |
392 | ||
393 | return alias; | |
394 | } | |
395 | ||
396 | /* | |
397 | * Similar to d_splice_alias(), but lustre treats invalid alias | |
398 | * similar to DCACHE_DISCONNECTED, and tries to use it anyway. | |
399 | */ | |
400 | struct dentry *ll_splice_alias(struct inode *inode, struct dentry *de) | |
401 | { | |
402 | struct dentry *new; | |
403 | ||
404 | if (inode) { | |
405 | new = ll_find_alias(inode, de); | |
406 | if (new) { | |
407 | ll_dops_init(new, 1, 1); | |
408 | d_move(new, de); | |
409 | iput(inode); | |
410 | CDEBUG(D_DENTRY, | |
411 | "Reuse dentry %p inode %p refc %d flags %#x\n", | |
412 | new, new->d_inode, d_refcount(new), new->d_flags); | |
413 | return new; | |
414 | } | |
415 | } | |
416 | ll_dops_init(de, 1, 1); | |
417 | __d_lustre_invalidate(de); | |
418 | d_add(de, inode); | |
419 | CDEBUG(D_DENTRY, "Add dentry %p inode %p refc %d flags %#x\n", | |
420 | de, de->d_inode, d_refcount(de), de->d_flags); | |
421 | return de; | |
422 | } | |
423 | ||
424 | int ll_lookup_it_finish(struct ptlrpc_request *request, | |
425 | struct lookup_intent *it, void *data) | |
426 | { | |
427 | struct it_cb_data *icbd = data; | |
428 | struct dentry **de = icbd->icbd_childp; | |
429 | struct inode *parent = icbd->icbd_parent; | |
430 | struct inode *inode = NULL; | |
431 | __u64 bits = 0; | |
432 | int rc; | |
433 | ENTRY; | |
434 | ||
435 | /* NB 1 request reference will be taken away by ll_intent_lock() | |
436 | * when I return */ | |
437 | CDEBUG(D_DENTRY, "it %p it_disposition %x\n", it, | |
438 | it->d.lustre.it_disposition); | |
439 | if (!it_disposition(it, DISP_LOOKUP_NEG)) { | |
440 | rc = ll_prep_inode(&inode, request, (*de)->d_sb, it); | |
441 | if (rc) | |
442 | RETURN(rc); | |
443 | ||
444 | ll_set_lock_data(ll_i2sbi(parent)->ll_md_exp, inode, it, &bits); | |
445 | ||
446 | /* We used to query real size from OSTs here, but actually | |
447 | this is not needed. For stat() calls size would be updated | |
448 | from subsequent do_revalidate()->ll_inode_revalidate_it() in | |
449 | 2.4 and | |
450 | vfs_getattr_it->ll_getattr()->ll_inode_revalidate_it() in 2.6 | |
451 | Everybody else who needs correct file size would call | |
452 | ll_glimpse_size or some equivalent themselves anyway. | |
453 | Also see bug 7198. */ | |
454 | } | |
455 | ||
456 | /* Only hash *de if it is unhashed (new dentry). | |
457 | * Atoimc_open may passin hashed dentries for open. | |
458 | */ | |
459 | if (d_unhashed(*de)) | |
460 | *de = ll_splice_alias(inode, *de); | |
461 | ||
462 | if (!it_disposition(it, DISP_LOOKUP_NEG)) { | |
463 | /* we have lookup look - unhide dentry */ | |
464 | if (bits & MDS_INODELOCK_LOOKUP) | |
465 | d_lustre_revalidate(*de); | |
466 | } else if (!it_disposition(it, DISP_OPEN_CREATE)) { | |
467 | /* If file created on server, don't depend on parent UPDATE | |
468 | * lock to unhide it. It is left hidden and next lookup can | |
469 | * find it in ll_splice_alias. | |
470 | */ | |
471 | /* Check that parent has UPDATE lock. */ | |
472 | struct lookup_intent parent_it = { | |
473 | .it_op = IT_GETATTR, | |
474 | .d.lustre.it_lock_handle = 0 }; | |
475 | ||
476 | if (md_revalidate_lock(ll_i2mdexp(parent), &parent_it, | |
477 | &ll_i2info(parent)->lli_fid, NULL)) { | |
478 | d_lustre_revalidate(*de); | |
479 | ll_intent_release(&parent_it); | |
480 | } | |
481 | } | |
482 | ||
483 | RETURN(0); | |
484 | } | |
485 | ||
486 | static struct dentry *ll_lookup_it(struct inode *parent, struct dentry *dentry, | |
487 | struct lookup_intent *it, int lookup_flags) | |
488 | { | |
489 | struct lookup_intent lookup_it = { .it_op = IT_LOOKUP }; | |
490 | struct dentry *save = dentry, *retval; | |
491 | struct ptlrpc_request *req = NULL; | |
492 | struct md_op_data *op_data; | |
493 | struct it_cb_data icbd; | |
494 | __u32 opc; | |
495 | int rc; | |
496 | ENTRY; | |
497 | ||
498 | if (dentry->d_name.len > ll_i2sbi(parent)->ll_namelen) | |
499 | RETURN(ERR_PTR(-ENAMETOOLONG)); | |
500 | ||
501 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p),intent=%s\n", | |
502 | dentry->d_name.len, dentry->d_name.name, parent->i_ino, | |
503 | parent->i_generation, parent, LL_IT2STR(it)); | |
504 | ||
505 | if (d_mountpoint(dentry)) | |
506 | CERROR("Tell Peter, lookup on mtpt, it %s\n", LL_IT2STR(it)); | |
507 | ||
508 | ll_frob_intent(&it, &lookup_it); | |
509 | ||
510 | /* As do_lookup is called before follow_mount, root dentry may be left | |
511 | * not valid, revalidate it here. */ | |
512 | if (parent->i_sb->s_root && (parent->i_sb->s_root->d_inode == parent) && | |
513 | (it->it_op & (IT_OPEN | IT_CREAT))) { | |
514 | rc = ll_inode_revalidate_it(parent->i_sb->s_root, it, | |
515 | MDS_INODELOCK_LOOKUP); | |
516 | if (rc) | |
517 | RETURN(ERR_PTR(rc)); | |
518 | } | |
519 | ||
520 | if (it->it_op == IT_GETATTR) { | |
521 | rc = ll_statahead_enter(parent, &dentry, 0); | |
522 | if (rc == 1) { | |
523 | if (dentry == save) | |
524 | GOTO(out, retval = NULL); | |
525 | GOTO(out, retval = dentry); | |
526 | } | |
527 | } | |
528 | ||
529 | icbd.icbd_childp = &dentry; | |
530 | icbd.icbd_parent = parent; | |
531 | ||
532 | if (it->it_op & IT_CREAT || | |
533 | (it->it_op & IT_OPEN && it->it_create_mode & O_CREAT)) | |
534 | opc = LUSTRE_OPC_CREATE; | |
535 | else | |
536 | opc = LUSTRE_OPC_ANY; | |
537 | ||
538 | op_data = ll_prep_md_op_data(NULL, parent, NULL, dentry->d_name.name, | |
539 | dentry->d_name.len, lookup_flags, opc, | |
540 | NULL); | |
541 | if (IS_ERR(op_data)) | |
542 | RETURN((void *)op_data); | |
543 | ||
544 | /* enforce umask if acl disabled or MDS doesn't support umask */ | |
545 | if (!IS_POSIXACL(parent) || !exp_connect_umask(ll_i2mdexp(parent))) | |
546 | it->it_create_mode &= ~current_umask(); | |
547 | ||
548 | rc = md_intent_lock(ll_i2mdexp(parent), op_data, NULL, 0, it, | |
549 | lookup_flags, &req, ll_md_blocking_ast, 0); | |
550 | ll_finish_md_op_data(op_data); | |
551 | if (rc < 0) | |
552 | GOTO(out, retval = ERR_PTR(rc)); | |
553 | ||
554 | rc = ll_lookup_it_finish(req, it, &icbd); | |
555 | if (rc != 0) { | |
556 | ll_intent_release(it); | |
557 | GOTO(out, retval = ERR_PTR(rc)); | |
558 | } | |
559 | ||
560 | if ((it->it_op & IT_OPEN) && dentry->d_inode && | |
561 | !S_ISREG(dentry->d_inode->i_mode) && | |
562 | !S_ISDIR(dentry->d_inode->i_mode)) { | |
563 | ll_release_openhandle(dentry, it); | |
564 | } | |
565 | ll_lookup_finish_locks(it, dentry); | |
566 | ||
567 | if (dentry == save) | |
568 | GOTO(out, retval = NULL); | |
569 | else | |
570 | GOTO(out, retval = dentry); | |
571 | out: | |
572 | if (req) | |
573 | ptlrpc_req_finished(req); | |
574 | if (it->it_op == IT_GETATTR && (retval == NULL || retval == dentry)) | |
575 | ll_statahead_mark(parent, dentry); | |
576 | return retval; | |
577 | } | |
578 | ||
579 | static struct dentry *ll_lookup_nd(struct inode *parent, struct dentry *dentry, | |
580 | unsigned int flags) | |
581 | { | |
582 | struct lookup_intent *itp, it = { .it_op = IT_GETATTR }; | |
583 | struct dentry *de; | |
584 | ||
585 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p),flags=%u\n", | |
586 | dentry->d_name.len, dentry->d_name.name, parent->i_ino, | |
587 | parent->i_generation, parent, flags); | |
588 | ||
589 | /* Optimize away (CREATE && !OPEN). Let .create handle the race. */ | |
590 | if ((flags & LOOKUP_CREATE ) && !(flags & LOOKUP_OPEN)) { | |
591 | ll_dops_init(dentry, 1, 1); | |
592 | __d_lustre_invalidate(dentry); | |
593 | d_add(dentry, NULL); | |
594 | return NULL; | |
595 | } | |
596 | ||
597 | if (flags & (LOOKUP_PARENT|LOOKUP_OPEN|LOOKUP_CREATE)) | |
598 | itp = NULL; | |
599 | else | |
600 | itp = ⁢ | |
601 | de = ll_lookup_it(parent, dentry, itp, 0); | |
602 | ||
603 | if (itp != NULL) | |
604 | ll_intent_release(itp); | |
605 | ||
606 | return de; | |
607 | } | |
608 | ||
609 | /* | |
610 | * For cached negative dentry and new dentry, handle lookup/create/open | |
611 | * together. | |
612 | */ | |
613 | static int ll_atomic_open(struct inode *dir, struct dentry *dentry, | |
614 | struct file *file, unsigned open_flags, | |
615 | umode_t mode, int *opened) | |
616 | { | |
617 | struct lookup_intent *it; | |
618 | struct dentry *de; | |
619 | long long lookup_flags = LOOKUP_OPEN; | |
620 | int rc = 0; | |
621 | ENTRY; | |
622 | ||
623 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p),file %p," | |
624 | "open_flags %x,mode %x opened %d\n", | |
625 | dentry->d_name.len, dentry->d_name.name, dir->i_ino, | |
626 | dir->i_generation, dir, file, open_flags, mode, *opened); | |
627 | ||
628 | OBD_ALLOC(it, sizeof(*it)); | |
629 | if (!it) | |
630 | RETURN(-ENOMEM); | |
631 | ||
632 | it->it_op = IT_OPEN; | |
633 | if (mode) { | |
634 | it->it_op |= IT_CREAT; | |
635 | lookup_flags |= LOOKUP_CREATE; | |
636 | } | |
637 | it->it_create_mode = (mode & S_IALLUGO) | S_IFREG; | |
638 | it->it_flags = (open_flags & ~O_ACCMODE) | OPEN_FMODE(open_flags); | |
639 | ||
640 | /* Dentry added to dcache tree in ll_lookup_it */ | |
641 | de = ll_lookup_it(dir, dentry, it, lookup_flags); | |
642 | if (IS_ERR(de)) | |
643 | rc = PTR_ERR(de); | |
644 | else if (de != NULL) | |
645 | dentry = de; | |
646 | ||
647 | if (!rc) { | |
648 | if (it_disposition(it, DISP_OPEN_CREATE)) { | |
649 | /* Dentry instantiated in ll_create_it. */ | |
650 | rc = ll_create_it(dir, dentry, mode, it); | |
651 | if (rc) { | |
652 | /* We dget in ll_splice_alias. */ | |
653 | if (de != NULL) | |
654 | dput(de); | |
655 | goto out_release; | |
656 | } | |
657 | ||
658 | *opened |= FILE_CREATED; | |
659 | } | |
660 | if (dentry->d_inode && it_disposition(it, DISP_OPEN_OPEN)) { | |
661 | /* Open dentry. */ | |
662 | if (S_ISFIFO(dentry->d_inode->i_mode)) { | |
663 | /* We cannot call open here as it would | |
664 | * deadlock. | |
665 | */ | |
666 | if (it_disposition(it, DISP_ENQ_OPEN_REF)) | |
667 | ptlrpc_req_finished( | |
668 | (struct ptlrpc_request *) | |
669 | it->d.lustre.it_data); | |
670 | rc = finish_no_open(file, de); | |
671 | } else { | |
672 | file->private_data = it; | |
673 | rc = finish_open(file, dentry, NULL, opened); | |
674 | /* We dget in ll_splice_alias. finish_open takes | |
675 | * care of dget for fd open. | |
676 | */ | |
677 | if (de != NULL) | |
678 | dput(de); | |
679 | } | |
680 | } else { | |
681 | rc = finish_no_open(file, de); | |
682 | } | |
683 | } | |
684 | ||
685 | out_release: | |
686 | ll_intent_release(it); | |
687 | OBD_FREE(it, sizeof(*it)); | |
688 | ||
689 | RETURN(rc); | |
690 | } | |
691 | ||
692 | ||
693 | /* We depend on "mode" being set with the proper file type/umask by now */ | |
694 | static struct inode *ll_create_node(struct inode *dir, const char *name, | |
695 | int namelen, const void *data, int datalen, | |
696 | int mode, __u64 extra, | |
697 | struct lookup_intent *it) | |
698 | { | |
699 | struct inode *inode = NULL; | |
700 | struct ptlrpc_request *request = NULL; | |
701 | struct ll_sb_info *sbi = ll_i2sbi(dir); | |
702 | int rc; | |
703 | ENTRY; | |
704 | ||
705 | LASSERT(it && it->d.lustre.it_disposition); | |
706 | ||
707 | LASSERT(it_disposition(it, DISP_ENQ_CREATE_REF)); | |
708 | request = it->d.lustre.it_data; | |
709 | it_clear_disposition(it, DISP_ENQ_CREATE_REF); | |
710 | rc = ll_prep_inode(&inode, request, dir->i_sb, it); | |
711 | if (rc) | |
712 | GOTO(out, inode = ERR_PTR(rc)); | |
713 | ||
714 | LASSERT(ll_d_hlist_empty(&inode->i_dentry)); | |
715 | ||
716 | /* We asked for a lock on the directory, but were granted a | |
717 | * lock on the inode. Since we finally have an inode pointer, | |
718 | * stuff it in the lock. */ | |
719 | CDEBUG(D_DLMTRACE, "setting l_ast_data to inode %p (%lu/%u)\n", | |
720 | inode, inode->i_ino, inode->i_generation); | |
721 | ll_set_lock_data(sbi->ll_md_exp, inode, it, NULL); | |
722 | EXIT; | |
723 | out: | |
724 | ptlrpc_req_finished(request); | |
725 | return inode; | |
726 | } | |
727 | ||
728 | /* | |
729 | * By the time this is called, we already have created the directory cache | |
730 | * entry for the new file, but it is so far negative - it has no inode. | |
731 | * | |
732 | * We defer creating the OBD object(s) until open, to keep the intent and | |
733 | * non-intent code paths similar, and also because we do not have the MDS | |
734 | * inode number before calling ll_create_node() (which is needed for LOV), | |
735 | * so we would need to do yet another RPC to the MDS to store the LOV EA | |
736 | * data on the MDS. If needed, we would pass the PACKED lmm as data and | |
737 | * lmm_size in datalen (the MDS still has code which will handle that). | |
738 | * | |
739 | * If the create succeeds, we fill in the inode information | |
740 | * with d_instantiate(). | |
741 | */ | |
742 | static int ll_create_it(struct inode *dir, struct dentry *dentry, int mode, | |
743 | struct lookup_intent *it) | |
744 | { | |
745 | struct inode *inode; | |
746 | int rc = 0; | |
747 | ENTRY; | |
748 | ||
749 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p),intent=%s\n", | |
750 | dentry->d_name.len, dentry->d_name.name, dir->i_ino, | |
751 | dir->i_generation, dir, LL_IT2STR(it)); | |
752 | ||
753 | rc = it_open_error(DISP_OPEN_CREATE, it); | |
754 | if (rc) | |
755 | RETURN(rc); | |
756 | ||
757 | inode = ll_create_node(dir, dentry->d_name.name, dentry->d_name.len, | |
758 | NULL, 0, mode, 0, it); | |
759 | if (IS_ERR(inode)) | |
760 | RETURN(PTR_ERR(inode)); | |
761 | ||
762 | if (filename_is_volatile(dentry->d_name.name, dentry->d_name.len, NULL)) | |
763 | ll_i2info(inode)->lli_volatile = true; | |
764 | ||
765 | d_instantiate(dentry, inode); | |
766 | RETURN(0); | |
767 | } | |
768 | ||
769 | static void ll_update_times(struct ptlrpc_request *request, | |
770 | struct inode *inode) | |
771 | { | |
772 | struct mdt_body *body = req_capsule_server_get(&request->rq_pill, | |
773 | &RMF_MDT_BODY); | |
774 | ||
775 | LASSERT(body); | |
776 | if (body->valid & OBD_MD_FLMTIME && | |
777 | body->mtime > LTIME_S(inode->i_mtime)) { | |
778 | CDEBUG(D_INODE, "setting ino %lu mtime from %lu to "LPU64"\n", | |
779 | inode->i_ino, LTIME_S(inode->i_mtime), body->mtime); | |
780 | LTIME_S(inode->i_mtime) = body->mtime; | |
781 | } | |
782 | if (body->valid & OBD_MD_FLCTIME && | |
783 | body->ctime > LTIME_S(inode->i_ctime)) | |
784 | LTIME_S(inode->i_ctime) = body->ctime; | |
785 | } | |
786 | ||
787 | static int ll_new_node(struct inode *dir, struct qstr *name, | |
788 | const char *tgt, int mode, int rdev, | |
789 | struct dentry *dchild, __u32 opc) | |
790 | { | |
791 | struct ptlrpc_request *request = NULL; | |
792 | struct md_op_data *op_data; | |
793 | struct inode *inode = NULL; | |
794 | struct ll_sb_info *sbi = ll_i2sbi(dir); | |
795 | int tgt_len = 0; | |
796 | int err; | |
797 | ||
798 | ENTRY; | |
799 | if (unlikely(tgt != NULL)) | |
800 | tgt_len = strlen(tgt) + 1; | |
801 | ||
802 | op_data = ll_prep_md_op_data(NULL, dir, NULL, name->name, | |
803 | name->len, 0, opc, NULL); | |
804 | if (IS_ERR(op_data)) | |
805 | GOTO(err_exit, err = PTR_ERR(op_data)); | |
806 | ||
807 | err = md_create(sbi->ll_md_exp, op_data, tgt, tgt_len, mode, | |
808 | current_fsuid(), current_fsgid(), | |
809 | cfs_curproc_cap_pack(), rdev, &request); | |
810 | ll_finish_md_op_data(op_data); | |
811 | if (err) | |
812 | GOTO(err_exit, err); | |
813 | ||
814 | ll_update_times(request, dir); | |
815 | ||
816 | if (dchild) { | |
817 | err = ll_prep_inode(&inode, request, dchild->d_sb, NULL); | |
818 | if (err) | |
819 | GOTO(err_exit, err); | |
820 | ||
821 | d_instantiate(dchild, inode); | |
822 | } | |
823 | EXIT; | |
824 | err_exit: | |
825 | ptlrpc_req_finished(request); | |
826 | ||
827 | return err; | |
828 | } | |
829 | ||
830 | static int ll_mknod_generic(struct inode *dir, struct qstr *name, int mode, | |
831 | unsigned rdev, struct dentry *dchild) | |
832 | { | |
833 | int err; | |
834 | ENTRY; | |
835 | ||
836 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p) mode %o dev %x\n", | |
837 | name->len, name->name, dir->i_ino, dir->i_generation, dir, | |
838 | mode, rdev); | |
839 | ||
840 | if (!IS_POSIXACL(dir) || !exp_connect_umask(ll_i2mdexp(dir))) | |
841 | mode &= ~current_umask(); | |
842 | ||
843 | switch (mode & S_IFMT) { | |
844 | case 0: | |
845 | mode |= S_IFREG; /* for mode = 0 case, fallthrough */ | |
846 | case S_IFREG: | |
847 | case S_IFCHR: | |
848 | case S_IFBLK: | |
849 | case S_IFIFO: | |
850 | case S_IFSOCK: | |
851 | err = ll_new_node(dir, name, NULL, mode, rdev, dchild, | |
852 | LUSTRE_OPC_MKNOD); | |
853 | break; | |
854 | case S_IFDIR: | |
855 | err = -EPERM; | |
856 | break; | |
857 | default: | |
858 | err = -EINVAL; | |
859 | } | |
860 | ||
861 | if (!err) | |
862 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_MKNOD, 1); | |
863 | ||
864 | RETURN(err); | |
865 | } | |
866 | ||
867 | /* | |
868 | * Plain create. Intent create is handled in atomic_open. | |
869 | */ | |
870 | static int ll_create_nd(struct inode *dir, struct dentry *dentry, | |
871 | umode_t mode, bool want_excl) | |
872 | { | |
873 | int rc; | |
874 | ||
875 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p)," | |
876 | "flags=%u, excl=%d\n", | |
877 | dentry->d_name.len, dentry->d_name.name, dir->i_ino, | |
878 | dir->i_generation, dir, mode, want_excl); | |
879 | ||
880 | rc = ll_mknod_generic(dir, &dentry->d_name, mode, 0, dentry); | |
881 | ||
882 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_CREATE, 1); | |
883 | ||
884 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s, unhashed %d\n", | |
885 | dentry->d_name.len, dentry->d_name.name, d_unhashed(dentry)); | |
886 | ||
887 | return rc; | |
888 | } | |
889 | ||
890 | static int ll_symlink_generic(struct inode *dir, struct qstr *name, | |
891 | const char *tgt, struct dentry *dchild) | |
892 | { | |
893 | int err; | |
894 | ENTRY; | |
895 | ||
896 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p),target=%.*s\n", | |
897 | name->len, name->name, dir->i_ino, dir->i_generation, | |
898 | dir, 3000, tgt); | |
899 | ||
900 | err = ll_new_node(dir, name, (char *)tgt, S_IFLNK | S_IRWXUGO, | |
901 | 0, dchild, LUSTRE_OPC_SYMLINK); | |
902 | ||
903 | if (!err) | |
904 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_SYMLINK, 1); | |
905 | ||
906 | RETURN(err); | |
907 | } | |
908 | ||
909 | static int ll_link_generic(struct inode *src, struct inode *dir, | |
910 | struct qstr *name, struct dentry *dchild) | |
911 | { | |
912 | struct ll_sb_info *sbi = ll_i2sbi(dir); | |
913 | struct ptlrpc_request *request = NULL; | |
914 | struct md_op_data *op_data; | |
915 | int err; | |
916 | ||
917 | ENTRY; | |
918 | CDEBUG(D_VFSTRACE, | |
919 | "VFS Op: inode=%lu/%u(%p), dir=%lu/%u(%p), target=%.*s\n", | |
920 | src->i_ino, src->i_generation, src, dir->i_ino, | |
921 | dir->i_generation, dir, name->len, name->name); | |
922 | ||
923 | op_data = ll_prep_md_op_data(NULL, src, dir, name->name, name->len, | |
924 | 0, LUSTRE_OPC_ANY, NULL); | |
925 | if (IS_ERR(op_data)) | |
926 | RETURN(PTR_ERR(op_data)); | |
927 | ||
928 | err = md_link(sbi->ll_md_exp, op_data, &request); | |
929 | ll_finish_md_op_data(op_data); | |
930 | if (err) | |
931 | GOTO(out, err); | |
932 | ||
933 | ll_update_times(request, dir); | |
934 | ll_stats_ops_tally(sbi, LPROC_LL_LINK, 1); | |
935 | EXIT; | |
936 | out: | |
937 | ptlrpc_req_finished(request); | |
938 | RETURN(err); | |
939 | } | |
940 | ||
941 | static int ll_mkdir_generic(struct inode *dir, struct qstr *name, | |
942 | int mode, struct dentry *dchild) | |
943 | ||
944 | { | |
945 | int err; | |
946 | ENTRY; | |
947 | ||
948 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p)\n", | |
949 | name->len, name->name, dir->i_ino, dir->i_generation, dir); | |
950 | ||
951 | if (!IS_POSIXACL(dir) || !exp_connect_umask(ll_i2mdexp(dir))) | |
952 | mode &= ~current_umask(); | |
953 | mode = (mode & (S_IRWXUGO|S_ISVTX)) | S_IFDIR; | |
954 | err = ll_new_node(dir, name, NULL, mode, 0, dchild, LUSTRE_OPC_MKDIR); | |
955 | ||
956 | if (!err) | |
957 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_MKDIR, 1); | |
958 | ||
959 | RETURN(err); | |
960 | } | |
961 | ||
962 | /* Try to find the child dentry by its name. | |
963 | If found, put the result fid into @fid. */ | |
964 | static void ll_get_child_fid(struct inode * dir, struct qstr *name, | |
965 | struct lu_fid *fid) | |
966 | { | |
967 | struct dentry *parent, *child; | |
968 | ||
969 | parent = ll_d_hlist_entry(dir->i_dentry, struct dentry, d_alias); | |
970 | child = d_lookup(parent, name); | |
971 | if (child) { | |
972 | if (child->d_inode) | |
973 | *fid = *ll_inode2fid(child->d_inode); | |
974 | dput(child); | |
975 | } | |
976 | } | |
977 | ||
978 | static int ll_rmdir_generic(struct inode *dir, struct dentry *dparent, | |
979 | struct dentry *dchild, struct qstr *name) | |
980 | { | |
981 | struct ptlrpc_request *request = NULL; | |
982 | struct md_op_data *op_data; | |
983 | int rc; | |
984 | ENTRY; | |
985 | ||
986 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p)\n", | |
987 | name->len, name->name, dir->i_ino, dir->i_generation, dir); | |
988 | ||
989 | if (unlikely(ll_d_mountpoint(dparent, dchild, name))) | |
990 | RETURN(-EBUSY); | |
991 | ||
992 | op_data = ll_prep_md_op_data(NULL, dir, NULL, name->name, name->len, | |
993 | S_IFDIR, LUSTRE_OPC_ANY, NULL); | |
994 | if (IS_ERR(op_data)) | |
995 | RETURN(PTR_ERR(op_data)); | |
996 | ||
997 | ll_get_child_fid(dir, name, &op_data->op_fid3); | |
998 | op_data->op_fid2 = op_data->op_fid3; | |
999 | rc = md_unlink(ll_i2sbi(dir)->ll_md_exp, op_data, &request); | |
1000 | ll_finish_md_op_data(op_data); | |
1001 | if (rc == 0) { | |
1002 | ll_update_times(request, dir); | |
1003 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_RMDIR, 1); | |
1004 | } | |
1005 | ||
1006 | ptlrpc_req_finished(request); | |
1007 | RETURN(rc); | |
1008 | } | |
1009 | ||
1010 | /** | |
1011 | * Remove dir entry | |
1012 | **/ | |
1013 | int ll_rmdir_entry(struct inode *dir, char *name, int namelen) | |
1014 | { | |
1015 | struct ptlrpc_request *request = NULL; | |
1016 | struct md_op_data *op_data; | |
1017 | int rc; | |
1018 | ENTRY; | |
1019 | ||
1020 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p)\n", | |
1021 | namelen, name, dir->i_ino, dir->i_generation, dir); | |
1022 | ||
1023 | op_data = ll_prep_md_op_data(NULL, dir, NULL, name, strlen(name), | |
1024 | S_IFDIR, LUSTRE_OPC_ANY, NULL); | |
1025 | if (IS_ERR(op_data)) | |
1026 | RETURN(PTR_ERR(op_data)); | |
1027 | op_data->op_cli_flags |= CLI_RM_ENTRY; | |
1028 | rc = md_unlink(ll_i2sbi(dir)->ll_md_exp, op_data, &request); | |
1029 | ll_finish_md_op_data(op_data); | |
1030 | if (rc == 0) { | |
1031 | ll_update_times(request, dir); | |
1032 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_RMDIR, 1); | |
1033 | } | |
1034 | ||
1035 | ptlrpc_req_finished(request); | |
1036 | RETURN(rc); | |
1037 | } | |
1038 | ||
1039 | int ll_objects_destroy(struct ptlrpc_request *request, struct inode *dir) | |
1040 | { | |
1041 | struct mdt_body *body; | |
1042 | struct lov_mds_md *eadata; | |
1043 | struct lov_stripe_md *lsm = NULL; | |
1044 | struct obd_trans_info oti = { 0 }; | |
1045 | struct obdo *oa; | |
1046 | struct obd_capa *oc = NULL; | |
1047 | int rc; | |
1048 | ENTRY; | |
1049 | ||
1050 | /* req is swabbed so this is safe */ | |
1051 | body = req_capsule_server_get(&request->rq_pill, &RMF_MDT_BODY); | |
1052 | if (!(body->valid & OBD_MD_FLEASIZE)) | |
1053 | RETURN(0); | |
1054 | ||
1055 | if (body->eadatasize == 0) { | |
1056 | CERROR("OBD_MD_FLEASIZE set but eadatasize zero\n"); | |
1057 | GOTO(out, rc = -EPROTO); | |
1058 | } | |
1059 | ||
1060 | /* The MDS sent back the EA because we unlinked the last reference | |
1061 | * to this file. Use this EA to unlink the objects on the OST. | |
1062 | * It's opaque so we don't swab here; we leave it to obd_unpackmd() to | |
1063 | * check it is complete and sensible. */ | |
1064 | eadata = req_capsule_server_sized_get(&request->rq_pill, &RMF_MDT_MD, | |
1065 | body->eadatasize); | |
1066 | LASSERT(eadata != NULL); | |
1067 | ||
1068 | rc = obd_unpackmd(ll_i2dtexp(dir), &lsm, eadata, body->eadatasize); | |
1069 | if (rc < 0) { | |
1070 | CERROR("obd_unpackmd: %d\n", rc); | |
1071 | GOTO(out, rc); | |
1072 | } | |
1073 | LASSERT(rc >= sizeof(*lsm)); | |
1074 | ||
1075 | OBDO_ALLOC(oa); | |
1076 | if (oa == NULL) | |
1077 | GOTO(out_free_memmd, rc = -ENOMEM); | |
1078 | ||
1079 | oa->o_oi = lsm->lsm_oi; | |
1080 | oa->o_mode = body->mode & S_IFMT; | |
1081 | oa->o_valid = OBD_MD_FLID | OBD_MD_FLTYPE | OBD_MD_FLGROUP; | |
1082 | ||
1083 | if (body->valid & OBD_MD_FLCOOKIE) { | |
1084 | oa->o_valid |= OBD_MD_FLCOOKIE; | |
1085 | oti.oti_logcookies = | |
1086 | req_capsule_server_sized_get(&request->rq_pill, | |
1087 | &RMF_LOGCOOKIES, | |
1088 | sizeof(struct llog_cookie) * | |
1089 | lsm->lsm_stripe_count); | |
1090 | if (oti.oti_logcookies == NULL) { | |
1091 | oa->o_valid &= ~OBD_MD_FLCOOKIE; | |
1092 | body->valid &= ~OBD_MD_FLCOOKIE; | |
1093 | } | |
1094 | } | |
1095 | ||
1096 | if (body->valid & OBD_MD_FLOSSCAPA) { | |
1097 | rc = md_unpack_capa(ll_i2mdexp(dir), request, &RMF_CAPA2, &oc); | |
1098 | if (rc) | |
1099 | GOTO(out_free_memmd, rc); | |
1100 | } | |
1101 | ||
1102 | rc = obd_destroy(NULL, ll_i2dtexp(dir), oa, lsm, &oti, | |
1103 | ll_i2mdexp(dir), oc); | |
1104 | capa_put(oc); | |
1105 | if (rc) | |
1106 | CERROR("obd destroy objid "DOSTID" error %d\n", | |
1107 | POSTID(&lsm->lsm_oi), rc); | |
1108 | out_free_memmd: | |
1109 | obd_free_memmd(ll_i2dtexp(dir), &lsm); | |
1110 | OBDO_FREE(oa); | |
1111 | out: | |
1112 | return rc; | |
1113 | } | |
1114 | ||
1115 | /* ll_unlink_generic() doesn't update the inode with the new link count. | |
1116 | * Instead, ll_ddelete() and ll_d_iput() will update it based upon if there | |
1117 | * is any lock existing. They will recycle dentries and inodes based upon locks | |
1118 | * too. b=20433 */ | |
1119 | static int ll_unlink_generic(struct inode *dir, struct dentry *dparent, | |
1120 | struct dentry *dchild, struct qstr *name) | |
1121 | { | |
1122 | struct ptlrpc_request *request = NULL; | |
1123 | struct md_op_data *op_data; | |
1124 | int rc; | |
1125 | ENTRY; | |
1126 | CDEBUG(D_VFSTRACE, "VFS Op:name=%.*s,dir=%lu/%u(%p)\n", | |
1127 | name->len, name->name, dir->i_ino, dir->i_generation, dir); | |
1128 | ||
1129 | /* | |
1130 | * XXX: unlink bind mountpoint maybe call to here, | |
1131 | * just check it as vfs_unlink does. | |
1132 | */ | |
1133 | if (unlikely(ll_d_mountpoint(dparent, dchild, name))) | |
1134 | RETURN(-EBUSY); | |
1135 | ||
1136 | op_data = ll_prep_md_op_data(NULL, dir, NULL, name->name, | |
1137 | name->len, 0, LUSTRE_OPC_ANY, NULL); | |
1138 | if (IS_ERR(op_data)) | |
1139 | RETURN(PTR_ERR(op_data)); | |
1140 | ||
1141 | ll_get_child_fid(dir, name, &op_data->op_fid3); | |
1142 | op_data->op_fid2 = op_data->op_fid3; | |
1143 | rc = md_unlink(ll_i2sbi(dir)->ll_md_exp, op_data, &request); | |
1144 | ll_finish_md_op_data(op_data); | |
1145 | if (rc) | |
1146 | GOTO(out, rc); | |
1147 | ||
1148 | ll_update_times(request, dir); | |
1149 | ll_stats_ops_tally(ll_i2sbi(dir), LPROC_LL_UNLINK, 1); | |
1150 | ||
1151 | rc = ll_objects_destroy(request, dir); | |
1152 | out: | |
1153 | ptlrpc_req_finished(request); | |
1154 | RETURN(rc); | |
1155 | } | |
1156 | ||
1157 | static int ll_rename_generic(struct inode *src, struct dentry *src_dparent, | |
1158 | struct dentry *src_dchild, struct qstr *src_name, | |
1159 | struct inode *tgt, struct dentry *tgt_dparent, | |
1160 | struct dentry *tgt_dchild, struct qstr *tgt_name) | |
1161 | { | |
1162 | struct ptlrpc_request *request = NULL; | |
1163 | struct ll_sb_info *sbi = ll_i2sbi(src); | |
1164 | struct md_op_data *op_data; | |
1165 | int err; | |
1166 | ENTRY; | |
1167 | CDEBUG(D_VFSTRACE,"VFS Op:oldname=%.*s,src_dir=%lu/%u(%p),newname=%.*s," | |
1168 | "tgt_dir=%lu/%u(%p)\n", src_name->len, src_name->name, | |
1169 | src->i_ino, src->i_generation, src, tgt_name->len, | |
1170 | tgt_name->name, tgt->i_ino, tgt->i_generation, tgt); | |
1171 | ||
1172 | if (unlikely(ll_d_mountpoint(src_dparent, src_dchild, src_name) || | |
1173 | ll_d_mountpoint(tgt_dparent, tgt_dchild, tgt_name))) | |
1174 | RETURN(-EBUSY); | |
1175 | ||
1176 | op_data = ll_prep_md_op_data(NULL, src, tgt, NULL, 0, 0, | |
1177 | LUSTRE_OPC_ANY, NULL); | |
1178 | if (IS_ERR(op_data)) | |
1179 | RETURN(PTR_ERR(op_data)); | |
1180 | ||
1181 | ll_get_child_fid(src, src_name, &op_data->op_fid3); | |
1182 | ll_get_child_fid(tgt, tgt_name, &op_data->op_fid4); | |
1183 | err = md_rename(sbi->ll_md_exp, op_data, | |
1184 | src_name->name, src_name->len, | |
1185 | tgt_name->name, tgt_name->len, &request); | |
1186 | ll_finish_md_op_data(op_data); | |
1187 | if (!err) { | |
1188 | ll_update_times(request, src); | |
1189 | ll_update_times(request, tgt); | |
1190 | ll_stats_ops_tally(sbi, LPROC_LL_RENAME, 1); | |
1191 | err = ll_objects_destroy(request, src); | |
1192 | } | |
1193 | ||
1194 | ptlrpc_req_finished(request); | |
1195 | ||
1196 | RETURN(err); | |
1197 | } | |
1198 | ||
1199 | static int ll_mknod(struct inode *dir, struct dentry *dchild, ll_umode_t mode, | |
1200 | dev_t rdev) | |
1201 | { | |
1202 | return ll_mknod_generic(dir, &dchild->d_name, mode, | |
1203 | old_encode_dev(rdev), dchild); | |
1204 | } | |
1205 | ||
1206 | static int ll_unlink(struct inode * dir, struct dentry *dentry) | |
1207 | { | |
1208 | return ll_unlink_generic(dir, NULL, dentry, &dentry->d_name); | |
1209 | } | |
1210 | ||
1211 | static int ll_mkdir(struct inode *dir, struct dentry *dentry, ll_umode_t mode) | |
1212 | { | |
1213 | return ll_mkdir_generic(dir, &dentry->d_name, mode, dentry); | |
1214 | } | |
1215 | ||
1216 | static int ll_rmdir(struct inode *dir, struct dentry *dentry) | |
1217 | { | |
1218 | return ll_rmdir_generic(dir, NULL, dentry, &dentry->d_name); | |
1219 | } | |
1220 | ||
1221 | static int ll_symlink(struct inode *dir, struct dentry *dentry, | |
1222 | const char *oldname) | |
1223 | { | |
1224 | return ll_symlink_generic(dir, &dentry->d_name, oldname, dentry); | |
1225 | } | |
1226 | ||
1227 | static int ll_link(struct dentry *old_dentry, struct inode *dir, | |
1228 | struct dentry *new_dentry) | |
1229 | { | |
1230 | return ll_link_generic(old_dentry->d_inode, dir, &new_dentry->d_name, | |
1231 | new_dentry); | |
1232 | } | |
1233 | ||
1234 | static int ll_rename(struct inode *old_dir, struct dentry *old_dentry, | |
1235 | struct inode *new_dir, struct dentry *new_dentry) | |
1236 | { | |
1237 | int err; | |
1238 | err = ll_rename_generic(old_dir, NULL, | |
1239 | old_dentry, &old_dentry->d_name, | |
1240 | new_dir, NULL, new_dentry, | |
1241 | &new_dentry->d_name); | |
1242 | if (!err) { | |
1243 | d_move(old_dentry, new_dentry); | |
1244 | } | |
1245 | return err; | |
1246 | } | |
1247 | ||
1248 | struct inode_operations ll_dir_inode_operations = { | |
1249 | .mknod = ll_mknod, | |
1250 | .atomic_open = ll_atomic_open, | |
1251 | .lookup = ll_lookup_nd, | |
1252 | .create = ll_create_nd, | |
1253 | /* We need all these non-raw things for NFSD, to not patch it. */ | |
1254 | .unlink = ll_unlink, | |
1255 | .mkdir = ll_mkdir, | |
1256 | .rmdir = ll_rmdir, | |
1257 | .symlink = ll_symlink, | |
1258 | .link = ll_link, | |
1259 | .rename = ll_rename, | |
1260 | .setattr = ll_setattr, | |
1261 | .getattr = ll_getattr, | |
1262 | .permission = ll_inode_permission, | |
1263 | .setxattr = ll_setxattr, | |
1264 | .getxattr = ll_getxattr, | |
1265 | .listxattr = ll_listxattr, | |
1266 | .removexattr = ll_removexattr, | |
1267 | .get_acl = ll_get_acl, | |
1268 | }; | |
1269 | ||
1270 | struct inode_operations ll_special_inode_operations = { | |
1271 | .setattr = ll_setattr, | |
1272 | .getattr = ll_getattr, | |
1273 | .permission = ll_inode_permission, | |
1274 | .setxattr = ll_setxattr, | |
1275 | .getxattr = ll_getxattr, | |
1276 | .listxattr = ll_listxattr, | |
1277 | .removexattr = ll_removexattr, | |
1278 | .get_acl = ll_get_acl, | |
1279 | }; |