Orangefs: improve the POSIXness of interrupted writes...
[deliverable/linux.git] / fs / orangefs / namei.c
CommitLineData
274dcf55
MM
1/*
2 * (C) 2001 Clemson University and The University of Chicago
3 *
4 * See COPYING in top-level directory.
5 */
6
7/*
8 * Linux VFS namei operations.
9 */
10
11#include "protocol.h"
575e9461 12#include "orangefs-kernel.h"
274dcf55
MM
13
14/*
15 * Get a newly allocated inode to go with a negative dentry.
16 */
8bb8aefd 17static int orangefs_create(struct inode *dir,
274dcf55
MM
18 struct dentry *dentry,
19 umode_t mode,
20 bool exclusive)
21{
8bb8aefd
YL
22 struct orangefs_inode_s *parent = ORANGEFS_I(dir);
23 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
24 struct inode *inode;
25 int ret;
26
5253487e
MM
27 gossip_debug(GOSSIP_NAME_DEBUG, "%s: %s\n",
28 __func__,
29 dentry->d_name.name);
274dcf55 30
8bb8aefd 31 new_op = op_alloc(ORANGEFS_VFS_OP_CREATE);
274dcf55
MM
32 if (!new_op)
33 return -ENOMEM;
34
35 new_op->upcall.req.create.parent_refn = parent->refn;
36
37 fill_default_sys_attrs(new_op->upcall.req.create.attributes,
8bb8aefd 38 ORANGEFS_TYPE_METAFILE, mode);
274dcf55
MM
39
40 strncpy(new_op->upcall.req.create.d_name,
47b4948f 41 dentry->d_name.name, ORANGEFS_NAME_MAX);
274dcf55
MM
42
43 ret = service_operation(new_op, __func__, get_interruptible_flag(dir));
44
45 gossip_debug(GOSSIP_NAME_DEBUG,
5253487e
MM
46 "%s: %s: handle:%pU: fsid:%d: new_op:%p: ret:%d:\n",
47 __func__,
48 dentry->d_name.name,
274dcf55 49 &new_op->downcall.resp.create.refn.khandle,
5253487e
MM
50 new_op->downcall.resp.create.refn.fs_id,
51 new_op,
52 ret);
274dcf55 53
5253487e 54 if (ret < 0)
274dcf55 55 goto out;
274dcf55 56
8bb8aefd 57 inode = orangefs_new_inode(dir->i_sb, dir, S_IFREG | mode, 0,
274dcf55
MM
58 &new_op->downcall.resp.create.refn);
59 if (IS_ERR(inode)) {
5253487e
MM
60 gossip_err("%s: Failed to allocate inode for file :%s:\n",
61 __func__,
62 dentry->d_name.name);
274dcf55
MM
63 ret = PTR_ERR(inode);
64 goto out;
65 }
66
67 gossip_debug(GOSSIP_NAME_DEBUG,
5253487e
MM
68 "%s: Assigned inode :%pU: for file :%s:\n",
69 __func__,
70 get_khandle_from_ino(inode),
71 dentry->d_name.name);
274dcf55
MM
72
73 d_instantiate(dentry, inode);
74 unlock_new_inode(inode);
75
76 gossip_debug(GOSSIP_NAME_DEBUG,
5253487e
MM
77 "%s: dentry instantiated for %s\n",
78 __func__,
274dcf55
MM
79 dentry->d_name.name);
80
81 SetMtimeFlag(parent);
82 dir->i_mtime = dir->i_ctime = current_fs_time(dir->i_sb);
83 mark_inode_dirty_sync(dir);
84 ret = 0;
85out:
86 op_release(new_op);
5253487e
MM
87 gossip_debug(GOSSIP_NAME_DEBUG,
88 "%s: %s: returning %d\n",
89 __func__,
90 dentry->d_name.name,
91 ret);
274dcf55
MM
92 return ret;
93}
94
95/*
96 * Attempt to resolve an object name (dentry->d_name), parent handle, and
97 * fsid into a handle for the object.
98 */
8bb8aefd 99static struct dentry *orangefs_lookup(struct inode *dir, struct dentry *dentry,
274dcf55
MM
100 unsigned int flags)
101{
8bb8aefd
YL
102 struct orangefs_inode_s *parent = ORANGEFS_I(dir);
103 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
104 struct inode *inode;
105 struct dentry *res;
106 int ret = -EINVAL;
107
108 /*
109 * in theory we could skip a lookup here (if the intent is to
110 * create) in order to avoid a potentially failed lookup, but
111 * leaving it in can skip a valid lookup and try to create a file
112 * that already exists (e.g. the vfs already handles checking for
113 * -EEXIST on O_EXCL opens, which is broken if we skip this lookup
114 * in the create path)
115 */
116 gossip_debug(GOSSIP_NAME_DEBUG, "%s called on %s\n",
117 __func__, dentry->d_name.name);
118
47b4948f 119 if (dentry->d_name.len > (ORANGEFS_NAME_MAX - 1))
274dcf55
MM
120 return ERR_PTR(-ENAMETOOLONG);
121
8bb8aefd 122 new_op = op_alloc(ORANGEFS_VFS_OP_LOOKUP);
274dcf55
MM
123 if (!new_op)
124 return ERR_PTR(-ENOMEM);
125
7cec28e9 126 new_op->upcall.req.lookup.sym_follow = ORANGEFS_LOOKUP_LINK_NO_FOLLOW;
274dcf55
MM
127
128 gossip_debug(GOSSIP_NAME_DEBUG, "%s:%s:%d using parent %pU\n",
129 __FILE__,
130 __func__,
131 __LINE__,
132 &parent->refn.khandle);
133 new_op->upcall.req.lookup.parent_refn = parent->refn;
134
135 strncpy(new_op->upcall.req.lookup.d_name, dentry->d_name.name,
47b4948f 136 ORANGEFS_NAME_MAX);
274dcf55
MM
137
138 gossip_debug(GOSSIP_NAME_DEBUG,
6ceaf781 139 "%s: doing lookup on %s under %pU,%d\n",
274dcf55
MM
140 __func__,
141 new_op->upcall.req.lookup.d_name,
142 &new_op->upcall.req.lookup.parent_refn.khandle,
6ceaf781 143 new_op->upcall.req.lookup.parent_refn.fs_id);
274dcf55
MM
144
145 ret = service_operation(new_op, __func__, get_interruptible_flag(dir));
146
147 gossip_debug(GOSSIP_NAME_DEBUG,
148 "Lookup Got %pU, fsid %d (ret=%d)\n",
149 &new_op->downcall.resp.lookup.refn.khandle,
150 new_op->downcall.resp.lookup.refn.fs_id,
151 ret);
152
153 if (ret < 0) {
154 if (ret == -ENOENT) {
155 /*
156 * if no inode was found, add a negative dentry to
157 * dcache anyway; if we don't, we don't hold expected
158 * lookup semantics and we most noticeably break
159 * during directory renames.
160 *
161 * however, if the operation failed or exited, do not
162 * add the dentry (e.g. in the case that a touch is
163 * issued on a file that already exists that was
164 * interrupted during this lookup -- no need to add
165 * another negative dentry for an existing file)
166 */
167
168 gossip_debug(GOSSIP_NAME_DEBUG,
8bb8aefd 169 "orangefs_lookup: Adding *negative* dentry "
274dcf55
MM
170 "%p for %s\n",
171 dentry,
172 dentry->d_name.name);
173
174 d_add(dentry, NULL);
175 res = NULL;
176 goto out;
177 }
178
179 /* must be a non-recoverable error */
180 res = ERR_PTR(ret);
181 goto out;
182 }
183
8bb8aefd 184 inode = orangefs_iget(dir->i_sb, &new_op->downcall.resp.lookup.refn);
274dcf55
MM
185 if (IS_ERR(inode)) {
186 gossip_debug(GOSSIP_NAME_DEBUG,
187 "error %ld from iget\n", PTR_ERR(inode));
188 res = ERR_CAST(inode);
189 goto out;
190 }
191
192 gossip_debug(GOSSIP_NAME_DEBUG,
193 "%s:%s:%d "
194 "Found good inode [%lu] with count [%d]\n",
195 __FILE__,
196 __func__,
197 __LINE__,
198 inode->i_ino,
199 (int)atomic_read(&inode->i_count));
200
201 /* update dentry/inode pair into dcache */
202 res = d_splice_alias(inode, dentry);
203
204 gossip_debug(GOSSIP_NAME_DEBUG,
205 "Lookup success (inode ct = %d)\n",
206 (int)atomic_read(&inode->i_count));
207out:
208 op_release(new_op);
209 return res;
210}
211
212/* return 0 on success; non-zero otherwise */
8bb8aefd 213static int orangefs_unlink(struct inode *dir, struct dentry *dentry)
274dcf55
MM
214{
215 struct inode *inode = dentry->d_inode;
8bb8aefd
YL
216 struct orangefs_inode_s *parent = ORANGEFS_I(dir);
217 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
218 int ret;
219
220 gossip_debug(GOSSIP_NAME_DEBUG,
221 "%s: called on %s\n"
222 " (inode %pU): Parent is %pU | fs_id %d\n",
223 __func__,
224 dentry->d_name.name,
225 get_khandle_from_ino(inode),
226 &parent->refn.khandle,
227 parent->refn.fs_id);
228
8bb8aefd 229 new_op = op_alloc(ORANGEFS_VFS_OP_REMOVE);
274dcf55
MM
230 if (!new_op)
231 return -ENOMEM;
232
233 new_op->upcall.req.remove.parent_refn = parent->refn;
234 strncpy(new_op->upcall.req.remove.d_name, dentry->d_name.name,
47b4948f 235 ORANGEFS_NAME_MAX);
274dcf55 236
8bb8aefd 237 ret = service_operation(new_op, "orangefs_unlink",
274dcf55
MM
238 get_interruptible_flag(inode));
239
5253487e
MM
240 gossip_debug(GOSSIP_NAME_DEBUG,
241 "%s: service_operation returned:%d:\n",
242 __func__,
243 ret);
244
274dcf55
MM
245 op_release(new_op);
246
247 if (!ret) {
248 drop_nlink(inode);
249
250 SetMtimeFlag(parent);
251 dir->i_mtime = dir->i_ctime = current_fs_time(dir->i_sb);
252 mark_inode_dirty_sync(dir);
253 }
254 return ret;
255}
256
8bb8aefd 257static int orangefs_symlink(struct inode *dir,
274dcf55
MM
258 struct dentry *dentry,
259 const char *symname)
260{
8bb8aefd
YL
261 struct orangefs_inode_s *parent = ORANGEFS_I(dir);
262 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
263 struct inode *inode;
264 int mode = 755;
265 int ret;
266
267 gossip_debug(GOSSIP_NAME_DEBUG, "%s: called\n", __func__);
268
269 if (!symname)
270 return -EINVAL;
271
8bb8aefd 272 new_op = op_alloc(ORANGEFS_VFS_OP_SYMLINK);
274dcf55
MM
273 if (!new_op)
274 return -ENOMEM;
275
276 new_op->upcall.req.sym.parent_refn = parent->refn;
277
278 fill_default_sys_attrs(new_op->upcall.req.sym.attributes,
8bb8aefd 279 ORANGEFS_TYPE_SYMLINK,
274dcf55
MM
280 mode);
281
282 strncpy(new_op->upcall.req.sym.entry_name,
283 dentry->d_name.name,
47b4948f
MB
284 ORANGEFS_NAME_MAX);
285 strncpy(new_op->upcall.req.sym.target, symname, ORANGEFS_NAME_MAX);
274dcf55
MM
286
287 ret = service_operation(new_op, __func__, get_interruptible_flag(dir));
288
289 gossip_debug(GOSSIP_NAME_DEBUG,
8bb8aefd 290 "Symlink Got ORANGEFS handle %pU on fsid %d (ret=%d)\n",
274dcf55
MM
291 &new_op->downcall.resp.sym.refn.khandle,
292 new_op->downcall.resp.sym.refn.fs_id, ret);
293
294 if (ret < 0) {
295 gossip_debug(GOSSIP_NAME_DEBUG,
296 "%s: failed with error code %d\n",
297 __func__, ret);
298 goto out;
299 }
300
8bb8aefd 301 inode = orangefs_new_inode(dir->i_sb, dir, S_IFLNK | mode, 0,
274dcf55
MM
302 &new_op->downcall.resp.sym.refn);
303 if (IS_ERR(inode)) {
304 gossip_err
8bb8aefd 305 ("*** Failed to allocate orangefs symlink inode\n");
274dcf55
MM
306 ret = PTR_ERR(inode);
307 goto out;
308 }
309
310 gossip_debug(GOSSIP_NAME_DEBUG,
311 "Assigned symlink inode new number of %pU\n",
312 get_khandle_from_ino(inode));
313
314 d_instantiate(dentry, inode);
315 unlock_new_inode(inode);
316
317 gossip_debug(GOSSIP_NAME_DEBUG,
318 "Inode (Symlink) %pU -> %s\n",
319 get_khandle_from_ino(inode),
320 dentry->d_name.name);
321
322 SetMtimeFlag(parent);
323 dir->i_mtime = dir->i_ctime = current_fs_time(dir->i_sb);
324 mark_inode_dirty_sync(dir);
325 ret = 0;
326out:
327 op_release(new_op);
328 return ret;
329}
330
8bb8aefd 331static int orangefs_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
274dcf55 332{
8bb8aefd
YL
333 struct orangefs_inode_s *parent = ORANGEFS_I(dir);
334 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
335 struct inode *inode;
336 int ret;
337
8bb8aefd 338 new_op = op_alloc(ORANGEFS_VFS_OP_MKDIR);
274dcf55
MM
339 if (!new_op)
340 return -ENOMEM;
341
342 new_op->upcall.req.mkdir.parent_refn = parent->refn;
343
344 fill_default_sys_attrs(new_op->upcall.req.mkdir.attributes,
8bb8aefd 345 ORANGEFS_TYPE_DIRECTORY, mode);
274dcf55
MM
346
347 strncpy(new_op->upcall.req.mkdir.d_name,
47b4948f 348 dentry->d_name.name, ORANGEFS_NAME_MAX);
274dcf55
MM
349
350 ret = service_operation(new_op, __func__, get_interruptible_flag(dir));
351
352 gossip_debug(GOSSIP_NAME_DEBUG,
8bb8aefd 353 "Mkdir Got ORANGEFS handle %pU on fsid %d\n",
274dcf55
MM
354 &new_op->downcall.resp.mkdir.refn.khandle,
355 new_op->downcall.resp.mkdir.refn.fs_id);
356
357 if (ret < 0) {
358 gossip_debug(GOSSIP_NAME_DEBUG,
359 "%s: failed with error code %d\n",
360 __func__, ret);
361 goto out;
362 }
363
8bb8aefd 364 inode = orangefs_new_inode(dir->i_sb, dir, S_IFDIR | mode, 0,
274dcf55
MM
365 &new_op->downcall.resp.mkdir.refn);
366 if (IS_ERR(inode)) {
8bb8aefd 367 gossip_err("*** Failed to allocate orangefs dir inode\n");
274dcf55
MM
368 ret = PTR_ERR(inode);
369 goto out;
370 }
371
372 gossip_debug(GOSSIP_NAME_DEBUG,
373 "Assigned dir inode new number of %pU\n",
374 get_khandle_from_ino(inode));
375
376 d_instantiate(dentry, inode);
377 unlock_new_inode(inode);
378
379 gossip_debug(GOSSIP_NAME_DEBUG,
380 "Inode (Directory) %pU -> %s\n",
381 get_khandle_from_ino(inode),
382 dentry->d_name.name);
383
384 /*
385 * NOTE: we have no good way to keep nlink consistent for directories
386 * across clients; keep constant at 1.
387 */
388 SetMtimeFlag(parent);
389 dir->i_mtime = dir->i_ctime = current_fs_time(dir->i_sb);
390 mark_inode_dirty_sync(dir);
391out:
392 op_release(new_op);
393 return ret;
394}
395
8bb8aefd 396static int orangefs_rename(struct inode *old_dir,
274dcf55
MM
397 struct dentry *old_dentry,
398 struct inode *new_dir,
399 struct dentry *new_dentry)
400{
8bb8aefd 401 struct orangefs_kernel_op_s *new_op;
274dcf55
MM
402 int ret;
403
404 gossip_debug(GOSSIP_NAME_DEBUG,
8bb8aefd 405 "orangefs_rename: called (%s/%s => %s/%s) ct=%d\n",
274dcf55
MM
406 old_dentry->d_parent->d_name.name,
407 old_dentry->d_name.name,
408 new_dentry->d_parent->d_name.name,
409 new_dentry->d_name.name,
410 d_count(new_dentry));
411
8bb8aefd 412 new_op = op_alloc(ORANGEFS_VFS_OP_RENAME);
274dcf55
MM
413 if (!new_op)
414 return -EINVAL;
415
8bb8aefd
YL
416 new_op->upcall.req.rename.old_parent_refn = ORANGEFS_I(old_dir)->refn;
417 new_op->upcall.req.rename.new_parent_refn = ORANGEFS_I(new_dir)->refn;
274dcf55
MM
418
419 strncpy(new_op->upcall.req.rename.d_old_name,
420 old_dentry->d_name.name,
47b4948f 421 ORANGEFS_NAME_MAX);
274dcf55
MM
422 strncpy(new_op->upcall.req.rename.d_new_name,
423 new_dentry->d_name.name,
47b4948f 424 ORANGEFS_NAME_MAX);
274dcf55
MM
425
426 ret = service_operation(new_op,
8bb8aefd 427 "orangefs_rename",
274dcf55
MM
428 get_interruptible_flag(old_dentry->d_inode));
429
430 gossip_debug(GOSSIP_NAME_DEBUG,
8bb8aefd 431 "orangefs_rename: got downcall status %d\n",
274dcf55
MM
432 ret);
433
434 if (new_dentry->d_inode)
435 new_dentry->d_inode->i_ctime = CURRENT_TIME;
436
437 op_release(new_op);
438 return ret;
439}
440
8bb8aefd
YL
441/* ORANGEFS implementation of VFS inode operations for directories */
442struct inode_operations orangefs_dir_inode_operations = {
443 .lookup = orangefs_lookup,
444 .get_acl = orangefs_get_acl,
445 .set_acl = orangefs_set_acl,
446 .create = orangefs_create,
447 .unlink = orangefs_unlink,
448 .symlink = orangefs_symlink,
449 .mkdir = orangefs_mkdir,
450 .rmdir = orangefs_unlink,
451 .rename = orangefs_rename,
452 .setattr = orangefs_setattr,
453 .getattr = orangefs_getattr,
274dcf55
MM
454 .setxattr = generic_setxattr,
455 .getxattr = generic_getxattr,
456 .removexattr = generic_removexattr,
8bb8aefd 457 .listxattr = orangefs_listxattr,
933287da 458 .permission = orangefs_permission,
274dcf55 459};
This page took 0.049948 seconds and 5 git commands to generate.