GFS2: Reduce file fragmentation
[deliverable/linux.git] / fs / gfs2 / inode.c
1 /*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
3 * Copyright (C) 2004-2011 Red Hat, Inc. All rights reserved.
4 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
7 * of the GNU General Public License version 2.
8 */
9
10 #include <linux/slab.h>
11 #include <linux/spinlock.h>
12 #include <linux/completion.h>
13 #include <linux/buffer_head.h>
14 #include <linux/namei.h>
15 #include <linux/mm.h>
16 #include <linux/xattr.h>
17 #include <linux/posix_acl.h>
18 #include <linux/gfs2_ondisk.h>
19 #include <linux/crc32.h>
20 #include <linux/fiemap.h>
21 #include <linux/security.h>
22 #include <asm/uaccess.h>
23
24 #include "gfs2.h"
25 #include "incore.h"
26 #include "acl.h"
27 #include "bmap.h"
28 #include "dir.h"
29 #include "xattr.h"
30 #include "glock.h"
31 #include "inode.h"
32 #include "meta_io.h"
33 #include "quota.h"
34 #include "rgrp.h"
35 #include "trans.h"
36 #include "util.h"
37 #include "super.h"
38 #include "glops.h"
39
/*
 * Lookup key passed as the opaque argument to iget_test() and iget_set()
 * by gfs2_ilookup() and gfs2_iget().
 */
struct gfs2_skip_data {
	u64 no_addr;	/* inode address to match against i_no_addr */
	int skipped;	/* set to 1 by iget_test() when a matching inode
			 * that is being freed was skipped */
	int non_block;	/* non-zero: do not match inodes that are being
			 * freed, mark them as skipped instead */
};
45
46 static int iget_test(struct inode *inode, void *opaque)
47 {
48 struct gfs2_inode *ip = GFS2_I(inode);
49 struct gfs2_skip_data *data = opaque;
50
51 if (ip->i_no_addr == data->no_addr) {
52 if (data->non_block &&
53 inode->i_state & (I_FREEING|I_CLEAR|I_WILL_FREE)) {
54 data->skipped = 1;
55 return 0;
56 }
57 return 1;
58 }
59 return 0;
60 }
61
62 static int iget_set(struct inode *inode, void *opaque)
63 {
64 struct gfs2_inode *ip = GFS2_I(inode);
65 struct gfs2_skip_data *data = opaque;
66
67 if (data->skipped)
68 return -ENOENT;
69 inode->i_ino = (unsigned long)(data->no_addr);
70 ip->i_no_addr = data->no_addr;
71 return 0;
72 }
73
74 struct inode *gfs2_ilookup(struct super_block *sb, u64 no_addr, int non_block)
75 {
76 unsigned long hash = (unsigned long)no_addr;
77 struct gfs2_skip_data data;
78
79 data.no_addr = no_addr;
80 data.skipped = 0;
81 data.non_block = non_block;
82 return ilookup5(sb, hash, iget_test, &data);
83 }
84
85 static struct inode *gfs2_iget(struct super_block *sb, u64 no_addr,
86 int non_block)
87 {
88 struct gfs2_skip_data data;
89 unsigned long hash = (unsigned long)no_addr;
90
91 data.no_addr = no_addr;
92 data.skipped = 0;
93 data.non_block = non_block;
94 return iget5_locked(sb, hash, iget_test, iget_set, &data);
95 }
96
97 /**
98 * gfs2_set_iop - Sets inode operations
99 * @inode: The inode with correct i_mode filled in
100 *
101 * GFS2 lookup code fills in vfs inode contents based on info obtained
102 * from directory entry inside gfs2_inode_lookup().
103 */
104
105 static void gfs2_set_iop(struct inode *inode)
106 {
107 struct gfs2_sbd *sdp = GFS2_SB(inode);
108 umode_t mode = inode->i_mode;
109
110 if (S_ISREG(mode)) {
111 inode->i_op = &gfs2_file_iops;
112 if (gfs2_localflocks(sdp))
113 inode->i_fop = &gfs2_file_fops_nolock;
114 else
115 inode->i_fop = &gfs2_file_fops;
116 } else if (S_ISDIR(mode)) {
117 inode->i_op = &gfs2_dir_iops;
118 if (gfs2_localflocks(sdp))
119 inode->i_fop = &gfs2_dir_fops_nolock;
120 else
121 inode->i_fop = &gfs2_dir_fops;
122 } else if (S_ISLNK(mode)) {
123 inode->i_op = &gfs2_symlink_iops;
124 } else {
125 inode->i_op = &gfs2_file_iops;
126 init_special_inode(inode, inode->i_mode, inode->i_rdev);
127 }
128 }
129
130 /**
131 * gfs2_inode_lookup - Lookup an inode
132 * @sb: The super block
133 * @no_addr: The inode number
134 * @type: The type of the inode
135 * non_block: Can we block on inodes that are being freed?
136 *
137 * Returns: A VFS inode, or an error
138 */
139
140 struct inode *gfs2_inode_lookup(struct super_block *sb, unsigned int type,
141 u64 no_addr, u64 no_formal_ino, int non_block)
142 {
143 struct inode *inode;
144 struct gfs2_inode *ip;
145 struct gfs2_glock *io_gl = NULL;
146 int error;
147
148 inode = gfs2_iget(sb, no_addr, non_block);
149 ip = GFS2_I(inode);
150
151 if (!inode)
152 return ERR_PTR(-ENOBUFS);
153
154 if (inode->i_state & I_NEW) {
155 struct gfs2_sbd *sdp = GFS2_SB(inode);
156 ip->i_no_formal_ino = no_formal_ino;
157
158 error = gfs2_glock_get(sdp, no_addr, &gfs2_inode_glops, CREATE, &ip->i_gl);
159 if (unlikely(error))
160 goto fail;
161 ip->i_gl->gl_object = ip;
162
163 error = gfs2_glock_get(sdp, no_addr, &gfs2_iopen_glops, CREATE, &io_gl);
164 if (unlikely(error))
165 goto fail_put;
166
167 set_bit(GIF_INVALID, &ip->i_flags);
168 error = gfs2_glock_nq_init(io_gl, LM_ST_SHARED, GL_EXACT, &ip->i_iopen_gh);
169 if (unlikely(error))
170 goto fail_iopen;
171
172 ip->i_iopen_gh.gh_gl->gl_object = ip;
173 gfs2_glock_put(io_gl);
174 io_gl = NULL;
175
176 if (type == DT_UNKNOWN) {
177 /* Inode glock must be locked already */
178 error = gfs2_inode_refresh(GFS2_I(inode));
179 if (error)
180 goto fail_refresh;
181 } else {
182 inode->i_mode = DT2IF(type);
183 }
184
185 gfs2_set_iop(inode);
186 unlock_new_inode(inode);
187 }
188
189 return inode;
190
191 fail_refresh:
192 ip->i_iopen_gh.gh_gl->gl_object = NULL;
193 gfs2_glock_dq_uninit(&ip->i_iopen_gh);
194 fail_iopen:
195 if (io_gl)
196 gfs2_glock_put(io_gl);
197 fail_put:
198 ip->i_gl->gl_object = NULL;
199 gfs2_glock_put(ip->i_gl);
200 fail:
201 iget_failed(inode);
202 return ERR_PTR(error);
203 }
204
205 struct inode *gfs2_lookup_by_inum(struct gfs2_sbd *sdp, u64 no_addr,
206 u64 *no_formal_ino, unsigned int blktype)
207 {
208 struct super_block *sb = sdp->sd_vfs;
209 struct gfs2_holder i_gh;
210 struct inode *inode = NULL;
211 int error;
212
213 /* Must not read in block until block type is verified */
214 error = gfs2_glock_nq_num(sdp, no_addr, &gfs2_inode_glops,
215 LM_ST_EXCLUSIVE, GL_SKIP, &i_gh);
216 if (error)
217 return ERR_PTR(error);
218
219 error = gfs2_check_blk_type(sdp, no_addr, blktype);
220 if (error)
221 goto fail;
222
223 inode = gfs2_inode_lookup(sb, DT_UNKNOWN, no_addr, 0, 1);
224 if (IS_ERR(inode))
225 goto fail;
226
227 /* Two extra checks for NFS only */
228 if (no_formal_ino) {
229 error = -ESTALE;
230 if (GFS2_I(inode)->i_no_formal_ino != *no_formal_ino)
231 goto fail_iput;
232
233 error = -EIO;
234 if (GFS2_I(inode)->i_diskflags & GFS2_DIF_SYSTEM)
235 goto fail_iput;
236
237 error = 0;
238 }
239
240 fail:
241 gfs2_glock_dq_uninit(&i_gh);
242 return error ? ERR_PTR(error) : inode;
243 fail_iput:
244 iput(inode);
245 goto fail;
246 }
247
248
249 struct inode *gfs2_lookup_simple(struct inode *dip, const char *name)
250 {
251 struct qstr qstr;
252 struct inode *inode;
253 gfs2_str2qstr(&qstr, name);
254 inode = gfs2_lookupi(dip, &qstr, 1);
255 /* gfs2_lookupi has inconsistent callers: vfs
256 * related routines expect NULL for no entry found,
257 * gfs2_lookup_simple callers expect ENOENT
258 * and do not check for NULL.
259 */
260 if (inode == NULL)
261 return ERR_PTR(-ENOENT);
262 else
263 return inode;
264 }
265
266
267 /**
268 * gfs2_lookupi - Look up a filename in a directory and return its inode
269 * @d_gh: An initialized holder for the directory glock
270 * @name: The name of the inode to look for
271 * @is_root: If 1, ignore the caller's permissions
272 * @i_gh: An uninitialized holder for the new inode glock
273 *
274 * This can be called via the VFS filldir function when NFS is doing
275 * a readdirplus and the inode which its intending to stat isn't
276 * already in cache. In this case we must not take the directory glock
277 * again, since the readdir call will have already taken that lock.
278 *
279 * Returns: errno
280 */
281
282 struct inode *gfs2_lookupi(struct inode *dir, const struct qstr *name,
283 int is_root)
284 {
285 struct super_block *sb = dir->i_sb;
286 struct gfs2_inode *dip = GFS2_I(dir);
287 struct gfs2_holder d_gh;
288 int error = 0;
289 struct inode *inode = NULL;
290 int unlock = 0;
291
292 if (!name->len || name->len > GFS2_FNAMESIZE)
293 return ERR_PTR(-ENAMETOOLONG);
294
295 if ((name->len == 1 && memcmp(name->name, ".", 1) == 0) ||
296 (name->len == 2 && memcmp(name->name, "..", 2) == 0 &&
297 dir == sb->s_root->d_inode)) {
298 igrab(dir);
299 return dir;
300 }
301
302 if (gfs2_glock_is_locked_by_me(dip->i_gl) == NULL) {
303 error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, &d_gh);
304 if (error)
305 return ERR_PTR(error);
306 unlock = 1;
307 }
308
309 if (!is_root) {
310 error = gfs2_permission(dir, MAY_EXEC);
311 if (error)
312 goto out;
313 }
314
315 inode = gfs2_dir_search(dir, name);
316 if (IS_ERR(inode))
317 error = PTR_ERR(inode);
318 out:
319 if (unlock)
320 gfs2_glock_dq_uninit(&d_gh);
321 if (error == -ENOENT)
322 return NULL;
323 return inode ? inode : ERR_PTR(error);
324 }
325
326 /**
327 * create_ok - OK to create a new on-disk inode here?
328 * @dip: Directory in which dinode is to be created
329 * @name: Name of new dinode
330 * @mode:
331 *
332 * Returns: errno
333 */
334
335 static int create_ok(struct gfs2_inode *dip, const struct qstr *name,
336 umode_t mode)
337 {
338 int error;
339
340 error = gfs2_permission(&dip->i_inode, MAY_WRITE | MAY_EXEC);
341 if (error)
342 return error;
343
344 /* Don't create entries in an unlinked directory */
345 if (!dip->i_inode.i_nlink)
346 return -ENOENT;
347
348 error = gfs2_dir_check(&dip->i_inode, name, NULL);
349 switch (error) {
350 case -ENOENT:
351 error = 0;
352 break;
353 case 0:
354 return -EEXIST;
355 default:
356 return error;
357 }
358
359 if (dip->i_entries == (u32)-1)
360 return -EFBIG;
361 if (S_ISDIR(mode) && dip->i_inode.i_nlink == (u32)-1)
362 return -EMLINK;
363
364 return 0;
365 }
366
367 static void munge_mode_uid_gid(struct gfs2_inode *dip, umode_t *mode,
368 unsigned int *uid, unsigned int *gid)
369 {
370 if (GFS2_SB(&dip->i_inode)->sd_args.ar_suiddir &&
371 (dip->i_inode.i_mode & S_ISUID) && dip->i_inode.i_uid) {
372 if (S_ISDIR(*mode))
373 *mode |= S_ISUID;
374 else if (dip->i_inode.i_uid != current_fsuid())
375 *mode &= ~07111;
376 *uid = dip->i_inode.i_uid;
377 } else
378 *uid = current_fsuid();
379
380 if (dip->i_inode.i_mode & S_ISGID) {
381 if (S_ISDIR(*mode))
382 *mode |= S_ISGID;
383 *gid = dip->i_inode.i_gid;
384 } else
385 *gid = current_fsgid();
386 }
387
388 static int alloc_dinode(struct gfs2_inode *dip, u64 *no_addr, u64 *generation)
389 {
390 struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
391 int error;
392 int dblocks = 1;
393
394 error = gfs2_inplace_reserve(dip, RES_DINODE);
395 if (error)
396 goto out;
397
398 error = gfs2_trans_begin(sdp, RES_RG_BIT + RES_STATFS, 0);
399 if (error)
400 goto out_ipreserv;
401
402 error = gfs2_alloc_blocks(dip, no_addr, &dblocks, 1, generation);
403
404 gfs2_trans_end(sdp);
405
406 out_ipreserv:
407 gfs2_inplace_release(dip);
408 out:
409 return error;
410 }
411
412 static void gfs2_init_dir(struct buffer_head *dibh,
413 const struct gfs2_inode *parent)
414 {
415 struct gfs2_dinode *di = (struct gfs2_dinode *)dibh->b_data;
416 struct gfs2_dirent *dent = (struct gfs2_dirent *)(di+1);
417
418 gfs2_qstr2dirent(&gfs2_qdot, GFS2_DIRENT_SIZE(gfs2_qdot.len), dent);
419 dent->de_inum = di->di_num; /* already GFS2 endian */
420 dent->de_type = cpu_to_be16(DT_DIR);
421
422 dent = (struct gfs2_dirent *)((char*)dent + GFS2_DIRENT_SIZE(1));
423 gfs2_qstr2dirent(&gfs2_qdotdot, dibh->b_size - GFS2_DIRENT_SIZE(1) - sizeof(struct gfs2_dinode), dent);
424 gfs2_inum_out(parent, dent);
425 dent->de_type = cpu_to_be16(DT_DIR);
426
427 }
428
/**
 * init_dinode - Fill in a new dinode structure
 * @dip: The directory this inode is being created in
 * @gl: The glock covering the new inode
 * @inum: The inode number
 * @mode: The file permissions
 * @uid: The uid of the new inode
 * @gid: The gid of the new inode
 * @generation: The generation number of the new inode
 * @dev: The device number (if a device node)
 * @symname: The symlink destination (if a symlink)
 * @size: The inode size (ignored for directories)
 * @bhp: The buffer head (returned to caller)
 *
 * Obtains a new metadata buffer for the dinode block, adds it to the
 * current transaction and writes every on-disk field in big-endian form.
 * The buffer is handed back through @bhp.
 */

static void init_dinode(struct gfs2_inode *dip, struct gfs2_glock *gl,
			const struct gfs2_inum_host *inum, umode_t mode,
			unsigned int uid, unsigned int gid,
			const u64 *generation, dev_t dev, const char *symname,
			unsigned size, struct buffer_head **bhp)
{
	struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
	struct gfs2_dinode *di;
	struct buffer_head *dibh;
	struct timespec tv = CURRENT_TIME;

	dibh = gfs2_meta_new(gl, inum->no_addr);
	gfs2_trans_add_bh(gl, dibh, 1);
	gfs2_metatype_set(dibh, GFS2_METATYPE_DI, GFS2_FORMAT_DI);
	gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
	di = (struct gfs2_dinode *)dibh->b_data;

	di->di_num.no_formal_ino = cpu_to_be64(inum->no_formal_ino);
	di->di_num.no_addr = cpu_to_be64(inum->no_addr);
	di->di_mode = cpu_to_be32(mode);
	di->di_uid = cpu_to_be32(uid);
	di->di_gid = cpu_to_be32(gid);
	/* link count starts at zero; link_dinode() sets the real value */
	di->di_nlink = 0;
	di->di_size = cpu_to_be64(size);
	di->di_blocks = cpu_to_be64(1);
	/* all three timestamps share the single time sampled above */
	di->di_atime = di->di_mtime = di->di_ctime = cpu_to_be64(tv.tv_sec);
	di->di_major = cpu_to_be32(MAJOR(dev));
	di->di_minor = cpu_to_be32(MINOR(dev));
	/* both allocation goals start at the dinode's own address */
	di->di_goal_meta = di->di_goal_data = cpu_to_be64(inum->no_addr);
	di->di_generation = cpu_to_be64(*generation);
	di->di_flags = 0;
	di->__pad1 = 0;
	di->di_payload_format = cpu_to_be32(S_ISDIR(mode) ? GFS2_FORMAT_DE : 0);
	di->di_height = 0;
	di->__pad2 = 0;
	di->__pad3 = 0;
	di->di_depth = 0;
	di->di_entries = 0;
	memset(&di->__pad4, 0, sizeof(di->__pad4));
	di->di_eattr = 0;
	di->di_atime_nsec = cpu_to_be32(tv.tv_nsec);
	di->di_mtime_nsec = cpu_to_be32(tv.tv_nsec);
	di->di_ctime_nsec = cpu_to_be32(tv.tv_nsec);
	memset(&di->di_reserved, 0, sizeof(di->di_reserved));

	/* type-specific overrides of the defaults written above */
	switch(mode & S_IFMT) {
	case S_IFREG:
		/* jdata is inherited from the parent or forced by the tunable */
		if ((dip->i_diskflags & GFS2_DIF_INHERIT_JDATA) ||
		    gfs2_tune_get(sdp, gt_new_files_jdata))
			di->di_flags |= cpu_to_be32(GFS2_DIF_JDATA);
		break;
	case S_IFDIR:
		/* pass the inherit flag down; directories are always jdata */
		di->di_flags |= cpu_to_be32(dip->i_diskflags &
					    GFS2_DIF_INHERIT_JDATA);
		di->di_flags |= cpu_to_be32(GFS2_DIF_JDATA);
		/* size is the block minus the dinode header; @size is ignored */
		di->di_size = cpu_to_be64(sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode));
		/* "." and "..", written by gfs2_init_dir() */
		di->di_entries = cpu_to_be32(2);
		gfs2_init_dir(dibh, dip);
		break;
	case S_IFLNK:
		/* the link target is stored right after the dinode header */
		memcpy(dibh->b_data + sizeof(struct gfs2_dinode), symname, size);
		break;
	}

	set_buffer_uptodate(dibh);

	*bhp = dibh;
}
513
514 static int make_dinode(struct gfs2_inode *dip, struct gfs2_glock *gl,
515 umode_t mode, const struct gfs2_inum_host *inum,
516 const u64 *generation, dev_t dev, const char *symname,
517 unsigned int size, struct buffer_head **bhp)
518 {
519 struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
520 unsigned int uid, gid;
521 int error;
522
523 munge_mode_uid_gid(dip, &mode, &uid, &gid);
524 error = gfs2_rindex_update(sdp);
525 if (error)
526 return error;
527
528 error = gfs2_quota_lock(dip, uid, gid);
529 if (error)
530 return error;
531
532 error = gfs2_quota_check(dip, uid, gid);
533 if (error)
534 goto out_quota;
535
536 error = gfs2_trans_begin(sdp, RES_DINODE + RES_QUOTA, 0);
537 if (error)
538 goto out_quota;
539
540 init_dinode(dip, gl, inum, mode, uid, gid, generation, dev, symname, size, bhp);
541 gfs2_quota_change(dip, +1, uid, gid);
542 gfs2_trans_end(sdp);
543
544 out_quota:
545 gfs2_quota_unlock(dip);
546 return error;
547 }
548
/*
 * link_dinode - add the directory entry for a newly created inode
 * @dip: the directory receiving the entry
 * @name: the name of the new entry
 * @ip: the inode being linked in
 *
 * On success this returns 0 WITHOUT ending the transaction it began,
 * without dropping the quota lock on @dip and, when an allocation was
 * required, without releasing the in-place reservation: the success
 * path returns before any of the cleanup labels.  On failure everything
 * acquired here is released before returning.
 *
 * Returns: 0 on success, or a negative errno
 */
static int link_dinode(struct gfs2_inode *dip, const struct qstr *name,
		       struct gfs2_inode *ip)
{
	struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
	int alloc_required;
	struct buffer_head *dibh;
	int error;

	error = gfs2_rindex_update(sdp);
	if (error)
		return error;

	error = gfs2_quota_lock(dip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE);
	if (error)
		goto fail;

	/* negative: error; zero: entry fits; positive: blocks are needed */
	error = alloc_required = gfs2_diradd_alloc_required(&dip->i_inode, name);
	if (alloc_required < 0)
		goto fail_quota_locks;
	if (alloc_required) {
		error = gfs2_quota_check(dip, dip->i_inode.i_uid, dip->i_inode.i_gid);
		if (error)
			goto fail_quota_locks;

		error = gfs2_inplace_reserve(dip, sdp->sd_max_dirres);
		if (error)
			goto fail_quota_locks;

		error = gfs2_trans_begin(sdp, sdp->sd_max_dirres +
					 dip->i_rgd->rd_length +
					 2 * RES_DINODE +
					 RES_STATFS + RES_QUOTA, 0);
		if (error)
			goto fail_ipreserv;
	} else {
		error = gfs2_trans_begin(sdp, RES_LEAF + 2 * RES_DINODE, 0);
		if (error)
			goto fail_quota_locks;
	}

	error = gfs2_dir_add(&dip->i_inode, name, ip);
	if (error)
		goto fail_end_trans;

	error = gfs2_meta_inode_buffer(ip, &dibh);
	if (error)
		goto fail_end_trans;
	/* a new directory starts with two links, anything else with one */
	set_nlink(&ip->i_inode, S_ISDIR(ip->i_inode.i_mode) ? 2 : 1);
	gfs2_trans_add_bh(ip->i_gl, dibh, 1);
	gfs2_dinode_out(ip, dibh->b_data);
	brelse(dibh);
	/* success: transaction, reservation and quota lock stay held */
	return 0;

fail_end_trans:
	gfs2_trans_end(sdp);

fail_ipreserv:
	/* only the alloc_required branch took a reservation */
	if (alloc_required)
		gfs2_inplace_release(dip);

fail_quota_locks:
	gfs2_quota_unlock(dip);

fail:
	return error;
}
615
616 static int gfs2_initxattrs(struct inode *inode, const struct xattr *xattr_array,
617 void *fs_info)
618 {
619 const struct xattr *xattr;
620 int err = 0;
621
622 for (xattr = xattr_array; xattr->name != NULL; xattr++) {
623 err = __gfs2_xattr_set(inode, xattr->name, xattr->value,
624 xattr->value_len, 0,
625 GFS2_EATYPE_SECURITY);
626 if (err < 0)
627 break;
628 }
629 return err;
630 }
631
632 static int gfs2_security_init(struct gfs2_inode *dip, struct gfs2_inode *ip,
633 const struct qstr *qstr)
634 {
635 return security_inode_init_security(&ip->i_inode, &dip->i_inode, qstr,
636 &gfs2_initxattrs, NULL);
637 }
638
639 /**
640 * gfs2_create_inode - Create a new inode
641 * @dir: The parent directory
642 * @dentry: The new dentry
643 * @mode: The permissions on the new inode
644 * @dev: For device nodes, this is the device number
645 * @symname: For symlinks, this is the link destination
646 * @size: The initial size of the inode (ignored for directories)
647 *
648 * Returns: 0 on success, or error code
649 */
650
651 static int gfs2_create_inode(struct inode *dir, struct dentry *dentry,
652 umode_t mode, dev_t dev, const char *symname,
653 unsigned int size, int excl)
654 {
655 const struct qstr *name = &dentry->d_name;
656 struct gfs2_holder ghs[2];
657 struct inode *inode = NULL;
658 struct gfs2_inode *dip = GFS2_I(dir), *ip;
659 struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
660 struct gfs2_inum_host inum = { .no_addr = 0, .no_formal_ino = 0 };
661 int error;
662 u64 generation;
663 struct buffer_head *bh = NULL;
664
665 if (!name->len || name->len > GFS2_FNAMESIZE)
666 return -ENAMETOOLONG;
667
668 /* We need a reservation to allocate the new dinode block. The
669 directory ip temporarily points to the reservation, but this is
670 being done to get a set of contiguous blocks for the new dinode.
671 Since this is a create, we don't have a sizehint yet, so it will
672 have to use the minimum reservation size. */
673 error = gfs2_rs_alloc(dip);
674 if (error)
675 return error;
676
677 error = gfs2_glock_nq_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
678 if (error)
679 goto fail;
680
681 error = create_ok(dip, name, mode);
682 if ((error == -EEXIST) && S_ISREG(mode) && !excl) {
683 inode = gfs2_lookupi(dir, &dentry->d_name, 0);
684 gfs2_glock_dq_uninit(ghs);
685 d_instantiate(dentry, inode);
686 return IS_ERR(inode) ? PTR_ERR(inode) : 0;
687 }
688 if (error)
689 goto fail_gunlock;
690
691 error = alloc_dinode(dip, &inum.no_addr, &generation);
692 if (error)
693 goto fail_gunlock;
694 inum.no_formal_ino = generation;
695
696 error = gfs2_glock_nq_num(sdp, inum.no_addr, &gfs2_inode_glops,
697 LM_ST_EXCLUSIVE, GL_SKIP, ghs + 1);
698 if (error)
699 goto fail_gunlock;
700
701 error = make_dinode(dip, ghs[1].gh_gl, mode, &inum, &generation, dev, symname, size, &bh);
702 if (error)
703 goto fail_gunlock2;
704
705 inode = gfs2_inode_lookup(dir->i_sb, IF2DT(mode), inum.no_addr,
706 inum.no_formal_ino, 0);
707 if (IS_ERR(inode))
708 goto fail_gunlock2;
709
710 ip = GFS2_I(inode);
711 error = gfs2_inode_refresh(ip);
712 if (error)
713 goto fail_gunlock2;
714
715 /* The newly created inode needs a reservation so it can allocate
716 xattrs. At the same time, we want new blocks allocated to the new
717 dinode to be as contiguous as possible. Since we allocated the
718 dinode block under the directory's reservation, we transfer
719 ownership of that reservation to the new inode. The directory
720 doesn't need a reservation unless it needs a new allocation. */
721 ip->i_res = dip->i_res;
722 dip->i_res = NULL;
723
724 error = gfs2_acl_create(dip, inode);
725 if (error)
726 goto fail_gunlock2;
727
728 error = gfs2_security_init(dip, ip, name);
729 if (error)
730 goto fail_gunlock2;
731
732 error = link_dinode(dip, name, ip);
733 if (error)
734 goto fail_gunlock2;
735
736 if (bh)
737 brelse(bh);
738
739 gfs2_trans_end(sdp);
740 /* Check if we reserved space in the rgrp. Function link_dinode may
741 not, depending on whether alloc is required. */
742 if (gfs2_mb_reserved(dip))
743 gfs2_inplace_release(dip);
744 gfs2_quota_unlock(dip);
745 mark_inode_dirty(inode);
746 gfs2_glock_dq_uninit_m(2, ghs);
747 d_instantiate(dentry, inode);
748 return 0;
749
750 fail_gunlock2:
751 gfs2_glock_dq_uninit(ghs + 1);
752 fail_gunlock:
753 gfs2_glock_dq_uninit(ghs);
754 if (inode && !IS_ERR(inode)) {
755 set_bit(GIF_ALLOC_FAILED, &GFS2_I(inode)->i_flags);
756 iput(inode);
757 }
758 fail:
759 gfs2_rs_delete(dip);
760 if (bh)
761 brelse(bh);
762 return error;
763 }
764
765 /**
766 * gfs2_create - Create a file
767 * @dir: The directory in which to create the file
768 * @dentry: The dentry of the new file
769 * @mode: The mode of the new file
770 *
771 * Returns: errno
772 */
773
774 static int gfs2_create(struct inode *dir, struct dentry *dentry,
775 umode_t mode, struct nameidata *nd)
776 {
777 int excl = 0;
778 if (nd && (nd->flags & LOOKUP_EXCL))
779 excl = 1;
780 return gfs2_create_inode(dir, dentry, S_IFREG | mode, 0, NULL, 0, excl);
781 }
782
783 /**
784 * gfs2_lookup - Look up a filename in a directory and return its inode
785 * @dir: The directory inode
786 * @dentry: The dentry of the new inode
787 * @nd: passed from Linux VFS, ignored by us
788 *
789 * Called by the VFS layer. Lock dir and call gfs2_lookupi()
790 *
791 * Returns: errno
792 */
793
794 static struct dentry *gfs2_lookup(struct inode *dir, struct dentry *dentry,
795 struct nameidata *nd)
796 {
797 struct inode *inode = gfs2_lookupi(dir, &dentry->d_name, 0);
798 if (inode && !IS_ERR(inode)) {
799 struct gfs2_glock *gl = GFS2_I(inode)->i_gl;
800 struct gfs2_holder gh;
801 int error;
802 error = gfs2_glock_nq_init(gl, LM_ST_SHARED, LM_FLAG_ANY, &gh);
803 if (error) {
804 iput(inode);
805 return ERR_PTR(error);
806 }
807 gfs2_glock_dq_uninit(&gh);
808 }
809 return d_splice_alias(inode, dentry);
810 }
811
/**
 * gfs2_link - Link to a file
 * @old_dentry: The inode to link
 * @dir: Add link to this directory
 * @dentry: The name of the link
 *
 * Link the inode in "old_dentry" into the directory "dir" with the
 * name in "dentry".
 *
 * Both the directory and the inode glocks are held exclusively for the
 * duration.  The cleanup labels at the end are also the normal exit
 * path: a successful link falls through all of them with error == 0.
 *
 * Returns: errno
 */

static int gfs2_link(struct dentry *old_dentry, struct inode *dir,
		     struct dentry *dentry)
{
	struct gfs2_inode *dip = GFS2_I(dir);
	struct gfs2_sbd *sdp = GFS2_SB(dir);
	struct inode *inode = old_dentry->d_inode;
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_holder ghs[2];
	struct buffer_head *dibh;
	int alloc_required;
	int error;

	/* hard links to directories are refused */
	if (S_ISDIR(inode->i_mode))
		return -EPERM;

	error = gfs2_rs_alloc(dip);
	if (error)
		return error;

	/* ghs[0] is the directory, ghs[1] the inode being linked */
	gfs2_holder_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
	gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + 1);

	error = gfs2_glock_nq(ghs); /* parent */
	if (error)
		goto out_parent;

	error = gfs2_glock_nq(ghs + 1); /* child */
	if (error)
		goto out_child;

	error = -ENOENT;
	if (inode->i_nlink == 0)
		goto out_gunlock;

	error = gfs2_permission(dir, MAY_WRITE | MAY_EXEC);
	if (error)
		goto out_gunlock;

	/* only -ENOENT (name not present) lets the link proceed */
	error = gfs2_dir_check(dir, &dentry->d_name, NULL);
	switch (error) {
	case -ENOENT:
		break;
	case 0:
		error = -EEXIST;
		/* fall through */
	default:
		goto out_gunlock;
	}

	/* each check presets the errno it would fail with */
	error = -EINVAL;
	if (!dip->i_inode.i_nlink)
		goto out_gunlock;
	error = -EFBIG;
	if (dip->i_entries == (u32)-1)
		goto out_gunlock;
	error = -EPERM;
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
		goto out_gunlock;
	error = -EINVAL;
	if (!ip->i_inode.i_nlink)
		goto out_gunlock;
	error = -EMLINK;
	if (ip->i_inode.i_nlink == (u32)-1)
		goto out_gunlock;

	/* negative: error; otherwise whether the new entry needs blocks */
	alloc_required = error = gfs2_diradd_alloc_required(dir, &dentry->d_name);
	if (error < 0)
		goto out_gunlock;
	error = 0;

	if (alloc_required) {
		error = gfs2_quota_lock_check(dip);
		if (error)
			goto out_gunlock;

		error = gfs2_inplace_reserve(dip, sdp->sd_max_dirres);
		if (error)
			goto out_gunlock_q;

		error = gfs2_trans_begin(sdp, sdp->sd_max_dirres +
					 gfs2_rg_blocks(dip) +
					 2 * RES_DINODE + RES_STATFS +
					 RES_QUOTA, 0);
		if (error)
			goto out_ipres;
	} else {
		error = gfs2_trans_begin(sdp, 2 * RES_DINODE + RES_LEAF, 0);
		if (error)
			goto out_ipres;
	}

	error = gfs2_meta_inode_buffer(ip, &dibh);
	if (error)
		goto out_end_trans;

	error = gfs2_dir_add(dir, &dentry->d_name, ip);
	if (error)
		goto out_brelse;

	gfs2_trans_add_bh(ip->i_gl, dibh, 1);
	inc_nlink(&ip->i_inode);
	ip->i_inode.i_ctime = CURRENT_TIME;
	/* extra inode reference for the dentry instantiated below */
	ihold(inode);
	d_instantiate(dentry, inode);
	mark_inode_dirty(inode);

out_brelse:
	brelse(dibh);
out_end_trans:
	gfs2_trans_end(sdp);
out_ipres:
	/* reservation and quota lock exist only in the alloc_required case */
	if (alloc_required)
		gfs2_inplace_release(dip);
out_gunlock_q:
	if (alloc_required)
		gfs2_quota_unlock(dip);
out_gunlock:
	gfs2_glock_dq(ghs + 1);
out_child:
	gfs2_glock_dq(ghs);
out_parent:
	gfs2_holder_uninit(ghs);
	gfs2_holder_uninit(ghs + 1);
	return error;
}
948
949 /*
950 * gfs2_unlink_ok - check to see that a inode is still in a directory
951 * @dip: the directory
952 * @name: the name of the file
953 * @ip: the inode
954 *
955 * Assumes that the lock on (at least) @dip is held.
956 *
957 * Returns: 0 if the parent/child relationship is correct, errno if it isn't
958 */
959
960 static int gfs2_unlink_ok(struct gfs2_inode *dip, const struct qstr *name,
961 const struct gfs2_inode *ip)
962 {
963 int error;
964
965 if (IS_IMMUTABLE(&ip->i_inode) || IS_APPEND(&ip->i_inode))
966 return -EPERM;
967
968 if ((dip->i_inode.i_mode & S_ISVTX) &&
969 dip->i_inode.i_uid != current_fsuid() &&
970 ip->i_inode.i_uid != current_fsuid() && !capable(CAP_FOWNER))
971 return -EPERM;
972
973 if (IS_APPEND(&dip->i_inode))
974 return -EPERM;
975
976 error = gfs2_permission(&dip->i_inode, MAY_WRITE | MAY_EXEC);
977 if (error)
978 return error;
979
980 error = gfs2_dir_check(&dip->i_inode, name, ip);
981 if (error)
982 return error;
983
984 return 0;
985 }
986
987 /**
988 * gfs2_unlink_inode - Removes an inode from its parent dir and unlinks it
989 * @dip: The parent directory
990 * @name: The name of the entry in the parent directory
991 * @bh: The inode buffer for the inode to be removed
992 * @inode: The inode to be removed
993 *
994 * Called with all the locks and in a transaction. This will only be
995 * called for a directory after it has been checked to ensure it is empty.
996 *
997 * Returns: 0 on success, or an error
998 */
999
1000 static int gfs2_unlink_inode(struct gfs2_inode *dip,
1001 const struct dentry *dentry,
1002 struct buffer_head *bh)
1003 {
1004 struct inode *inode = dentry->d_inode;
1005 struct gfs2_inode *ip = GFS2_I(inode);
1006 int error;
1007
1008 error = gfs2_dir_del(dip, dentry);
1009 if (error)
1010 return error;
1011
1012 ip->i_entries = 0;
1013 inode->i_ctime = CURRENT_TIME;
1014 if (S_ISDIR(inode->i_mode))
1015 clear_nlink(inode);
1016 else
1017 drop_nlink(inode);
1018 mark_inode_dirty(inode);
1019 if (inode->i_nlink == 0)
1020 gfs2_unlink_di(inode);
1021 return 0;
1022 }
1023
1024
/**
 * gfs2_unlink - Unlink an inode (this does rmdir as well)
 * @dir: The inode of the directory containing the inode to unlink
 * @dentry: The file itself
 *
 * This routine uses the type of the inode as a flag to figure out
 * whether this is an unlink or an rmdir.
 *
 * Three glocks are taken exclusively, in this order: the parent
 * directory, the inode, and the resource group containing the inode's
 * block.  The labels at the end release them in reverse order and are
 * also the normal exit path.
 *
 * Returns: errno
 */

static int gfs2_unlink(struct inode *dir, struct dentry *dentry)
{
	struct gfs2_inode *dip = GFS2_I(dir);
	struct gfs2_sbd *sdp = GFS2_SB(dir);
	struct inode *inode = dentry->d_inode;
	struct gfs2_inode *ip = GFS2_I(inode);
	struct buffer_head *bh;
	struct gfs2_holder ghs[3];
	struct gfs2_rgrpd *rgd;
	int error;

	error = gfs2_rindex_update(sdp);
	if (error)
		return error;

	/* returned if no resource group is found for the inode below */
	error = -EROFS;

	/* ghs[0]: parent directory, ghs[1]: inode, ghs[2]: resource group */
	gfs2_holder_init(dip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
	gfs2_holder_init(ip->i_gl,  LM_ST_EXCLUSIVE, 0, ghs + 1);

	rgd = gfs2_blk2rgrpd(sdp, ip->i_no_addr, 1);
	if (!rgd)
		goto out_inodes;

	gfs2_holder_init(rgd->rd_gl, LM_ST_EXCLUSIVE, 0, ghs + 2);


	error = gfs2_glock_nq(ghs); /* parent */
	if (error)
		goto out_parent;

	error = gfs2_glock_nq(ghs + 1); /* child */
	if (error)
		goto out_child;

	error = -ENOENT;
	if (inode->i_nlink == 0)
		goto out_rgrp;

	if (S_ISDIR(inode->i_mode)) {
		/* rmdir: more than two entries or links means not empty */
		error = -ENOTEMPTY;
		if (ip->i_entries > 2 || inode->i_nlink > 2)
			goto out_rgrp;
	}

	error = gfs2_glock_nq(ghs + 2); /* rgrp */
	if (error)
		goto out_rgrp;

	error = gfs2_unlink_ok(dip, &dentry->d_name, ip);
	if (error)
		goto out_gunlock;

	error = gfs2_trans_begin(sdp, 2*RES_DINODE + 3*RES_LEAF + RES_RG_BIT, 0);
	if (error)
		goto out_gunlock;

	error = gfs2_meta_inode_buffer(ip, &bh);
	if (error)
		goto out_end_trans;

	error = gfs2_unlink_inode(dip, dentry, bh);
	brelse(bh);

out_end_trans:
	gfs2_trans_end(sdp);
out_gunlock:
	gfs2_glock_dq(ghs + 2);
out_rgrp:
	gfs2_glock_dq(ghs + 1);
out_child:
	gfs2_glock_dq(ghs);
out_parent:
	gfs2_holder_uninit(ghs + 2);
out_inodes:
	/* ghs[2] was never initialised when we arrive here directly */
	gfs2_holder_uninit(ghs + 1);
	gfs2_holder_uninit(ghs);
	return error;
}
1115
1116 /**
1117 * gfs2_symlink - Create a symlink
1118 * @dir: The directory to create the symlink in
1119 * @dentry: The dentry to put the symlink in
1120 * @symname: The thing which the link points to
1121 *
1122 * Returns: errno
1123 */
1124
1125 static int gfs2_symlink(struct inode *dir, struct dentry *dentry,
1126 const char *symname)
1127 {
1128 struct gfs2_sbd *sdp = GFS2_SB(dir);
1129 unsigned int size;
1130
1131 size = strlen(symname);
1132 if (size > sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode) - 1)
1133 return -ENAMETOOLONG;
1134
1135 return gfs2_create_inode(dir, dentry, S_IFLNK | S_IRWXUGO, 0, symname, size, 0);
1136 }
1137
1138 /**
1139 * gfs2_mkdir - Make a directory
1140 * @dir: The parent directory of the new one
1141 * @dentry: The dentry of the new directory
1142 * @mode: The mode of the new directory
1143 *
1144 * Returns: errno
1145 */
1146
1147 static int gfs2_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
1148 {
1149 return gfs2_create_inode(dir, dentry, S_IFDIR | mode, 0, NULL, 0, 0);
1150 }
1151
1152 /**
1153 * gfs2_mknod - Make a special file
1154 * @dir: The directory in which the special file will reside
1155 * @dentry: The dentry of the special file
1156 * @mode: The mode of the special file
1157 * @dev: The device specification of the special file
1158 *
1159 */
1160
1161 static int gfs2_mknod(struct inode *dir, struct dentry *dentry, umode_t mode,
1162 dev_t dev)
1163 {
1164 return gfs2_create_inode(dir, dentry, mode, dev, NULL, 0, 0);
1165 }
1166
1167 /*
1168 * gfs2_ok_to_move - check if it's ok to move a directory to another directory
1169 * @this: move this
1170 * @to: to here
1171 *
1172 * Follow @to back to the root and make sure we don't encounter @this
1173 * Assumes we already hold the rename lock.
1174 *
1175 * Returns: errno
1176 */
1177
1178 static int gfs2_ok_to_move(struct gfs2_inode *this, struct gfs2_inode *to)
1179 {
1180 struct inode *dir = &to->i_inode;
1181 struct super_block *sb = dir->i_sb;
1182 struct inode *tmp;
1183 int error = 0;
1184
1185 igrab(dir);
1186
1187 for (;;) {
1188 if (dir == &this->i_inode) {
1189 error = -EINVAL;
1190 break;
1191 }
1192 if (dir == sb->s_root->d_inode) {
1193 error = 0;
1194 break;
1195 }
1196
1197 tmp = gfs2_lookupi(dir, &gfs2_qdotdot, 1);
1198 if (IS_ERR(tmp)) {
1199 error = PTR_ERR(tmp);
1200 break;
1201 }
1202
1203 iput(dir);
1204 dir = tmp;
1205 }
1206
1207 iput(dir);
1208
1209 return error;
1210 }
1211
1212 /**
1213 * gfs2_rename - Rename a file
1214 * @odir: Parent directory of old file name
1215 * @odentry: The old dentry of the file
1216 * @ndir: Parent directory of new file name
1217 * @ndentry: The new dentry of the file
1218 *
1219 * Returns: errno
1220 */
1221
1222 static int gfs2_rename(struct inode *odir, struct dentry *odentry,
1223 struct inode *ndir, struct dentry *ndentry)
1224 {
1225 struct gfs2_inode *odip = GFS2_I(odir);
1226 struct gfs2_inode *ndip = GFS2_I(ndir);
1227 struct gfs2_inode *ip = GFS2_I(odentry->d_inode);
1228 struct gfs2_inode *nip = NULL;
1229 struct gfs2_sbd *sdp = GFS2_SB(odir);
1230 struct gfs2_holder ghs[5], r_gh = { .gh_gl = NULL, };
1231 struct gfs2_rgrpd *nrgd;
1232 unsigned int num_gh;
1233 int dir_rename = 0;
1234 int alloc_required = 0;
1235 unsigned int x;
1236 int error;
1237
1238 if (ndentry->d_inode) {
1239 nip = GFS2_I(ndentry->d_inode);
1240 if (ip == nip)
1241 return 0;
1242 }
1243
1244 error = gfs2_rindex_update(sdp);
1245 if (error)
1246 return error;
1247
1248 error = gfs2_rs_alloc(ndip);
1249 if (error)
1250 return error;
1251
1252 if (odip != ndip) {
1253 error = gfs2_glock_nq_init(sdp->sd_rename_gl, LM_ST_EXCLUSIVE,
1254 0, &r_gh);
1255 if (error)
1256 goto out;
1257
1258 if (S_ISDIR(ip->i_inode.i_mode)) {
1259 dir_rename = 1;
1260 /* don't move a dirctory into it's subdir */
1261 error = gfs2_ok_to_move(ip, ndip);
1262 if (error)
1263 goto out_gunlock_r;
1264 }
1265 }
1266
1267 num_gh = 1;
1268 gfs2_holder_init(odip->i_gl, LM_ST_EXCLUSIVE, 0, ghs);
1269 if (odip != ndip) {
1270 gfs2_holder_init(ndip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + num_gh);
1271 num_gh++;
1272 }
1273 gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + num_gh);
1274 num_gh++;
1275
1276 if (nip) {
1277 gfs2_holder_init(nip->i_gl, LM_ST_EXCLUSIVE, 0, ghs + num_gh);
1278 num_gh++;
1279 /* grab the resource lock for unlink flag twiddling
1280 * this is the case of the target file already existing
1281 * so we unlink before doing the rename
1282 */
1283 nrgd = gfs2_blk2rgrpd(sdp, nip->i_no_addr, 1);
1284 if (nrgd)
1285 gfs2_holder_init(nrgd->rd_gl, LM_ST_EXCLUSIVE, 0, ghs + num_gh++);
1286 }
1287
1288 for (x = 0; x < num_gh; x++) {
1289 error = gfs2_glock_nq(ghs + x);
1290 if (error)
1291 goto out_gunlock;
1292 }
1293
1294 error = -ENOENT;
1295 if (ip->i_inode.i_nlink == 0)
1296 goto out_gunlock;
1297
1298 /* Check out the old directory */
1299
1300 error = gfs2_unlink_ok(odip, &odentry->d_name, ip);
1301 if (error)
1302 goto out_gunlock;
1303
1304 /* Check out the new directory */
1305
1306 if (nip) {
1307 error = gfs2_unlink_ok(ndip, &ndentry->d_name, nip);
1308 if (error)
1309 goto out_gunlock;
1310
1311 if (nip->i_inode.i_nlink == 0) {
1312 error = -EAGAIN;
1313 goto out_gunlock;
1314 }
1315
1316 if (S_ISDIR(nip->i_inode.i_mode)) {
1317 if (nip->i_entries < 2) {
1318 gfs2_consist_inode(nip);
1319 error = -EIO;
1320 goto out_gunlock;
1321 }
1322 if (nip->i_entries > 2) {
1323 error = -ENOTEMPTY;
1324 goto out_gunlock;
1325 }
1326 }
1327 } else {
1328 error = gfs2_permission(ndir, MAY_WRITE | MAY_EXEC);
1329 if (error)
1330 goto out_gunlock;
1331
1332 error = gfs2_dir_check(ndir, &ndentry->d_name, NULL);
1333 switch (error) {
1334 case -ENOENT:
1335 error = 0;
1336 break;
1337 case 0:
1338 error = -EEXIST;
1339 default:
1340 goto out_gunlock;
1341 };
1342
1343 if (odip != ndip) {
1344 if (!ndip->i_inode.i_nlink) {
1345 error = -ENOENT;
1346 goto out_gunlock;
1347 }
1348 if (ndip->i_entries == (u32)-1) {
1349 error = -EFBIG;
1350 goto out_gunlock;
1351 }
1352 if (S_ISDIR(ip->i_inode.i_mode) &&
1353 ndip->i_inode.i_nlink == (u32)-1) {
1354 error = -EMLINK;
1355 goto out_gunlock;
1356 }
1357 }
1358 }
1359
1360 /* Check out the dir to be renamed */
1361
1362 if (dir_rename) {
1363 error = gfs2_permission(odentry->d_inode, MAY_WRITE);
1364 if (error)
1365 goto out_gunlock;
1366 }
1367
1368 if (nip == NULL)
1369 alloc_required = gfs2_diradd_alloc_required(ndir, &ndentry->d_name);
1370 error = alloc_required;
1371 if (error < 0)
1372 goto out_gunlock;
1373
1374 if (alloc_required) {
1375 error = gfs2_quota_lock_check(ndip);
1376 if (error)
1377 goto out_gunlock;
1378
1379 error = gfs2_inplace_reserve(ndip, sdp->sd_max_dirres);
1380 if (error)
1381 goto out_gunlock_q;
1382
1383 error = gfs2_trans_begin(sdp, sdp->sd_max_dirres +
1384 gfs2_rg_blocks(ndip) +
1385 4 * RES_DINODE + 4 * RES_LEAF +
1386 RES_STATFS + RES_QUOTA + 4, 0);
1387 if (error)
1388 goto out_ipreserv;
1389 } else {
1390 error = gfs2_trans_begin(sdp, 4 * RES_DINODE +
1391 5 * RES_LEAF + 4, 0);
1392 if (error)
1393 goto out_gunlock;
1394 }
1395
1396 /* Remove the target file, if it exists */
1397
1398 if (nip) {
1399 struct buffer_head *bh;
1400 error = gfs2_meta_inode_buffer(nip, &bh);
1401 if (error)
1402 goto out_end_trans;
1403 error = gfs2_unlink_inode(ndip, ndentry, bh);
1404 brelse(bh);
1405 }
1406
1407 if (dir_rename) {
1408 error = gfs2_dir_mvino(ip, &gfs2_qdotdot, ndip, DT_DIR);
1409 if (error)
1410 goto out_end_trans;
1411 } else {
1412 struct buffer_head *dibh;
1413 error = gfs2_meta_inode_buffer(ip, &dibh);
1414 if (error)
1415 goto out_end_trans;
1416 ip->i_inode.i_ctime = CURRENT_TIME;
1417 gfs2_trans_add_bh(ip->i_gl, dibh, 1);
1418 gfs2_dinode_out(ip, dibh->b_data);
1419 brelse(dibh);
1420 }
1421
1422 error = gfs2_dir_del(odip, odentry);
1423 if (error)
1424 goto out_end_trans;
1425
1426 error = gfs2_dir_add(ndir, &ndentry->d_name, ip);
1427 if (error)
1428 goto out_end_trans;
1429
1430 out_end_trans:
1431 gfs2_trans_end(sdp);
1432 out_ipreserv:
1433 if (alloc_required)
1434 gfs2_inplace_release(ndip);
1435 out_gunlock_q:
1436 if (alloc_required)
1437 gfs2_quota_unlock(ndip);
1438 out_gunlock:
1439 while (x--) {
1440 gfs2_glock_dq(ghs + x);
1441 gfs2_holder_uninit(ghs + x);
1442 }
1443 out_gunlock_r:
1444 if (r_gh.gh_gl)
1445 gfs2_glock_dq_uninit(&r_gh);
1446 out:
1447 return error;
1448 }
1449
1450 /**
1451 * gfs2_follow_link - Follow a symbolic link
1452 * @dentry: The dentry of the link
1453 * @nd: Data that we pass to vfs_follow_link()
1454 *
1455 * This can handle symlinks of any size.
1456 *
1457 * Returns: 0 on success or error code
1458 */
1459
1460 static void *gfs2_follow_link(struct dentry *dentry, struct nameidata *nd)
1461 {
1462 struct gfs2_inode *ip = GFS2_I(dentry->d_inode);
1463 struct gfs2_holder i_gh;
1464 struct buffer_head *dibh;
1465 unsigned int size;
1466 char *buf;
1467 int error;
1468
1469 gfs2_holder_init(ip->i_gl, LM_ST_SHARED, 0, &i_gh);
1470 error = gfs2_glock_nq(&i_gh);
1471 if (error) {
1472 gfs2_holder_uninit(&i_gh);
1473 nd_set_link(nd, ERR_PTR(error));
1474 return NULL;
1475 }
1476
1477 size = (unsigned int)i_size_read(&ip->i_inode);
1478 if (size == 0) {
1479 gfs2_consist_inode(ip);
1480 buf = ERR_PTR(-EIO);
1481 goto out;
1482 }
1483
1484 error = gfs2_meta_inode_buffer(ip, &dibh);
1485 if (error) {
1486 buf = ERR_PTR(error);
1487 goto out;
1488 }
1489
1490 buf = kzalloc(size + 1, GFP_NOFS);
1491 if (!buf)
1492 buf = ERR_PTR(-ENOMEM);
1493 else
1494 memcpy(buf, dibh->b_data + sizeof(struct gfs2_dinode), size);
1495 brelse(dibh);
1496 out:
1497 gfs2_glock_dq_uninit(&i_gh);
1498 nd_set_link(nd, buf);
1499 return NULL;
1500 }
1501
/**
 * gfs2_put_link - Release the link buffer stored in the nameidata
 * @dentry: The dentry of the link (unused)
 * @nd: The nameidata holding the link pointer
 * @p: Unused
 *
 * Frees the pointer obtained from nd_get_link() unless it is an
 * ERR_PTR() value.
 */
static void gfs2_put_link(struct dentry *dentry, struct nameidata *nd, void *p)
{
	char *link = nd_get_link(nd);

	if (IS_ERR(link))
		return;

	kfree(link);
}
1508
1509 /**
1510 * gfs2_permission -
1511 * @inode: The inode
1512 * @mask: The mask to be tested
1513 * @flags: Indicates whether this is an RCU path walk or not
1514 *
1515 * This may be called from the VFS directly, or from within GFS2 with the
1516 * inode locked, so we look to see if the glock is already locked and only
1517 * lock the glock if its not already been done.
1518 *
1519 * Returns: errno
1520 */
1521
1522 int gfs2_permission(struct inode *inode, int mask)
1523 {
1524 struct gfs2_inode *ip;
1525 struct gfs2_holder i_gh;
1526 int error;
1527 int unlock = 0;
1528
1529
1530 ip = GFS2_I(inode);
1531 if (gfs2_glock_is_locked_by_me(ip->i_gl) == NULL) {
1532 if (mask & MAY_NOT_BLOCK)
1533 return -ECHILD;
1534 error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &i_gh);
1535 if (error)
1536 return error;
1537 unlock = 1;
1538 }
1539
1540 if ((mask & MAY_WRITE) && IS_IMMUTABLE(inode))
1541 error = -EACCES;
1542 else
1543 error = generic_permission(inode, mask);
1544 if (unlock)
1545 gfs2_glock_dq_uninit(&i_gh);
1546
1547 return error;
1548 }
1549
/*
 * __gfs2_setattr_simple - copy attributes into the inode and dirty it
 * @inode: The inode to update
 * @attr: The attributes to apply
 *
 * Performs no transaction handling of its own.
 *
 * Returns: always 0
 */
static int __gfs2_setattr_simple(struct inode *inode, struct iattr *attr)
{
	int error = 0;

	setattr_copy(inode, attr);
	mark_inode_dirty(inode);

	return error;
}
1556
1557 /**
1558 * gfs2_setattr_simple -
1559 * @ip:
1560 * @attr:
1561 *
1562 * Returns: errno
1563 */
1564
1565 int gfs2_setattr_simple(struct inode *inode, struct iattr *attr)
1566 {
1567 int error;
1568
1569 if (current->journal_info)
1570 return __gfs2_setattr_simple(inode, attr);
1571
1572 error = gfs2_trans_begin(GFS2_SB(inode), RES_DINODE, 0);
1573 if (error)
1574 return error;
1575
1576 error = __gfs2_setattr_simple(inode, attr);
1577 gfs2_trans_end(GFS2_SB(inode));
1578 return error;
1579 }
1580
1581 static int setattr_chown(struct inode *inode, struct iattr *attr)
1582 {
1583 struct gfs2_inode *ip = GFS2_I(inode);
1584 struct gfs2_sbd *sdp = GFS2_SB(inode);
1585 u32 ouid, ogid, nuid, ngid;
1586 int error;
1587
1588 ouid = inode->i_uid;
1589 ogid = inode->i_gid;
1590 nuid = attr->ia_uid;
1591 ngid = attr->ia_gid;
1592
1593 if (!(attr->ia_valid & ATTR_UID) || ouid == nuid)
1594 ouid = nuid = NO_QUOTA_CHANGE;
1595 if (!(attr->ia_valid & ATTR_GID) || ogid == ngid)
1596 ogid = ngid = NO_QUOTA_CHANGE;
1597
1598 error = gfs2_quota_lock(ip, nuid, ngid);
1599 if (error)
1600 return error;
1601
1602 if (ouid != NO_QUOTA_CHANGE || ogid != NO_QUOTA_CHANGE) {
1603 error = gfs2_quota_check(ip, nuid, ngid);
1604 if (error)
1605 goto out_gunlock_q;
1606 }
1607
1608 error = gfs2_trans_begin(sdp, RES_DINODE + 2 * RES_QUOTA, 0);
1609 if (error)
1610 goto out_gunlock_q;
1611
1612 error = gfs2_setattr_simple(inode, attr);
1613 if (error)
1614 goto out_end_trans;
1615
1616 if (ouid != NO_QUOTA_CHANGE || ogid != NO_QUOTA_CHANGE) {
1617 u64 blocks = gfs2_get_inode_blocks(&ip->i_inode);
1618 gfs2_quota_change(ip, -blocks, ouid, ogid);
1619 gfs2_quota_change(ip, blocks, nuid, ngid);
1620 }
1621
1622 out_end_trans:
1623 gfs2_trans_end(sdp);
1624 out_gunlock_q:
1625 gfs2_quota_unlock(ip);
1626 return error;
1627 }
1628
1629 /**
1630 * gfs2_setattr - Change attributes on an inode
1631 * @dentry: The dentry which is changing
1632 * @attr: The structure describing the change
1633 *
1634 * The VFS layer wants to change one or more of an inodes attributes. Write
1635 * that change out to disk.
1636 *
1637 * Returns: errno
1638 */
1639
1640 static int gfs2_setattr(struct dentry *dentry, struct iattr *attr)
1641 {
1642 struct inode *inode = dentry->d_inode;
1643 struct gfs2_inode *ip = GFS2_I(inode);
1644 struct gfs2_holder i_gh;
1645 int error;
1646
1647 error = gfs2_rs_alloc(ip);
1648 if (error)
1649 return error;
1650
1651 error = gfs2_glock_nq_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &i_gh);
1652 if (error)
1653 return error;
1654
1655 error = -EPERM;
1656 if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
1657 goto out;
1658
1659 error = inode_change_ok(inode, attr);
1660 if (error)
1661 goto out;
1662
1663 if (attr->ia_valid & ATTR_SIZE)
1664 error = gfs2_setattr_size(inode, attr->ia_size);
1665 else if (attr->ia_valid & (ATTR_UID | ATTR_GID))
1666 error = setattr_chown(inode, attr);
1667 else if ((attr->ia_valid & ATTR_MODE) && IS_POSIXACL(inode))
1668 error = gfs2_acl_chmod(ip, attr);
1669 else
1670 error = gfs2_setattr_simple(inode, attr);
1671
1672 out:
1673 if (!error)
1674 mark_inode_dirty(inode);
1675 gfs2_glock_dq_uninit(&i_gh);
1676 return error;
1677 }
1678
1679 /**
1680 * gfs2_getattr - Read out an inode's attributes
1681 * @mnt: The vfsmount the inode is being accessed from
1682 * @dentry: The dentry to stat
1683 * @stat: The inode's stats
1684 *
1685 * This may be called from the VFS directly, or from within GFS2 with the
1686 * inode locked, so we look to see if the glock is already locked and only
1687 * lock the glock if its not already been done. Note that its the NFS
1688 * readdirplus operation which causes this to be called (from filldir)
1689 * with the glock already held.
1690 *
1691 * Returns: errno
1692 */
1693
1694 static int gfs2_getattr(struct vfsmount *mnt, struct dentry *dentry,
1695 struct kstat *stat)
1696 {
1697 struct inode *inode = dentry->d_inode;
1698 struct gfs2_inode *ip = GFS2_I(inode);
1699 struct gfs2_holder gh;
1700 int error;
1701 int unlock = 0;
1702
1703 if (gfs2_glock_is_locked_by_me(ip->i_gl) == NULL) {
1704 error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &gh);
1705 if (error)
1706 return error;
1707 unlock = 1;
1708 }
1709
1710 generic_fillattr(inode, stat);
1711 if (unlock)
1712 gfs2_glock_dq_uninit(&gh);
1713
1714 return 0;
1715 }
1716
1717 static int gfs2_setxattr(struct dentry *dentry, const char *name,
1718 const void *data, size_t size, int flags)
1719 {
1720 struct inode *inode = dentry->d_inode;
1721 struct gfs2_inode *ip = GFS2_I(inode);
1722 struct gfs2_holder gh;
1723 int ret;
1724
1725 gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &gh);
1726 ret = gfs2_glock_nq(&gh);
1727 if (ret == 0) {
1728 ret = generic_setxattr(dentry, name, data, size, flags);
1729 gfs2_glock_dq(&gh);
1730 }
1731 gfs2_holder_uninit(&gh);
1732 return ret;
1733 }
1734
1735 static ssize_t gfs2_getxattr(struct dentry *dentry, const char *name,
1736 void *data, size_t size)
1737 {
1738 struct inode *inode = dentry->d_inode;
1739 struct gfs2_inode *ip = GFS2_I(inode);
1740 struct gfs2_holder gh;
1741 int ret;
1742
1743 gfs2_holder_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &gh);
1744 ret = gfs2_glock_nq(&gh);
1745 if (ret == 0) {
1746 ret = generic_getxattr(dentry, name, data, size);
1747 gfs2_glock_dq(&gh);
1748 }
1749 gfs2_holder_uninit(&gh);
1750 return ret;
1751 }
1752
1753 static int gfs2_removexattr(struct dentry *dentry, const char *name)
1754 {
1755 struct inode *inode = dentry->d_inode;
1756 struct gfs2_inode *ip = GFS2_I(inode);
1757 struct gfs2_holder gh;
1758 int ret;
1759
1760 gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &gh);
1761 ret = gfs2_glock_nq(&gh);
1762 if (ret == 0) {
1763 ret = generic_removexattr(dentry, name);
1764 gfs2_glock_dq(&gh);
1765 }
1766 gfs2_holder_uninit(&gh);
1767 return ret;
1768 }
1769
1770 static int gfs2_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
1771 u64 start, u64 len)
1772 {
1773 struct gfs2_inode *ip = GFS2_I(inode);
1774 struct gfs2_holder gh;
1775 int ret;
1776
1777 ret = fiemap_check_flags(fieinfo, FIEMAP_FLAG_SYNC);
1778 if (ret)
1779 return ret;
1780
1781 mutex_lock(&inode->i_mutex);
1782
1783 ret = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, 0, &gh);
1784 if (ret)
1785 goto out;
1786
1787 if (gfs2_is_stuffed(ip)) {
1788 u64 phys = ip->i_no_addr << inode->i_blkbits;
1789 u64 size = i_size_read(inode);
1790 u32 flags = FIEMAP_EXTENT_LAST|FIEMAP_EXTENT_NOT_ALIGNED|
1791 FIEMAP_EXTENT_DATA_INLINE;
1792 phys += sizeof(struct gfs2_dinode);
1793 phys += start;
1794 if (start + len > size)
1795 len = size - start;
1796 if (start < size)
1797 ret = fiemap_fill_next_extent(fieinfo, start, phys,
1798 len, flags);
1799 if (ret == 1)
1800 ret = 0;
1801 } else {
1802 ret = __generic_block_fiemap(inode, fieinfo, start, len,
1803 gfs2_block_map);
1804 }
1805
1806 gfs2_glock_dq_uninit(&gh);
1807 out:
1808 mutex_unlock(&inode->i_mutex);
1809 return ret;
1810 }
1811
1812 const struct inode_operations gfs2_file_iops = {
1813 .permission = gfs2_permission,
1814 .setattr = gfs2_setattr,
1815 .getattr = gfs2_getattr,
1816 .setxattr = gfs2_setxattr,
1817 .getxattr = gfs2_getxattr,
1818 .listxattr = gfs2_listxattr,
1819 .removexattr = gfs2_removexattr,
1820 .fiemap = gfs2_fiemap,
1821 .get_acl = gfs2_get_acl,
1822 };
1823
1824 const struct inode_operations gfs2_dir_iops = {
1825 .create = gfs2_create,
1826 .lookup = gfs2_lookup,
1827 .link = gfs2_link,
1828 .unlink = gfs2_unlink,
1829 .symlink = gfs2_symlink,
1830 .mkdir = gfs2_mkdir,
1831 .rmdir = gfs2_unlink,
1832 .mknod = gfs2_mknod,
1833 .rename = gfs2_rename,
1834 .permission = gfs2_permission,
1835 .setattr = gfs2_setattr,
1836 .getattr = gfs2_getattr,
1837 .setxattr = gfs2_setxattr,
1838 .getxattr = gfs2_getxattr,
1839 .listxattr = gfs2_listxattr,
1840 .removexattr = gfs2_removexattr,
1841 .fiemap = gfs2_fiemap,
1842 .get_acl = gfs2_get_acl,
1843 };
1844
1845 const struct inode_operations gfs2_symlink_iops = {
1846 .readlink = generic_readlink,
1847 .follow_link = gfs2_follow_link,
1848 .put_link = gfs2_put_link,
1849 .permission = gfs2_permission,
1850 .setattr = gfs2_setattr,
1851 .getattr = gfs2_getattr,
1852 .setxattr = gfs2_setxattr,
1853 .getxattr = gfs2_getxattr,
1854 .listxattr = gfs2_listxattr,
1855 .removexattr = gfs2_removexattr,
1856 .fiemap = gfs2_fiemap,
1857 .get_acl = gfs2_get_acl,
1858 };
1859
This page took 0.108931 seconds and 5 git commands to generate.