kmalloc a few large stack objects in the btrfs_ioctl path
[deliverable/linux.git] / fs / btrfs / inode.c
CommitLineData
6cbd5570
CM
1/*
2 * Copyright (C) 2007 Oracle. All rights reserved.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public
6 * License v2 as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope that it will be useful,
9 * but WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * General Public License for more details.
12 *
13 * You should have received a copy of the GNU General Public
14 * License along with this program; if not, write to the
15 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
16 * Boston, MA 021110-1307, USA.
17 */
18
39279cc3
CM
19#include <linux/buffer_head.h>
20#include <linux/fs.h>
21#include <linux/pagemap.h>
22#include <linux/highmem.h>
23#include <linux/time.h>
24#include <linux/init.h>
25#include <linux/string.h>
26#include <linux/smp_lock.h>
27#include <linux/backing-dev.h>
28#include <linux/mpage.h>
29#include <linux/swap.h>
30#include <linux/writeback.h>
31#include <linux/statfs.h>
32#include <linux/compat.h>
9ebefb18 33#include <linux/bit_spinlock.h>
92fee66d 34#include <linux/version.h>
5103e947 35#include <linux/xattr.h>
39279cc3
CM
36#include "ctree.h"
37#include "disk-io.h"
38#include "transaction.h"
39#include "btrfs_inode.h"
40#include "ioctl.h"
41#include "print-tree.h"
42
43struct btrfs_iget_args {
44 u64 ino;
45 struct btrfs_root *root;
46};
47
48static struct inode_operations btrfs_dir_inode_operations;
49static struct inode_operations btrfs_symlink_inode_operations;
50static struct inode_operations btrfs_dir_ro_inode_operations;
618e21d5 51static struct inode_operations btrfs_special_inode_operations;
39279cc3
CM
52static struct inode_operations btrfs_file_inode_operations;
53static struct address_space_operations btrfs_aops;
54static struct address_space_operations btrfs_symlink_aops;
55static struct file_operations btrfs_dir_file_operations;
07157aac 56static struct extent_map_ops btrfs_extent_map_ops;
39279cc3
CM
57
58static struct kmem_cache *btrfs_inode_cachep;
59struct kmem_cache *btrfs_trans_handle_cachep;
60struct kmem_cache *btrfs_transaction_cachep;
61struct kmem_cache *btrfs_bit_radix_cachep;
62struct kmem_cache *btrfs_path_cachep;
63
64#define S_SHIFT 12
65static unsigned char btrfs_type_by_mode[S_IFMT >> S_SHIFT] = {
66 [S_IFREG >> S_SHIFT] = BTRFS_FT_REG_FILE,
67 [S_IFDIR >> S_SHIFT] = BTRFS_FT_DIR,
68 [S_IFCHR >> S_SHIFT] = BTRFS_FT_CHRDEV,
69 [S_IFBLK >> S_SHIFT] = BTRFS_FT_BLKDEV,
70 [S_IFIFO >> S_SHIFT] = BTRFS_FT_FIFO,
71 [S_IFSOCK >> S_SHIFT] = BTRFS_FT_SOCK,
72 [S_IFLNK >> S_SHIFT] = BTRFS_FT_SYMLINK,
73};
74
be20aa9d 75static int cow_file_range(struct inode *inode, u64 start, u64 end)
b888db2b
CM
76{
77 struct btrfs_root *root = BTRFS_I(inode)->root;
78 struct btrfs_trans_handle *trans;
b888db2b 79 u64 alloc_hint = 0;
db94535d 80 u64 num_bytes;
c59f8951 81 u64 cur_alloc_size;
db94535d 82 u64 blocksize = root->sectorsize;
be20aa9d
CM
83 struct btrfs_key ins;
84 int ret;
b888db2b 85
b888db2b 86 trans = btrfs_start_transaction(root, 1);
b888db2b 87 BUG_ON(!trans);
be20aa9d
CM
88 btrfs_set_trans_block_group(trans, inode);
89
db94535d 90 num_bytes = (end - start + blocksize) & ~(blocksize - 1);
be20aa9d 91 num_bytes = max(blocksize, num_bytes);
b888db2b 92 ret = btrfs_drop_extents(trans, root, inode,
3326d1b0 93 start, start + num_bytes, start, &alloc_hint);
db94535d 94
179e29e4
CM
95 if (alloc_hint == EXTENT_MAP_INLINE)
96 goto out;
97
c59f8951
CM
98 while(num_bytes > 0) {
99 cur_alloc_size = min(num_bytes, root->fs_info->max_extent);
100 ret = btrfs_alloc_extent(trans, root, cur_alloc_size,
101 root->root_key.objectid,
102 trans->transid,
103 inode->i_ino, start, 0,
104 alloc_hint, (u64)-1, &ins, 1);
105 if (ret) {
106 WARN_ON(1);
107 goto out;
108 }
109 ret = btrfs_insert_file_extent(trans, root, inode->i_ino,
110 start, ins.objectid, ins.offset,
111 ins.offset);
112 num_bytes -= cur_alloc_size;
113 alloc_hint = ins.objectid + ins.offset;
114 start += cur_alloc_size;
b888db2b 115 }
b888db2b
CM
116out:
117 btrfs_end_transaction(trans, root);
be20aa9d
CM
118 return ret;
119}
120
121static int run_delalloc_nocow(struct inode *inode, u64 start, u64 end)
122{
123 u64 extent_start;
124 u64 extent_end;
125 u64 bytenr;
126 u64 cow_end;
127 struct btrfs_root *root = BTRFS_I(inode)->root;
128 struct extent_buffer *leaf;
129 int found_type;
130 struct btrfs_path *path;
131 struct btrfs_file_extent_item *item;
132 int ret;
133 int err;
134 struct btrfs_key found_key;
135
136 path = btrfs_alloc_path();
137 BUG_ON(!path);
138again:
139 ret = btrfs_lookup_file_extent(NULL, root, path,
140 inode->i_ino, start, 0);
141 if (ret < 0) {
142 btrfs_free_path(path);
143 return ret;
144 }
145
146 cow_end = end;
147 if (ret != 0) {
148 if (path->slots[0] == 0)
149 goto not_found;
150 path->slots[0]--;
151 }
152
153 leaf = path->nodes[0];
154 item = btrfs_item_ptr(leaf, path->slots[0],
155 struct btrfs_file_extent_item);
156
157 /* are we inside the extent that was found? */
158 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
159 found_type = btrfs_key_type(&found_key);
160 if (found_key.objectid != inode->i_ino ||
161 found_type != BTRFS_EXTENT_DATA_KEY) {
162 goto not_found;
163 }
164
165 found_type = btrfs_file_extent_type(leaf, item);
166 extent_start = found_key.offset;
167 if (found_type == BTRFS_FILE_EXTENT_REG) {
168 extent_end = extent_start +
169 btrfs_file_extent_num_bytes(leaf, item);
170 err = 0;
171
172 if (start < extent_start || start >= extent_end)
173 goto not_found;
174
175 cow_end = min(end, extent_end - 1);
176 bytenr = btrfs_file_extent_disk_bytenr(leaf, item);
177 if (bytenr == 0)
178 goto not_found;
179
180 bytenr += btrfs_file_extent_offset(leaf, item);
181 if (btrfs_count_snapshots_in_path(root, path, bytenr) != 1) {
182 goto not_found;
183 }
184
185 start = extent_end;
186 } else if (found_type == BTRFS_FILE_EXTENT_INLINE) {
187 goto not_found;
188 }
189loop:
190 if (start > end) {
191 btrfs_free_path(path);
192 return 0;
193 }
194 btrfs_release_path(root, path);
195 goto again;
196
197not_found:
198 cow_file_range(inode, start, cow_end);
199 start = cow_end + 1;
200 goto loop;
201}
202
203static int run_delalloc_range(struct inode *inode, u64 start, u64 end)
204{
205 struct btrfs_root *root = BTRFS_I(inode)->root;
206 int ret;
207
208 mutex_lock(&root->fs_info->fs_mutex);
209 if (btrfs_test_opt(root, NODATACOW))
210 ret = run_delalloc_nocow(inode, start, end);
211 else
212 ret = cow_file_range(inode, start, end);
b888db2b
CM
213 mutex_unlock(&root->fs_info->fs_mutex);
214 return ret;
215}
216
07157aac
CM
217int btrfs_writepage_io_hook(struct page *page, u64 start, u64 end)
218{
219 struct inode *inode = page->mapping->host;
220 struct btrfs_root *root = BTRFS_I(inode)->root;
221 struct btrfs_trans_handle *trans;
222 char *kaddr;
b6cda9bc 223 int ret = 0;
35ebb934 224 u64 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
07157aac
CM
225 size_t offset = start - page_start;
226
b6cda9bc
CM
227 if (btrfs_test_opt(root, NODATASUM))
228 return 0;
229
07157aac
CM
230 mutex_lock(&root->fs_info->fs_mutex);
231 trans = btrfs_start_transaction(root, 1);
232 btrfs_set_trans_block_group(trans, inode);
233 kaddr = kmap(page);
f578d4bd 234 btrfs_csum_file_block(trans, root, inode, inode->i_ino,
07157aac
CM
235 start, kaddr + offset, end - start + 1);
236 kunmap(page);
237 ret = btrfs_end_transaction(trans, root);
238 BUG_ON(ret);
239 mutex_unlock(&root->fs_info->fs_mutex);
240 return ret;
241}
242
243int btrfs_readpage_io_hook(struct page *page, u64 start, u64 end)
244{
245 int ret = 0;
246 struct inode *inode = page->mapping->host;
247 struct btrfs_root *root = BTRFS_I(inode)->root;
248 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
249 struct btrfs_csum_item *item;
250 struct btrfs_path *path = NULL;
ff79f819 251 u32 csum;
07157aac 252
b6cda9bc
CM
253 if (btrfs_test_opt(root, NODATASUM))
254 return 0;
255
07157aac
CM
256 mutex_lock(&root->fs_info->fs_mutex);
257 path = btrfs_alloc_path();
258 item = btrfs_lookup_csum(NULL, root, path, inode->i_ino, start, 0);
259 if (IS_ERR(item)) {
260 ret = PTR_ERR(item);
261 /* a csum that isn't present is a preallocated region. */
262 if (ret == -ENOENT || ret == -EFBIG)
263 ret = 0;
ff79f819 264 csum = 0;
07157aac
CM
265 goto out;
266 }
ff79f819
CM
267 read_extent_buffer(path->nodes[0], &csum, (unsigned long)item,
268 BTRFS_CRC32_SIZE);
269 set_state_private(em_tree, start, csum);
07157aac
CM
270out:
271 if (path)
272 btrfs_free_path(path);
273 mutex_unlock(&root->fs_info->fs_mutex);
274 return ret;
275}
276
277int btrfs_readpage_end_io_hook(struct page *page, u64 start, u64 end)
278{
35ebb934 279 size_t offset = start - ((u64)page->index << PAGE_CACHE_SHIFT);
07157aac 280 struct inode *inode = page->mapping->host;
07157aac
CM
281 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
282 char *kaddr;
283 u64 private;
284 int ret;
ff79f819
CM
285 struct btrfs_root *root = BTRFS_I(inode)->root;
286 u32 csum = ~(u32)0;
bbf0d006 287 unsigned long flags;
07157aac 288
b6cda9bc
CM
289 if (btrfs_test_opt(root, NODATASUM))
290 return 0;
291
07157aac 292 ret = get_state_private(em_tree, start, &private);
bbf0d006 293 local_irq_save(flags);
07157aac
CM
294 kaddr = kmap_atomic(page, KM_IRQ0);
295 if (ret) {
296 goto zeroit;
297 }
ff79f819
CM
298 csum = btrfs_csum_data(root, kaddr + offset, csum, end - start + 1);
299 btrfs_csum_final(csum, (char *)&csum);
300 if (csum != private) {
07157aac
CM
301 goto zeroit;
302 }
303 kunmap_atomic(kaddr, KM_IRQ0);
bbf0d006 304 local_irq_restore(flags);
07157aac
CM
305 return 0;
306
307zeroit:
308 printk("btrfs csum failed ino %lu off %llu\n",
309 page->mapping->host->i_ino, (unsigned long long)start);
db94535d
CM
310 memset(kaddr + offset, 1, end - start + 1);
311 flush_dcache_page(page);
07157aac 312 kunmap_atomic(kaddr, KM_IRQ0);
bbf0d006 313 local_irq_restore(flags);
07157aac
CM
314 return 0;
315}
b888db2b 316
39279cc3
CM
317void btrfs_read_locked_inode(struct inode *inode)
318{
319 struct btrfs_path *path;
5f39d397 320 struct extent_buffer *leaf;
39279cc3 321 struct btrfs_inode_item *inode_item;
5f39d397 322 struct btrfs_inode_timespec *tspec;
39279cc3
CM
323 struct btrfs_root *root = BTRFS_I(inode)->root;
324 struct btrfs_key location;
325 u64 alloc_group_block;
618e21d5 326 u32 rdev;
39279cc3
CM
327 int ret;
328
329 path = btrfs_alloc_path();
330 BUG_ON(!path);
39279cc3
CM
331 mutex_lock(&root->fs_info->fs_mutex);
332
333 memcpy(&location, &BTRFS_I(inode)->location, sizeof(location));
334 ret = btrfs_lookup_inode(NULL, root, path, &location, 0);
5f39d397 335 if (ret)
39279cc3 336 goto make_bad;
39279cc3 337
5f39d397
CM
338 leaf = path->nodes[0];
339 inode_item = btrfs_item_ptr(leaf, path->slots[0],
340 struct btrfs_inode_item);
341
342 inode->i_mode = btrfs_inode_mode(leaf, inode_item);
343 inode->i_nlink = btrfs_inode_nlink(leaf, inode_item);
344 inode->i_uid = btrfs_inode_uid(leaf, inode_item);
345 inode->i_gid = btrfs_inode_gid(leaf, inode_item);
346 inode->i_size = btrfs_inode_size(leaf, inode_item);
347
348 tspec = btrfs_inode_atime(inode_item);
349 inode->i_atime.tv_sec = btrfs_timespec_sec(leaf, tspec);
350 inode->i_atime.tv_nsec = btrfs_timespec_nsec(leaf, tspec);
351
352 tspec = btrfs_inode_mtime(inode_item);
353 inode->i_mtime.tv_sec = btrfs_timespec_sec(leaf, tspec);
354 inode->i_mtime.tv_nsec = btrfs_timespec_nsec(leaf, tspec);
355
356 tspec = btrfs_inode_ctime(inode_item);
357 inode->i_ctime.tv_sec = btrfs_timespec_sec(leaf, tspec);
358 inode->i_ctime.tv_nsec = btrfs_timespec_nsec(leaf, tspec);
359
360 inode->i_blocks = btrfs_inode_nblocks(leaf, inode_item);
361 inode->i_generation = btrfs_inode_generation(leaf, inode_item);
618e21d5 362 inode->i_rdev = 0;
5f39d397
CM
363 rdev = btrfs_inode_rdev(leaf, inode_item);
364
365 alloc_group_block = btrfs_inode_block_group(leaf, inode_item);
39279cc3
CM
366 BTRFS_I(inode)->block_group = btrfs_lookup_block_group(root->fs_info,
367 alloc_group_block);
368
369 btrfs_free_path(path);
370 inode_item = NULL;
371
372 mutex_unlock(&root->fs_info->fs_mutex);
373
374 switch (inode->i_mode & S_IFMT) {
39279cc3
CM
375 case S_IFREG:
376 inode->i_mapping->a_ops = &btrfs_aops;
07157aac 377 BTRFS_I(inode)->extent_tree.ops = &btrfs_extent_map_ops;
39279cc3
CM
378 inode->i_fop = &btrfs_file_operations;
379 inode->i_op = &btrfs_file_inode_operations;
380 break;
381 case S_IFDIR:
382 inode->i_fop = &btrfs_dir_file_operations;
383 if (root == root->fs_info->tree_root)
384 inode->i_op = &btrfs_dir_ro_inode_operations;
385 else
386 inode->i_op = &btrfs_dir_inode_operations;
387 break;
388 case S_IFLNK:
389 inode->i_op = &btrfs_symlink_inode_operations;
390 inode->i_mapping->a_ops = &btrfs_symlink_aops;
391 break;
618e21d5
JB
392 default:
393 init_special_inode(inode, inode->i_mode, rdev);
394 break;
39279cc3
CM
395 }
396 return;
397
398make_bad:
399 btrfs_release_path(root, path);
400 btrfs_free_path(path);
401 mutex_unlock(&root->fs_info->fs_mutex);
402 make_bad_inode(inode);
403}
404
5f39d397
CM
405static void fill_inode_item(struct extent_buffer *leaf,
406 struct btrfs_inode_item *item,
39279cc3
CM
407 struct inode *inode)
408{
5f39d397
CM
409 btrfs_set_inode_uid(leaf, item, inode->i_uid);
410 btrfs_set_inode_gid(leaf, item, inode->i_gid);
411 btrfs_set_inode_size(leaf, item, inode->i_size);
412 btrfs_set_inode_mode(leaf, item, inode->i_mode);
413 btrfs_set_inode_nlink(leaf, item, inode->i_nlink);
414
415 btrfs_set_timespec_sec(leaf, btrfs_inode_atime(item),
416 inode->i_atime.tv_sec);
417 btrfs_set_timespec_nsec(leaf, btrfs_inode_atime(item),
418 inode->i_atime.tv_nsec);
419
420 btrfs_set_timespec_sec(leaf, btrfs_inode_mtime(item),
421 inode->i_mtime.tv_sec);
422 btrfs_set_timespec_nsec(leaf, btrfs_inode_mtime(item),
423 inode->i_mtime.tv_nsec);
424
425 btrfs_set_timespec_sec(leaf, btrfs_inode_ctime(item),
426 inode->i_ctime.tv_sec);
427 btrfs_set_timespec_nsec(leaf, btrfs_inode_ctime(item),
428 inode->i_ctime.tv_nsec);
429
430 btrfs_set_inode_nblocks(leaf, item, inode->i_blocks);
431 btrfs_set_inode_generation(leaf, item, inode->i_generation);
432 btrfs_set_inode_rdev(leaf, item, inode->i_rdev);
433 btrfs_set_inode_block_group(leaf, item,
39279cc3
CM
434 BTRFS_I(inode)->block_group->key.objectid);
435}
436
a52d9a80 437int btrfs_update_inode(struct btrfs_trans_handle *trans,
39279cc3
CM
438 struct btrfs_root *root,
439 struct inode *inode)
440{
441 struct btrfs_inode_item *inode_item;
442 struct btrfs_path *path;
5f39d397 443 struct extent_buffer *leaf;
39279cc3
CM
444 int ret;
445
446 path = btrfs_alloc_path();
447 BUG_ON(!path);
39279cc3
CM
448 ret = btrfs_lookup_inode(trans, root, path,
449 &BTRFS_I(inode)->location, 1);
450 if (ret) {
451 if (ret > 0)
452 ret = -ENOENT;
453 goto failed;
454 }
455
5f39d397
CM
456 leaf = path->nodes[0];
457 inode_item = btrfs_item_ptr(leaf, path->slots[0],
39279cc3
CM
458 struct btrfs_inode_item);
459
5f39d397
CM
460 fill_inode_item(leaf, inode_item, inode);
461 btrfs_mark_buffer_dirty(leaf);
15ee9bc7 462 btrfs_set_inode_last_trans(trans, inode);
39279cc3
CM
463 ret = 0;
464failed:
465 btrfs_release_path(root, path);
466 btrfs_free_path(path);
467 return ret;
468}
469
470
471static int btrfs_unlink_trans(struct btrfs_trans_handle *trans,
472 struct btrfs_root *root,
473 struct inode *dir,
474 struct dentry *dentry)
475{
476 struct btrfs_path *path;
477 const char *name = dentry->d_name.name;
478 int name_len = dentry->d_name.len;
479 int ret = 0;
5f39d397 480 struct extent_buffer *leaf;
39279cc3 481 struct btrfs_dir_item *di;
5f39d397 482 struct btrfs_key key;
39279cc3
CM
483
484 path = btrfs_alloc_path();
54aa1f4d
CM
485 if (!path) {
486 ret = -ENOMEM;
487 goto err;
488 }
489
39279cc3
CM
490 di = btrfs_lookup_dir_item(trans, root, path, dir->i_ino,
491 name, name_len, -1);
492 if (IS_ERR(di)) {
493 ret = PTR_ERR(di);
494 goto err;
495 }
496 if (!di) {
497 ret = -ENOENT;
498 goto err;
499 }
5f39d397
CM
500 leaf = path->nodes[0];
501 btrfs_dir_item_key_to_cpu(leaf, di, &key);
39279cc3 502 ret = btrfs_delete_one_dir_name(trans, root, path, di);
54aa1f4d
CM
503 if (ret)
504 goto err;
39279cc3
CM
505 btrfs_release_path(root, path);
506
507 di = btrfs_lookup_dir_index_item(trans, root, path, dir->i_ino,
5f39d397 508 key.objectid, name, name_len, -1);
39279cc3
CM
509 if (IS_ERR(di)) {
510 ret = PTR_ERR(di);
511 goto err;
512 }
513 if (!di) {
514 ret = -ENOENT;
515 goto err;
516 }
517 ret = btrfs_delete_one_dir_name(trans, root, path, di);
39279cc3
CM
518
519 dentry->d_inode->i_ctime = dir->i_ctime;
76fea00a
CM
520 ret = btrfs_del_inode_ref(trans, root, name, name_len,
521 dentry->d_inode->i_ino,
522 dentry->d_parent->d_inode->i_ino);
523 if (ret) {
524 printk("failed to delete reference to %.*s, "
525 "inode %lu parent %lu\n", name_len, name,
526 dentry->d_inode->i_ino,
527 dentry->d_parent->d_inode->i_ino);
3954401f 528 }
39279cc3
CM
529err:
530 btrfs_free_path(path);
531 if (!ret) {
532 dir->i_size -= name_len * 2;
79c44584 533 dir->i_mtime = dir->i_ctime = CURRENT_TIME;
39279cc3 534 btrfs_update_inode(trans, root, dir);
6da6abae
CM
535#if LINUX_VERSION_CODE <= KERNEL_VERSION(2,6,18)
536 dentry->d_inode->i_nlink--;
537#else
39279cc3 538 drop_nlink(dentry->d_inode);
6da6abae 539#endif
54aa1f4d 540 ret = btrfs_update_inode(trans, root, dentry->d_inode);
39279cc3
CM
541 dir->i_sb->s_dirt = 1;
542 }
543 return ret;
544}
545
546static int btrfs_unlink(struct inode *dir, struct dentry *dentry)
547{
548 struct btrfs_root *root;
549 struct btrfs_trans_handle *trans;
550 int ret;
d3c2fdcf 551 unsigned long nr;
39279cc3
CM
552
553 root = BTRFS_I(dir)->root;
554 mutex_lock(&root->fs_info->fs_mutex);
555 trans = btrfs_start_transaction(root, 1);
5f39d397 556
39279cc3
CM
557 btrfs_set_trans_block_group(trans, dir);
558 ret = btrfs_unlink_trans(trans, root, dir, dentry);
d3c2fdcf 559 nr = trans->blocks_used;
5f39d397 560
39279cc3
CM
561 btrfs_end_transaction(trans, root);
562 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 563 btrfs_btree_balance_dirty(root, nr);
5f39d397 564
39279cc3
CM
565 return ret;
566}
567
568static int btrfs_rmdir(struct inode *dir, struct dentry *dentry)
569{
570 struct inode *inode = dentry->d_inode;
571 int err;
572 int ret;
573 struct btrfs_root *root = BTRFS_I(dir)->root;
39279cc3 574 struct btrfs_trans_handle *trans;
d3c2fdcf 575 unsigned long nr;
39279cc3 576
134d4512
Y
577 if (inode->i_size > BTRFS_EMPTY_DIR_SIZE)
578 return -ENOTEMPTY;
579
39279cc3
CM
580 mutex_lock(&root->fs_info->fs_mutex);
581 trans = btrfs_start_transaction(root, 1);
582 btrfs_set_trans_block_group(trans, dir);
39279cc3
CM
583
584 /* now the directory is empty */
585 err = btrfs_unlink_trans(trans, root, dir, dentry);
586 if (!err) {
587 inode->i_size = 0;
588 }
3954401f 589
d3c2fdcf 590 nr = trans->blocks_used;
39279cc3 591 ret = btrfs_end_transaction(trans, root);
134d4512 592 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 593 btrfs_btree_balance_dirty(root, nr);
3954401f 594
39279cc3
CM
595 if (ret && !err)
596 err = ret;
597 return err;
598}
599
600static int btrfs_free_inode(struct btrfs_trans_handle *trans,
601 struct btrfs_root *root,
602 struct inode *inode)
603{
604 struct btrfs_path *path;
605 int ret;
606
607 clear_inode(inode);
608
609 path = btrfs_alloc_path();
610 BUG_ON(!path);
39279cc3
CM
611 ret = btrfs_lookup_inode(trans, root, path,
612 &BTRFS_I(inode)->location, -1);
54aa1f4d
CM
613 if (ret > 0)
614 ret = -ENOENT;
615 if (!ret)
616 ret = btrfs_del_item(trans, root, path);
39279cc3
CM
617 btrfs_free_path(path);
618 return ret;
619}
620
39279cc3
CM
621/*
622 * this can truncate away extent items, csum items and directory items.
623 * It starts at a high offset and removes keys until it can't find
624 * any higher than i_size.
625 *
626 * csum items that cross the new i_size are truncated to the new size
627 * as well.
628 */
629static int btrfs_truncate_in_trans(struct btrfs_trans_handle *trans,
630 struct btrfs_root *root,
631 struct inode *inode)
632{
633 int ret;
634 struct btrfs_path *path;
635 struct btrfs_key key;
5f39d397 636 struct btrfs_key found_key;
39279cc3 637 u32 found_type;
5f39d397 638 struct extent_buffer *leaf;
39279cc3
CM
639 struct btrfs_file_extent_item *fi;
640 u64 extent_start = 0;
db94535d 641 u64 extent_num_bytes = 0;
39279cc3 642 u64 item_end = 0;
7bb86316 643 u64 root_gen = 0;
d8d5f3e1 644 u64 root_owner = 0;
39279cc3
CM
645 int found_extent;
646 int del_item;
179e29e4 647 int extent_type = -1;
39279cc3 648
a52d9a80 649 btrfs_drop_extent_cache(inode, inode->i_size, (u64)-1);
39279cc3 650 path = btrfs_alloc_path();
3c69faec 651 path->reada = -1;
39279cc3 652 BUG_ON(!path);
5f39d397 653
39279cc3
CM
654 /* FIXME, add redo link to tree so we don't leak on crash */
655 key.objectid = inode->i_ino;
656 key.offset = (u64)-1;
5f39d397
CM
657 key.type = (u8)-1;
658
39279cc3
CM
659 while(1) {
660 btrfs_init_path(path);
661 fi = NULL;
662 ret = btrfs_search_slot(trans, root, &key, path, -1, 1);
663 if (ret < 0) {
664 goto error;
665 }
666 if (ret > 0) {
667 BUG_ON(path->slots[0] == 0);
668 path->slots[0]--;
669 }
5f39d397
CM
670 leaf = path->nodes[0];
671 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
672 found_type = btrfs_key_type(&found_key);
39279cc3 673
5f39d397 674 if (found_key.objectid != inode->i_ino)
39279cc3 675 break;
5f39d397 676
39279cc3
CM
677 if (found_type != BTRFS_CSUM_ITEM_KEY &&
678 found_type != BTRFS_DIR_ITEM_KEY &&
679 found_type != BTRFS_DIR_INDEX_KEY &&
680 found_type != BTRFS_EXTENT_DATA_KEY)
681 break;
682
5f39d397 683 item_end = found_key.offset;
39279cc3 684 if (found_type == BTRFS_EXTENT_DATA_KEY) {
5f39d397 685 fi = btrfs_item_ptr(leaf, path->slots[0],
39279cc3 686 struct btrfs_file_extent_item);
179e29e4
CM
687 extent_type = btrfs_file_extent_type(leaf, fi);
688 if (extent_type != BTRFS_FILE_EXTENT_INLINE) {
5f39d397 689 item_end +=
db94535d 690 btrfs_file_extent_num_bytes(leaf, fi);
179e29e4
CM
691 } else if (extent_type == BTRFS_FILE_EXTENT_INLINE) {
692 struct btrfs_item *item = btrfs_item_nr(leaf,
693 path->slots[0]);
694 item_end += btrfs_file_extent_inline_len(leaf,
695 item);
39279cc3 696 }
008630c1 697 item_end--;
39279cc3
CM
698 }
699 if (found_type == BTRFS_CSUM_ITEM_KEY) {
700 ret = btrfs_csum_truncate(trans, root, path,
701 inode->i_size);
702 BUG_ON(ret);
703 }
008630c1 704 if (item_end < inode->i_size) {
b888db2b
CM
705 if (found_type == BTRFS_DIR_ITEM_KEY) {
706 found_type = BTRFS_INODE_ITEM_KEY;
707 } else if (found_type == BTRFS_EXTENT_ITEM_KEY) {
708 found_type = BTRFS_CSUM_ITEM_KEY;
709 } else if (found_type) {
710 found_type--;
711 } else {
712 break;
39279cc3 713 }
a61721d5 714 btrfs_set_key_type(&key, found_type);
65555a06 715 btrfs_release_path(root, path);
b888db2b 716 continue;
39279cc3 717 }
5f39d397 718 if (found_key.offset >= inode->i_size)
39279cc3
CM
719 del_item = 1;
720 else
721 del_item = 0;
722 found_extent = 0;
723
724 /* FIXME, shrink the extent if the ref count is only 1 */
179e29e4
CM
725 if (found_type != BTRFS_EXTENT_DATA_KEY)
726 goto delete;
727
728 if (extent_type != BTRFS_FILE_EXTENT_INLINE) {
39279cc3 729 u64 num_dec;
db94535d 730 extent_start = btrfs_file_extent_disk_bytenr(leaf, fi);
39279cc3 731 if (!del_item) {
db94535d
CM
732 u64 orig_num_bytes =
733 btrfs_file_extent_num_bytes(leaf, fi);
734 extent_num_bytes = inode->i_size -
5f39d397 735 found_key.offset + root->sectorsize - 1;
db94535d
CM
736 btrfs_set_file_extent_num_bytes(leaf, fi,
737 extent_num_bytes);
738 num_dec = (orig_num_bytes -
739 extent_num_bytes) >> 9;
bab9fb03
Y
740 if (extent_start != 0) {
741 inode->i_blocks -= num_dec;
742 }
5f39d397 743 btrfs_mark_buffer_dirty(leaf);
39279cc3 744 } else {
db94535d
CM
745 extent_num_bytes =
746 btrfs_file_extent_disk_num_bytes(leaf,
747 fi);
39279cc3 748 /* FIXME blocksize != 4096 */
db94535d
CM
749 num_dec = btrfs_file_extent_num_bytes(leaf,
750 fi) >> 9;
39279cc3
CM
751 if (extent_start != 0) {
752 found_extent = 1;
753 inode->i_blocks -= num_dec;
754 }
d8d5f3e1
CM
755 root_gen = btrfs_header_generation(leaf);
756 root_owner = btrfs_header_owner(leaf);
39279cc3 757 }
179e29e4
CM
758 } else if (extent_type == BTRFS_FILE_EXTENT_INLINE &&
759 !del_item) {
760 u32 newsize = inode->i_size - found_key.offset;
761 newsize = btrfs_file_extent_calc_inline_size(newsize);
762 ret = btrfs_truncate_item(trans, root, path,
763 newsize, 1);
764 BUG_ON(ret);
39279cc3 765 }
179e29e4 766delete:
39279cc3
CM
767 if (del_item) {
768 ret = btrfs_del_item(trans, root, path);
54aa1f4d
CM
769 if (ret)
770 goto error;
39279cc3
CM
771 } else {
772 break;
773 }
774 btrfs_release_path(root, path);
775 if (found_extent) {
776 ret = btrfs_free_extent(trans, root, extent_start,
7bb86316 777 extent_num_bytes,
d8d5f3e1 778 root_owner,
7bb86316
CM
779 root_gen, inode->i_ino,
780 found_key.offset, 0);
39279cc3
CM
781 BUG_ON(ret);
782 }
783 }
784 ret = 0;
785error:
786 btrfs_release_path(root, path);
787 btrfs_free_path(path);
788 inode->i_sb->s_dirt = 1;
789 return ret;
790}
791
b888db2b 792static int btrfs_cow_one_page(struct inode *inode, struct page *page,
a52d9a80
CM
793 size_t zero_start)
794{
795 char *kaddr;
796 int ret = 0;
b888db2b 797 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
35ebb934 798 u64 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
b888db2b 799 u64 page_end = page_start + PAGE_CACHE_SIZE - 1;
a52d9a80 800
b3cfa35a 801 set_page_extent_mapped(page);
a52d9a80 802
b888db2b
CM
803 lock_extent(em_tree, page_start, page_end, GFP_NOFS);
804 set_extent_delalloc(&BTRFS_I(inode)->extent_tree, page_start,
805 page_end, GFP_NOFS);
a52d9a80 806 if (zero_start != PAGE_CACHE_SIZE) {
b888db2b 807 kaddr = kmap(page);
a52d9a80
CM
808 memset(kaddr + zero_start, 0, PAGE_CACHE_SIZE - zero_start);
809 flush_dcache_page(page);
b888db2b 810 kunmap(page);
a52d9a80 811 }
b888db2b
CM
812 set_page_dirty(page);
813 unlock_extent(em_tree, page_start, page_end, GFP_NOFS);
a52d9a80 814
a52d9a80
CM
815 return ret;
816}
817
39279cc3
CM
818/*
819 * taken from block_truncate_page, but does cow as it zeros out
820 * any bytes left in the last page in the file.
821 */
822static int btrfs_truncate_page(struct address_space *mapping, loff_t from)
823{
824 struct inode *inode = mapping->host;
db94535d
CM
825 struct btrfs_root *root = BTRFS_I(inode)->root;
826 u32 blocksize = root->sectorsize;
39279cc3
CM
827 pgoff_t index = from >> PAGE_CACHE_SHIFT;
828 unsigned offset = from & (PAGE_CACHE_SIZE-1);
829 struct page *page;
39279cc3 830 int ret = 0;
a52d9a80 831 u64 page_start;
39279cc3
CM
832
833 if ((offset & (blocksize - 1)) == 0)
834 goto out;
835
db94535d 836 down_read(&root->snap_sem);
39279cc3
CM
837 ret = -ENOMEM;
838 page = grab_cache_page(mapping, index);
839 if (!page)
840 goto out;
39279cc3 841 if (!PageUptodate(page)) {
9ebefb18 842 ret = btrfs_readpage(NULL, page);
39279cc3
CM
843 lock_page(page);
844 if (!PageUptodate(page)) {
845 ret = -EIO;
846 goto out;
847 }
848 }
35ebb934 849 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
a52d9a80 850
b888db2b 851 ret = btrfs_cow_one_page(inode, page, offset);
39279cc3 852
39279cc3
CM
853 unlock_page(page);
854 page_cache_release(page);
011410bd 855 up_read(&BTRFS_I(inode)->root->snap_sem);
39279cc3
CM
856out:
857 return ret;
858}
859
860static int btrfs_setattr(struct dentry *dentry, struct iattr *attr)
861{
862 struct inode *inode = dentry->d_inode;
863 int err;
864
865 err = inode_change_ok(inode, attr);
866 if (err)
867 return err;
868
869 if (S_ISREG(inode->i_mode) &&
870 attr->ia_valid & ATTR_SIZE && attr->ia_size > inode->i_size) {
871 struct btrfs_trans_handle *trans;
872 struct btrfs_root *root = BTRFS_I(inode)->root;
2bf5a725
CM
873 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
874
5f39d397 875 u64 mask = root->sectorsize - 1;
39279cc3 876 u64 pos = (inode->i_size + mask) & ~mask;
2bf5a725 877 u64 block_end = attr->ia_size | mask;
39279cc3 878 u64 hole_size;
179e29e4 879 u64 alloc_hint = 0;
39279cc3
CM
880
881 if (attr->ia_size <= pos)
882 goto out;
883
884 btrfs_truncate_page(inode->i_mapping, inode->i_size);
885
2bf5a725 886 lock_extent(em_tree, pos, block_end, GFP_NOFS);
39279cc3 887 hole_size = (attr->ia_size - pos + mask) & ~mask;
39279cc3
CM
888
889 mutex_lock(&root->fs_info->fs_mutex);
890 trans = btrfs_start_transaction(root, 1);
891 btrfs_set_trans_block_group(trans, inode);
2bf5a725 892 err = btrfs_drop_extents(trans, root, inode,
3326d1b0
CM
893 pos, pos + hole_size, pos,
894 &alloc_hint);
2bf5a725 895
179e29e4
CM
896 if (alloc_hint != EXTENT_MAP_INLINE) {
897 err = btrfs_insert_file_extent(trans, root,
898 inode->i_ino,
899 pos, 0, 0, hole_size);
900 }
39279cc3
CM
901 btrfs_end_transaction(trans, root);
902 mutex_unlock(&root->fs_info->fs_mutex);
2bf5a725 903 unlock_extent(em_tree, pos, block_end, GFP_NOFS);
54aa1f4d
CM
904 if (err)
905 return err;
39279cc3
CM
906 }
907out:
908 err = inode_setattr(inode, attr);
909
910 return err;
911}
912void btrfs_delete_inode(struct inode *inode)
913{
914 struct btrfs_trans_handle *trans;
915 struct btrfs_root *root = BTRFS_I(inode)->root;
d3c2fdcf 916 unsigned long nr;
39279cc3
CM
917 int ret;
918
919 truncate_inode_pages(&inode->i_data, 0);
920 if (is_bad_inode(inode)) {
921 goto no_delete;
922 }
5f39d397 923
39279cc3
CM
924 inode->i_size = 0;
925 mutex_lock(&root->fs_info->fs_mutex);
926 trans = btrfs_start_transaction(root, 1);
5f39d397 927
39279cc3
CM
928 btrfs_set_trans_block_group(trans, inode);
929 ret = btrfs_truncate_in_trans(trans, root, inode);
5103e947
JB
930 if (ret)
931 goto no_delete_lock;
932 ret = btrfs_delete_xattrs(trans, root, inode);
54aa1f4d
CM
933 if (ret)
934 goto no_delete_lock;
935 ret = btrfs_free_inode(trans, root, inode);
936 if (ret)
937 goto no_delete_lock;
d3c2fdcf 938 nr = trans->blocks_used;
5f39d397 939
39279cc3
CM
940 btrfs_end_transaction(trans, root);
941 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 942 btrfs_btree_balance_dirty(root, nr);
39279cc3 943 return;
54aa1f4d
CM
944
945no_delete_lock:
d3c2fdcf 946 nr = trans->blocks_used;
54aa1f4d
CM
947 btrfs_end_transaction(trans, root);
948 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 949 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
950no_delete:
951 clear_inode(inode);
952}
953
954/*
955 * this returns the key found in the dir entry in the location pointer.
956 * If no dir entries were found, location->objectid is 0.
957 */
958static int btrfs_inode_by_name(struct inode *dir, struct dentry *dentry,
959 struct btrfs_key *location)
960{
961 const char *name = dentry->d_name.name;
962 int namelen = dentry->d_name.len;
963 struct btrfs_dir_item *di;
964 struct btrfs_path *path;
965 struct btrfs_root *root = BTRFS_I(dir)->root;
0d9f7f3e 966 int ret = 0;
39279cc3 967
3954401f
CM
968 if (namelen == 1 && strcmp(name, ".") == 0) {
969 location->objectid = dir->i_ino;
970 location->type = BTRFS_INODE_ITEM_KEY;
971 location->offset = 0;
972 return 0;
973 }
39279cc3
CM
974 path = btrfs_alloc_path();
975 BUG_ON(!path);
3954401f 976
7a720536 977 if (namelen == 2 && strcmp(name, "..") == 0) {
3954401f
CM
978 struct btrfs_key key;
979 struct extent_buffer *leaf;
980 u32 nritems;
981 int slot;
982
983 key.objectid = dir->i_ino;
984 btrfs_set_key_type(&key, BTRFS_INODE_REF_KEY);
985 key.offset = 0;
986 ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
987 BUG_ON(ret == 0);
988 ret = 0;
989
990 leaf = path->nodes[0];
991 slot = path->slots[0];
992 nritems = btrfs_header_nritems(leaf);
993 if (slot >= nritems)
994 goto out_err;
995
996 btrfs_item_key_to_cpu(leaf, &key, slot);
997 if (key.objectid != dir->i_ino ||
998 key.type != BTRFS_INODE_REF_KEY) {
999 goto out_err;
1000 }
1001 location->objectid = key.offset;
1002 location->type = BTRFS_INODE_ITEM_KEY;
1003 location->offset = 0;
1004 goto out;
1005 }
1006
39279cc3
CM
1007 di = btrfs_lookup_dir_item(NULL, root, path, dir->i_ino, name,
1008 namelen, 0);
0d9f7f3e
Y
1009 if (IS_ERR(di))
1010 ret = PTR_ERR(di);
39279cc3 1011 if (!di || IS_ERR(di)) {
3954401f 1012 goto out_err;
39279cc3 1013 }
5f39d397 1014 btrfs_dir_item_key_to_cpu(path->nodes[0], di, location);
39279cc3 1015out:
39279cc3
CM
1016 btrfs_free_path(path);
1017 return ret;
3954401f
CM
1018out_err:
1019 location->objectid = 0;
1020 goto out;
39279cc3
CM
1021}
1022
1023/*
1024 * when we hit a tree root in a directory, the btrfs part of the inode
1025 * needs to be changed to reflect the root directory of the tree root. This
1026 * is kind of like crossing a mount point.
1027 */
1028static int fixup_tree_root_location(struct btrfs_root *root,
1029 struct btrfs_key *location,
58176a96
JB
1030 struct btrfs_root **sub_root,
1031 struct dentry *dentry)
39279cc3
CM
1032{
1033 struct btrfs_path *path;
1034 struct btrfs_root_item *ri;
1035
1036 if (btrfs_key_type(location) != BTRFS_ROOT_ITEM_KEY)
1037 return 0;
1038 if (location->objectid == BTRFS_ROOT_TREE_OBJECTID)
1039 return 0;
1040
1041 path = btrfs_alloc_path();
1042 BUG_ON(!path);
1043 mutex_lock(&root->fs_info->fs_mutex);
1044
58176a96
JB
1045 *sub_root = btrfs_read_fs_root(root->fs_info, location,
1046 dentry->d_name.name,
1047 dentry->d_name.len);
39279cc3
CM
1048 if (IS_ERR(*sub_root))
1049 return PTR_ERR(*sub_root);
1050
1051 ri = &(*sub_root)->root_item;
1052 location->objectid = btrfs_root_dirid(ri);
39279cc3
CM
1053 btrfs_set_key_type(location, BTRFS_INODE_ITEM_KEY);
1054 location->offset = 0;
1055
1056 btrfs_free_path(path);
1057 mutex_unlock(&root->fs_info->fs_mutex);
1058 return 0;
1059}
1060
1061static int btrfs_init_locked_inode(struct inode *inode, void *p)
1062{
1063 struct btrfs_iget_args *args = p;
1064 inode->i_ino = args->ino;
1065 BTRFS_I(inode)->root = args->root;
b888db2b
CM
1066 extent_map_tree_init(&BTRFS_I(inode)->extent_tree,
1067 inode->i_mapping, GFP_NOFS);
39279cc3
CM
1068 return 0;
1069}
1070
1071static int btrfs_find_actor(struct inode *inode, void *opaque)
1072{
1073 struct btrfs_iget_args *args = opaque;
1074 return (args->ino == inode->i_ino &&
1075 args->root == BTRFS_I(inode)->root);
1076}
1077
1078struct inode *btrfs_iget_locked(struct super_block *s, u64 objectid,
1079 struct btrfs_root *root)
1080{
1081 struct inode *inode;
1082 struct btrfs_iget_args args;
1083 args.ino = objectid;
1084 args.root = root;
1085
1086 inode = iget5_locked(s, objectid, btrfs_find_actor,
1087 btrfs_init_locked_inode,
1088 (void *)&args);
1089 return inode;
1090}
1091
1092static struct dentry *btrfs_lookup(struct inode *dir, struct dentry *dentry,
1093 struct nameidata *nd)
1094{
1095 struct inode * inode;
1096 struct btrfs_inode *bi = BTRFS_I(dir);
1097 struct btrfs_root *root = bi->root;
1098 struct btrfs_root *sub_root = root;
1099 struct btrfs_key location;
1100 int ret;
1101
1102 if (dentry->d_name.len > BTRFS_NAME_LEN)
1103 return ERR_PTR(-ENAMETOOLONG);
5f39d397 1104
39279cc3
CM
1105 mutex_lock(&root->fs_info->fs_mutex);
1106 ret = btrfs_inode_by_name(dir, dentry, &location);
1107 mutex_unlock(&root->fs_info->fs_mutex);
5f39d397 1108
39279cc3
CM
1109 if (ret < 0)
1110 return ERR_PTR(ret);
5f39d397 1111
39279cc3
CM
1112 inode = NULL;
1113 if (location.objectid) {
58176a96
JB
1114 ret = fixup_tree_root_location(root, &location, &sub_root,
1115 dentry);
39279cc3
CM
1116 if (ret < 0)
1117 return ERR_PTR(ret);
1118 if (ret > 0)
1119 return ERR_PTR(-ENOENT);
1120 inode = btrfs_iget_locked(dir->i_sb, location.objectid,
1121 sub_root);
1122 if (!inode)
1123 return ERR_PTR(-EACCES);
1124 if (inode->i_state & I_NEW) {
1125 /* the inode and parent dir are two different roots */
1126 if (sub_root != root) {
1127 igrab(inode);
1128 sub_root->inode = inode;
1129 }
1130 BTRFS_I(inode)->root = sub_root;
1131 memcpy(&BTRFS_I(inode)->location, &location,
1132 sizeof(location));
1133 btrfs_read_locked_inode(inode);
1134 unlock_new_inode(inode);
1135 }
1136 }
1137 return d_splice_alias(inode, dentry);
1138}
1139
39279cc3
CM
1140static unsigned char btrfs_filetype_table[] = {
1141 DT_UNKNOWN, DT_REG, DT_DIR, DT_CHR, DT_BLK, DT_FIFO, DT_SOCK, DT_LNK
1142};
1143
1144static int btrfs_readdir(struct file *filp, void *dirent, filldir_t filldir)
1145{
6da6abae 1146 struct inode *inode = filp->f_dentry->d_inode;
39279cc3
CM
1147 struct btrfs_root *root = BTRFS_I(inode)->root;
1148 struct btrfs_item *item;
1149 struct btrfs_dir_item *di;
1150 struct btrfs_key key;
5f39d397 1151 struct btrfs_key found_key;
39279cc3
CM
1152 struct btrfs_path *path;
1153 int ret;
1154 u32 nritems;
5f39d397 1155 struct extent_buffer *leaf;
39279cc3
CM
1156 int slot;
1157 int advance;
1158 unsigned char d_type;
1159 int over = 0;
1160 u32 di_cur;
1161 u32 di_total;
1162 u32 di_len;
1163 int key_type = BTRFS_DIR_INDEX_KEY;
5f39d397
CM
1164 char tmp_name[32];
1165 char *name_ptr;
1166 int name_len;
39279cc3
CM
1167
1168 /* FIXME, use a real flag for deciding about the key type */
1169 if (root->fs_info->tree_root == root)
1170 key_type = BTRFS_DIR_ITEM_KEY;
5f39d397 1171
3954401f
CM
1172 /* special case for "." */
1173 if (filp->f_pos == 0) {
1174 over = filldir(dirent, ".", 1,
1175 1, inode->i_ino,
1176 DT_DIR);
1177 if (over)
1178 return 0;
1179 filp->f_pos = 1;
1180 }
1181
39279cc3
CM
1182 mutex_lock(&root->fs_info->fs_mutex);
1183 key.objectid = inode->i_ino;
3954401f
CM
1184 path = btrfs_alloc_path();
1185 path->reada = 2;
1186
1187 /* special case for .., just use the back ref */
1188 if (filp->f_pos == 1) {
1189 btrfs_set_key_type(&key, BTRFS_INODE_REF_KEY);
1190 key.offset = 0;
1191 ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
1192 BUG_ON(ret == 0);
1193 leaf = path->nodes[0];
1194 slot = path->slots[0];
1195 nritems = btrfs_header_nritems(leaf);
1196 if (slot >= nritems) {
1197 btrfs_release_path(root, path);
1198 goto read_dir_items;
1199 }
1200 btrfs_item_key_to_cpu(leaf, &found_key, slot);
1201 btrfs_release_path(root, path);
1202 if (found_key.objectid != key.objectid ||
1203 found_key.type != BTRFS_INODE_REF_KEY)
1204 goto read_dir_items;
1205 over = filldir(dirent, "..", 2,
1206 2, found_key.offset, DT_DIR);
1207 if (over)
1208 goto nopos;
1209 filp->f_pos = 2;
1210 }
1211
1212read_dir_items:
39279cc3
CM
1213 btrfs_set_key_type(&key, key_type);
1214 key.offset = filp->f_pos;
5f39d397 1215
39279cc3
CM
1216 ret = btrfs_search_slot(NULL, root, &key, path, 0, 0);
1217 if (ret < 0)
1218 goto err;
1219 advance = 0;
39279cc3 1220 while(1) {
5f39d397
CM
1221 leaf = path->nodes[0];
1222 nritems = btrfs_header_nritems(leaf);
39279cc3
CM
1223 slot = path->slots[0];
1224 if (advance || slot >= nritems) {
1225 if (slot >= nritems -1) {
39279cc3
CM
1226 ret = btrfs_next_leaf(root, path);
1227 if (ret)
1228 break;
5f39d397
CM
1229 leaf = path->nodes[0];
1230 nritems = btrfs_header_nritems(leaf);
39279cc3
CM
1231 slot = path->slots[0];
1232 } else {
1233 slot++;
1234 path->slots[0]++;
1235 }
1236 }
1237 advance = 1;
5f39d397
CM
1238 item = btrfs_item_nr(leaf, slot);
1239 btrfs_item_key_to_cpu(leaf, &found_key, slot);
1240
1241 if (found_key.objectid != key.objectid)
39279cc3 1242 break;
5f39d397 1243 if (btrfs_key_type(&found_key) != key_type)
39279cc3 1244 break;
5f39d397 1245 if (found_key.offset < filp->f_pos)
39279cc3 1246 continue;
5f39d397
CM
1247
1248 filp->f_pos = found_key.offset;
39279cc3
CM
1249 advance = 1;
1250 di = btrfs_item_ptr(leaf, slot, struct btrfs_dir_item);
1251 di_cur = 0;
5f39d397 1252 di_total = btrfs_item_size(leaf, item);
39279cc3 1253 while(di_cur < di_total) {
5f39d397
CM
1254 struct btrfs_key location;
1255
1256 name_len = btrfs_dir_name_len(leaf, di);
1257 if (name_len < 32) {
1258 name_ptr = tmp_name;
1259 } else {
1260 name_ptr = kmalloc(name_len, GFP_NOFS);
1261 BUG_ON(!name_ptr);
1262 }
1263 read_extent_buffer(leaf, name_ptr,
1264 (unsigned long)(di + 1), name_len);
1265
1266 d_type = btrfs_filetype_table[btrfs_dir_type(leaf, di)];
1267 btrfs_dir_item_key_to_cpu(leaf, di, &location);
1268
1269 over = filldir(dirent, name_ptr, name_len,
1270 found_key.offset,
1271 location.objectid,
39279cc3 1272 d_type);
5f39d397
CM
1273
1274 if (name_ptr != tmp_name)
1275 kfree(name_ptr);
1276
39279cc3
CM
1277 if (over)
1278 goto nopos;
5103e947
JB
1279 di_len = btrfs_dir_name_len(leaf, di) +
1280 btrfs_dir_data_len(leaf, di) +sizeof(*di);
39279cc3
CM
1281 di_cur += di_len;
1282 di = (struct btrfs_dir_item *)((char *)di + di_len);
1283 }
1284 }
1285 filp->f_pos++;
1286nopos:
1287 ret = 0;
1288err:
1289 btrfs_release_path(root, path);
1290 btrfs_free_path(path);
1291 mutex_unlock(&root->fs_info->fs_mutex);
1292 return ret;
1293}
1294
1295int btrfs_write_inode(struct inode *inode, int wait)
1296{
1297 struct btrfs_root *root = BTRFS_I(inode)->root;
1298 struct btrfs_trans_handle *trans;
1299 int ret = 0;
1300
1301 if (wait) {
1302 mutex_lock(&root->fs_info->fs_mutex);
1303 trans = btrfs_start_transaction(root, 1);
1304 btrfs_set_trans_block_group(trans, inode);
1305 ret = btrfs_commit_transaction(trans, root);
1306 mutex_unlock(&root->fs_info->fs_mutex);
1307 }
1308 return ret;
1309}
1310
1311/*
54aa1f4d 1312 * This is somewhat expensive, updating the tree every time the
39279cc3
CM
1313 * inode changes. But, it is most likely to find the inode in cache.
1314 * FIXME, needs more benchmarking...there are no reasons other than performance
1315 * to keep or drop this code.
1316 */
1317void btrfs_dirty_inode(struct inode *inode)
1318{
1319 struct btrfs_root *root = BTRFS_I(inode)->root;
1320 struct btrfs_trans_handle *trans;
1321
1322 mutex_lock(&root->fs_info->fs_mutex);
1323 trans = btrfs_start_transaction(root, 1);
1324 btrfs_set_trans_block_group(trans, inode);
1325 btrfs_update_inode(trans, root, inode);
1326 btrfs_end_transaction(trans, root);
1327 mutex_unlock(&root->fs_info->fs_mutex);
39279cc3
CM
1328}
1329
1330static struct inode *btrfs_new_inode(struct btrfs_trans_handle *trans,
1331 struct btrfs_root *root,
1332 u64 objectid,
1333 struct btrfs_block_group_cache *group,
1334 int mode)
1335{
1336 struct inode *inode;
5f39d397 1337 struct btrfs_inode_item *inode_item;
39279cc3 1338 struct btrfs_key *location;
5f39d397 1339 struct btrfs_path *path;
39279cc3
CM
1340 int ret;
1341 int owner;
1342
5f39d397
CM
1343 path = btrfs_alloc_path();
1344 BUG_ON(!path);
1345
39279cc3
CM
1346 inode = new_inode(root->fs_info->sb);
1347 if (!inode)
1348 return ERR_PTR(-ENOMEM);
1349
b888db2b
CM
1350 extent_map_tree_init(&BTRFS_I(inode)->extent_tree,
1351 inode->i_mapping, GFP_NOFS);
39279cc3 1352 BTRFS_I(inode)->root = root;
b888db2b 1353
39279cc3
CM
1354 if (mode & S_IFDIR)
1355 owner = 0;
1356 else
1357 owner = 1;
1358 group = btrfs_find_block_group(root, group, 0, 0, owner);
1359 BTRFS_I(inode)->block_group = group;
1360
5f39d397
CM
1361 ret = btrfs_insert_empty_inode(trans, root, path, objectid);
1362 if (ret)
1363 goto fail;
1364
39279cc3
CM
1365 inode->i_uid = current->fsuid;
1366 inode->i_gid = current->fsgid;
1367 inode->i_mode = mode;
1368 inode->i_ino = objectid;
1369 inode->i_blocks = 0;
1370 inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME;
5f39d397
CM
1371 inode_item = btrfs_item_ptr(path->nodes[0], path->slots[0],
1372 struct btrfs_inode_item);
1373 fill_inode_item(path->nodes[0], inode_item, inode);
1374 btrfs_mark_buffer_dirty(path->nodes[0]);
1375 btrfs_free_path(path);
1376
39279cc3
CM
1377 location = &BTRFS_I(inode)->location;
1378 location->objectid = objectid;
39279cc3
CM
1379 location->offset = 0;
1380 btrfs_set_key_type(location, BTRFS_INODE_ITEM_KEY);
1381
39279cc3
CM
1382 insert_inode_hash(inode);
1383 return inode;
5f39d397
CM
1384fail:
1385 btrfs_free_path(path);
1386 return ERR_PTR(ret);
39279cc3
CM
1387}
1388
1389static inline u8 btrfs_inode_type(struct inode *inode)
1390{
1391 return btrfs_type_by_mode[(inode->i_mode & S_IFMT) >> S_SHIFT];
1392}
1393
1394static int btrfs_add_link(struct btrfs_trans_handle *trans,
1395 struct dentry *dentry, struct inode *inode)
1396{
1397 int ret;
1398 struct btrfs_key key;
1399 struct btrfs_root *root = BTRFS_I(dentry->d_parent->d_inode)->root;
79c44584 1400 struct inode *parent_inode;
5f39d397 1401
39279cc3 1402 key.objectid = inode->i_ino;
39279cc3
CM
1403 btrfs_set_key_type(&key, BTRFS_INODE_ITEM_KEY);
1404 key.offset = 0;
1405
1406 ret = btrfs_insert_dir_item(trans, root,
1407 dentry->d_name.name, dentry->d_name.len,
1408 dentry->d_parent->d_inode->i_ino,
1409 &key, btrfs_inode_type(inode));
1410 if (ret == 0) {
76fea00a
CM
1411 ret = btrfs_insert_inode_ref(trans, root,
1412 dentry->d_name.name,
1413 dentry->d_name.len,
1414 inode->i_ino,
1415 dentry->d_parent->d_inode->i_ino);
79c44584
CM
1416 parent_inode = dentry->d_parent->d_inode;
1417 parent_inode->i_size += dentry->d_name.len * 2;
1418 parent_inode->i_mtime = parent_inode->i_ctime = CURRENT_TIME;
39279cc3
CM
1419 ret = btrfs_update_inode(trans, root,
1420 dentry->d_parent->d_inode);
1421 }
1422 return ret;
1423}
1424
1425static int btrfs_add_nondir(struct btrfs_trans_handle *trans,
1426 struct dentry *dentry, struct inode *inode)
1427{
1428 int err = btrfs_add_link(trans, dentry, inode);
1429 if (!err) {
1430 d_instantiate(dentry, inode);
1431 return 0;
1432 }
1433 if (err > 0)
1434 err = -EEXIST;
1435 return err;
1436}
1437
618e21d5
JB
1438static int btrfs_mknod(struct inode *dir, struct dentry *dentry,
1439 int mode, dev_t rdev)
1440{
1441 struct btrfs_trans_handle *trans;
1442 struct btrfs_root *root = BTRFS_I(dir)->root;
1443 struct inode *inode;
1444 int err;
1445 int drop_inode = 0;
1446 u64 objectid;
d3c2fdcf 1447 unsigned long nr;
618e21d5
JB
1448
1449 if (!new_valid_dev(rdev))
1450 return -EINVAL;
1451
1452 mutex_lock(&root->fs_info->fs_mutex);
1453 trans = btrfs_start_transaction(root, 1);
1454 btrfs_set_trans_block_group(trans, dir);
1455
1456 err = btrfs_find_free_objectid(trans, root, dir->i_ino, &objectid);
1457 if (err) {
1458 err = -ENOSPC;
1459 goto out_unlock;
1460 }
1461
1462 inode = btrfs_new_inode(trans, root, objectid,
1463 BTRFS_I(dir)->block_group, mode);
1464 err = PTR_ERR(inode);
1465 if (IS_ERR(inode))
1466 goto out_unlock;
1467
1468 btrfs_set_trans_block_group(trans, inode);
1469 err = btrfs_add_nondir(trans, dentry, inode);
1470 if (err)
1471 drop_inode = 1;
1472 else {
1473 inode->i_op = &btrfs_special_inode_operations;
1474 init_special_inode(inode, inode->i_mode, rdev);
1b4ab1bb 1475 btrfs_update_inode(trans, root, inode);
618e21d5
JB
1476 }
1477 dir->i_sb->s_dirt = 1;
1478 btrfs_update_inode_block_group(trans, inode);
1479 btrfs_update_inode_block_group(trans, dir);
1480out_unlock:
d3c2fdcf 1481 nr = trans->blocks_used;
618e21d5
JB
1482 btrfs_end_transaction(trans, root);
1483 mutex_unlock(&root->fs_info->fs_mutex);
1484
1485 if (drop_inode) {
1486 inode_dec_link_count(inode);
1487 iput(inode);
1488 }
d3c2fdcf 1489 btrfs_btree_balance_dirty(root, nr);
618e21d5
JB
1490 return err;
1491}
1492
39279cc3
CM
1493static int btrfs_create(struct inode *dir, struct dentry *dentry,
1494 int mode, struct nameidata *nd)
1495{
1496 struct btrfs_trans_handle *trans;
1497 struct btrfs_root *root = BTRFS_I(dir)->root;
1498 struct inode *inode;
1499 int err;
1500 int drop_inode = 0;
d3c2fdcf 1501 unsigned long nr;
39279cc3
CM
1502 u64 objectid;
1503
1504 mutex_lock(&root->fs_info->fs_mutex);
1505 trans = btrfs_start_transaction(root, 1);
1506 btrfs_set_trans_block_group(trans, dir);
1507
1508 err = btrfs_find_free_objectid(trans, root, dir->i_ino, &objectid);
1509 if (err) {
1510 err = -ENOSPC;
1511 goto out_unlock;
1512 }
1513
1514 inode = btrfs_new_inode(trans, root, objectid,
1515 BTRFS_I(dir)->block_group, mode);
1516 err = PTR_ERR(inode);
1517 if (IS_ERR(inode))
1518 goto out_unlock;
1519
1520 btrfs_set_trans_block_group(trans, inode);
1521 err = btrfs_add_nondir(trans, dentry, inode);
1522 if (err)
1523 drop_inode = 1;
1524 else {
1525 inode->i_mapping->a_ops = &btrfs_aops;
1526 inode->i_fop = &btrfs_file_operations;
1527 inode->i_op = &btrfs_file_inode_operations;
a52d9a80
CM
1528 extent_map_tree_init(&BTRFS_I(inode)->extent_tree,
1529 inode->i_mapping, GFP_NOFS);
07157aac 1530 BTRFS_I(inode)->extent_tree.ops = &btrfs_extent_map_ops;
39279cc3
CM
1531 }
1532 dir->i_sb->s_dirt = 1;
1533 btrfs_update_inode_block_group(trans, inode);
1534 btrfs_update_inode_block_group(trans, dir);
1535out_unlock:
d3c2fdcf 1536 nr = trans->blocks_used;
39279cc3
CM
1537 btrfs_end_transaction(trans, root);
1538 mutex_unlock(&root->fs_info->fs_mutex);
1539
1540 if (drop_inode) {
1541 inode_dec_link_count(inode);
1542 iput(inode);
1543 }
d3c2fdcf 1544 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
1545 return err;
1546}
1547
1548static int btrfs_link(struct dentry *old_dentry, struct inode *dir,
1549 struct dentry *dentry)
1550{
1551 struct btrfs_trans_handle *trans;
1552 struct btrfs_root *root = BTRFS_I(dir)->root;
1553 struct inode *inode = old_dentry->d_inode;
d3c2fdcf 1554 unsigned long nr;
39279cc3
CM
1555 int err;
1556 int drop_inode = 0;
1557
1558 if (inode->i_nlink == 0)
1559 return -ENOENT;
1560
6da6abae
CM
1561#if LINUX_VERSION_CODE <= KERNEL_VERSION(2,6,18)
1562 inode->i_nlink++;
1563#else
39279cc3 1564 inc_nlink(inode);
6da6abae 1565#endif
39279cc3
CM
1566 mutex_lock(&root->fs_info->fs_mutex);
1567 trans = btrfs_start_transaction(root, 1);
5f39d397 1568
39279cc3
CM
1569 btrfs_set_trans_block_group(trans, dir);
1570 atomic_inc(&inode->i_count);
1571 err = btrfs_add_nondir(trans, dentry, inode);
5f39d397 1572
39279cc3
CM
1573 if (err)
1574 drop_inode = 1;
5f39d397 1575
39279cc3
CM
1576 dir->i_sb->s_dirt = 1;
1577 btrfs_update_inode_block_group(trans, dir);
54aa1f4d 1578 err = btrfs_update_inode(trans, root, inode);
5f39d397 1579
54aa1f4d
CM
1580 if (err)
1581 drop_inode = 1;
39279cc3 1582
d3c2fdcf 1583 nr = trans->blocks_used;
39279cc3
CM
1584 btrfs_end_transaction(trans, root);
1585 mutex_unlock(&root->fs_info->fs_mutex);
1586
1587 if (drop_inode) {
1588 inode_dec_link_count(inode);
1589 iput(inode);
1590 }
d3c2fdcf 1591 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
1592 return err;
1593}
1594
39279cc3
CM
1595static int btrfs_mkdir(struct inode *dir, struct dentry *dentry, int mode)
1596{
1597 struct inode *inode;
1598 struct btrfs_trans_handle *trans;
1599 struct btrfs_root *root = BTRFS_I(dir)->root;
1600 int err = 0;
1601 int drop_on_err = 0;
1602 u64 objectid;
d3c2fdcf 1603 unsigned long nr = 1;
39279cc3
CM
1604
1605 mutex_lock(&root->fs_info->fs_mutex);
1606 trans = btrfs_start_transaction(root, 1);
1607 btrfs_set_trans_block_group(trans, dir);
5f39d397 1608
39279cc3
CM
1609 if (IS_ERR(trans)) {
1610 err = PTR_ERR(trans);
1611 goto out_unlock;
1612 }
1613
1614 err = btrfs_find_free_objectid(trans, root, dir->i_ino, &objectid);
1615 if (err) {
1616 err = -ENOSPC;
1617 goto out_unlock;
1618 }
1619
1620 inode = btrfs_new_inode(trans, root, objectid,
1621 BTRFS_I(dir)->block_group, S_IFDIR | mode);
1622 if (IS_ERR(inode)) {
1623 err = PTR_ERR(inode);
1624 goto out_fail;
1625 }
5f39d397 1626
39279cc3
CM
1627 drop_on_err = 1;
1628 inode->i_op = &btrfs_dir_inode_operations;
1629 inode->i_fop = &btrfs_dir_file_operations;
1630 btrfs_set_trans_block_group(trans, inode);
1631
3954401f 1632 inode->i_size = 0;
39279cc3
CM
1633 err = btrfs_update_inode(trans, root, inode);
1634 if (err)
1635 goto out_fail;
5f39d397 1636
39279cc3
CM
1637 err = btrfs_add_link(trans, dentry, inode);
1638 if (err)
1639 goto out_fail;
5f39d397 1640
39279cc3
CM
1641 d_instantiate(dentry, inode);
1642 drop_on_err = 0;
1643 dir->i_sb->s_dirt = 1;
1644 btrfs_update_inode_block_group(trans, inode);
1645 btrfs_update_inode_block_group(trans, dir);
1646
1647out_fail:
d3c2fdcf 1648 nr = trans->blocks_used;
39279cc3 1649 btrfs_end_transaction(trans, root);
5f39d397 1650
39279cc3
CM
1651out_unlock:
1652 mutex_unlock(&root->fs_info->fs_mutex);
1653 if (drop_on_err)
1654 iput(inode);
d3c2fdcf 1655 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
1656 return err;
1657}
1658
a52d9a80
CM
1659struct extent_map *btrfs_get_extent(struct inode *inode, struct page *page,
1660 size_t page_offset, u64 start, u64 end,
1661 int create)
1662{
1663 int ret;
1664 int err = 0;
db94535d 1665 u64 bytenr;
a52d9a80
CM
1666 u64 extent_start = 0;
1667 u64 extent_end = 0;
1668 u64 objectid = inode->i_ino;
1669 u32 found_type;
1670 int failed_insert = 0;
1671 struct btrfs_path *path;
1672 struct btrfs_root *root = BTRFS_I(inode)->root;
1673 struct btrfs_file_extent_item *item;
5f39d397
CM
1674 struct extent_buffer *leaf;
1675 struct btrfs_key found_key;
a52d9a80
CM
1676 struct extent_map *em = NULL;
1677 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
1678 struct btrfs_trans_handle *trans = NULL;
1679
1680 path = btrfs_alloc_path();
1681 BUG_ON(!path);
1682 mutex_lock(&root->fs_info->fs_mutex);
1683
1684again:
1685 em = lookup_extent_mapping(em_tree, start, end);
1686 if (em) {
1687 goto out;
1688 }
1689 if (!em) {
1690 em = alloc_extent_map(GFP_NOFS);
1691 if (!em) {
1692 err = -ENOMEM;
1693 goto out;
1694 }
5f39d397
CM
1695 em->start = EXTENT_MAP_HOLE;
1696 em->end = EXTENT_MAP_HOLE;
a52d9a80
CM
1697 }
1698 em->bdev = inode->i_sb->s_bdev;
179e29e4
CM
1699 ret = btrfs_lookup_file_extent(trans, root, path,
1700 objectid, start, trans != NULL);
a52d9a80
CM
1701 if (ret < 0) {
1702 err = ret;
1703 goto out;
1704 }
1705
1706 if (ret != 0) {
1707 if (path->slots[0] == 0)
1708 goto not_found;
1709 path->slots[0]--;
1710 }
1711
5f39d397
CM
1712 leaf = path->nodes[0];
1713 item = btrfs_item_ptr(leaf, path->slots[0],
a52d9a80 1714 struct btrfs_file_extent_item);
a52d9a80 1715 /* are we inside the extent that was found? */
5f39d397
CM
1716 btrfs_item_key_to_cpu(leaf, &found_key, path->slots[0]);
1717 found_type = btrfs_key_type(&found_key);
1718 if (found_key.objectid != objectid ||
a52d9a80
CM
1719 found_type != BTRFS_EXTENT_DATA_KEY) {
1720 goto not_found;
1721 }
1722
5f39d397
CM
1723 found_type = btrfs_file_extent_type(leaf, item);
1724 extent_start = found_key.offset;
a52d9a80
CM
1725 if (found_type == BTRFS_FILE_EXTENT_REG) {
1726 extent_end = extent_start +
db94535d 1727 btrfs_file_extent_num_bytes(leaf, item);
a52d9a80 1728 err = 0;
b888db2b 1729 if (start < extent_start || start >= extent_end) {
a52d9a80
CM
1730 em->start = start;
1731 if (start < extent_start) {
b888db2b
CM
1732 if (end < extent_start)
1733 goto not_found;
a52d9a80
CM
1734 em->end = extent_end - 1;
1735 } else {
1736 em->end = end;
1737 }
1738 goto not_found_em;
1739 }
db94535d
CM
1740 bytenr = btrfs_file_extent_disk_bytenr(leaf, item);
1741 if (bytenr == 0) {
a52d9a80
CM
1742 em->start = extent_start;
1743 em->end = extent_end - 1;
5f39d397
CM
1744 em->block_start = EXTENT_MAP_HOLE;
1745 em->block_end = EXTENT_MAP_HOLE;
a52d9a80
CM
1746 goto insert;
1747 }
db94535d
CM
1748 bytenr += btrfs_file_extent_offset(leaf, item);
1749 em->block_start = bytenr;
a52d9a80 1750 em->block_end = em->block_start +
db94535d 1751 btrfs_file_extent_num_bytes(leaf, item) - 1;
a52d9a80
CM
1752 em->start = extent_start;
1753 em->end = extent_end - 1;
1754 goto insert;
1755 } else if (found_type == BTRFS_FILE_EXTENT_INLINE) {
5f39d397 1756 unsigned long ptr;
a52d9a80 1757 char *map;
3326d1b0
CM
1758 size_t size;
1759 size_t extent_offset;
1760 size_t copy_size;
a52d9a80 1761
5f39d397
CM
1762 size = btrfs_file_extent_inline_len(leaf, btrfs_item_nr(leaf,
1763 path->slots[0]));
689f9346 1764 extent_end = (extent_start + size - 1) |
db94535d 1765 ((u64)root->sectorsize - 1);
b888db2b 1766 if (start < extent_start || start >= extent_end) {
a52d9a80
CM
1767 em->start = start;
1768 if (start < extent_start) {
b888db2b
CM
1769 if (end < extent_start)
1770 goto not_found;
50b78c24 1771 em->end = extent_end;
a52d9a80
CM
1772 } else {
1773 em->end = end;
1774 }
1775 goto not_found_em;
1776 }
689f9346
Y
1777 em->block_start = EXTENT_MAP_INLINE;
1778 em->block_end = EXTENT_MAP_INLINE;
1779
1780 if (!page) {
1781 em->start = extent_start;
1782 em->end = extent_start + size - 1;
1783 goto out;
1784 }
5f39d397 1785
35ebb934 1786 extent_offset = ((u64)page->index << PAGE_CACHE_SHIFT) -
689f9346 1787 extent_start + page_offset;
ae2f5411 1788 copy_size = min_t(u64, PAGE_CACHE_SIZE - page_offset,
3326d1b0 1789 size - extent_offset);
3326d1b0
CM
1790 em->start = extent_start + extent_offset;
1791 em->end = (em->start + copy_size -1) |
1792 ((u64)root->sectorsize -1);
689f9346
Y
1793 map = kmap(page);
1794 ptr = btrfs_file_extent_inline_start(item) + extent_offset;
179e29e4
CM
1795 if (create == 0 && !PageUptodate(page)) {
1796 read_extent_buffer(leaf, map + page_offset, ptr,
1797 copy_size);
1798 flush_dcache_page(page);
1799 } else if (create && PageUptodate(page)) {
1800 if (!trans) {
1801 kunmap(page);
1802 free_extent_map(em);
1803 em = NULL;
1804 btrfs_release_path(root, path);
1805 trans = btrfs_start_transaction(root, 1);
1806 goto again;
1807 }
1808 write_extent_buffer(leaf, map + page_offset, ptr,
1809 copy_size);
1810 btrfs_mark_buffer_dirty(leaf);
a52d9a80 1811 }
a52d9a80 1812 kunmap(page);
3326d1b0 1813 set_extent_uptodate(em_tree, em->start, em->end, GFP_NOFS);
a52d9a80
CM
1814 goto insert;
1815 } else {
1816 printk("unkknown found_type %d\n", found_type);
1817 WARN_ON(1);
1818 }
1819not_found:
1820 em->start = start;
1821 em->end = end;
1822not_found_em:
5f39d397
CM
1823 em->block_start = EXTENT_MAP_HOLE;
1824 em->block_end = EXTENT_MAP_HOLE;
a52d9a80
CM
1825insert:
1826 btrfs_release_path(root, path);
1827 if (em->start > start || em->end < start) {
b888db2b 1828 printk("bad extent! em: [%Lu %Lu] passed [%Lu %Lu]\n", em->start, em->end, start, end);
a52d9a80
CM
1829 err = -EIO;
1830 goto out;
1831 }
1832 ret = add_extent_mapping(em_tree, em);
1833 if (ret == -EEXIST) {
1834 free_extent_map(em);
2bf5a725 1835 em = NULL;
6da6abae
CM
1836 if (0 && failed_insert == 1) {
1837 btrfs_drop_extent_cache(inode, start, end);
1838 }
a52d9a80
CM
1839 failed_insert++;
1840 if (failed_insert > 5) {
1841 printk("failing to insert %Lu %Lu\n", start, end);
1842 err = -EIO;
1843 goto out;
1844 }
a52d9a80
CM
1845 goto again;
1846 }
1847 err = 0;
1848out:
1849 btrfs_free_path(path);
1850 if (trans) {
1851 ret = btrfs_end_transaction(trans, root);
1852 if (!err)
1853 err = ret;
1854 }
1855 mutex_unlock(&root->fs_info->fs_mutex);
1856 if (err) {
1857 free_extent_map(em);
1858 WARN_ON(1);
1859 return ERR_PTR(err);
1860 }
1861 return em;
1862}
1863
d396c6f5 1864static sector_t btrfs_bmap(struct address_space *mapping, sector_t iblock)
39279cc3 1865{
d396c6f5 1866 return extent_bmap(mapping, iblock, btrfs_get_extent);
39279cc3
CM
1867}
1868
1869static int btrfs_prepare_write(struct file *file, struct page *page,
1870 unsigned from, unsigned to)
1871{
a52d9a80
CM
1872 return extent_prepare_write(&BTRFS_I(page->mapping->host)->extent_tree,
1873 page->mapping->host, page, from, to,
1874 btrfs_get_extent);
39279cc3
CM
1875}
1876
a52d9a80 1877int btrfs_readpage(struct file *file, struct page *page)
9ebefb18 1878{
a52d9a80
CM
1879 struct extent_map_tree *tree;
1880 tree = &BTRFS_I(page->mapping->host)->extent_tree;
1881 return extent_read_full_page(tree, page, btrfs_get_extent);
9ebefb18 1882}
a52d9a80 1883static int btrfs_writepage(struct page *page, struct writeback_control *wbc)
39279cc3 1884{
a52d9a80 1885 struct extent_map_tree *tree;
b888db2b
CM
1886
1887
1888 if (current->flags & PF_MEMALLOC) {
1889 redirty_page_for_writepage(wbc, page);
1890 unlock_page(page);
1891 return 0;
1892 }
a52d9a80
CM
1893 tree = &BTRFS_I(page->mapping->host)->extent_tree;
1894 return extent_write_full_page(tree, page, btrfs_get_extent, wbc);
9ebefb18
CM
1895}
1896
b293f02e
CM
1897static int btrfs_writepages(struct address_space *mapping,
1898 struct writeback_control *wbc)
1899{
1900 struct extent_map_tree *tree;
1901 tree = &BTRFS_I(mapping->host)->extent_tree;
1902 return extent_writepages(tree, mapping, btrfs_get_extent, wbc);
1903}
1904
3ab2fb5a
CM
1905static int
1906btrfs_readpages(struct file *file, struct address_space *mapping,
1907 struct list_head *pages, unsigned nr_pages)
1908{
1909 struct extent_map_tree *tree;
1910 tree = &BTRFS_I(mapping->host)->extent_tree;
1911 return extent_readpages(tree, mapping, pages, nr_pages,
1912 btrfs_get_extent);
1913}
1914
a52d9a80 1915static int btrfs_releasepage(struct page *page, gfp_t unused_gfp_flags)
9ebefb18 1916{
a52d9a80
CM
1917 struct extent_map_tree *tree;
1918 int ret;
8c2383c3 1919
a52d9a80
CM
1920 tree = &BTRFS_I(page->mapping->host)->extent_tree;
1921 ret = try_release_extent_mapping(tree, page);
1922 if (ret == 1) {
1923 ClearPagePrivate(page);
1924 set_page_private(page, 0);
1925 page_cache_release(page);
39279cc3 1926 }
a52d9a80 1927 return ret;
39279cc3
CM
1928}
1929
a52d9a80 1930static void btrfs_invalidatepage(struct page *page, unsigned long offset)
39279cc3 1931{
a52d9a80 1932 struct extent_map_tree *tree;
39279cc3 1933
a52d9a80
CM
1934 tree = &BTRFS_I(page->mapping->host)->extent_tree;
1935 extent_invalidatepage(tree, page, offset);
1936 btrfs_releasepage(page, GFP_NOFS);
39279cc3
CM
1937}
1938
9ebefb18
CM
1939/*
1940 * btrfs_page_mkwrite() is not allowed to change the file size as it gets
1941 * called from a page fault handler when a page is first dirtied. Hence we must
1942 * be careful to check for EOF conditions here. We set the page up correctly
1943 * for a written page which means we get ENOSPC checking when writing into
1944 * holes and correct delalloc and unwritten extent mapping on filesystems that
1945 * support these features.
1946 *
1947 * We are not allowed to take the i_mutex here so we have to play games to
1948 * protect against truncate races as the page could now be beyond EOF. Because
1949 * vmtruncate() writes the inode size before removing pages, once we have the
1950 * page lock we can determine safely if the page is beyond EOF. If it is not
1951 * beyond EOF, then the page is guaranteed safe against truncation until we
1952 * unlock the page.
1953 */
1954int btrfs_page_mkwrite(struct vm_area_struct *vma, struct page *page)
1955{
6da6abae 1956 struct inode *inode = fdentry(vma->vm_file)->d_inode;
9ebefb18
CM
1957 unsigned long end;
1958 loff_t size;
1959 int ret = -EINVAL;
a52d9a80 1960 u64 page_start;
9ebefb18 1961
011410bd 1962 down_read(&BTRFS_I(inode)->root->snap_sem);
9ebefb18
CM
1963 lock_page(page);
1964 wait_on_page_writeback(page);
9ebefb18 1965 size = i_size_read(inode);
35ebb934 1966 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
a52d9a80 1967
9ebefb18 1968 if ((page->mapping != inode->i_mapping) ||
a52d9a80 1969 (page_start > size)) {
9ebefb18
CM
1970 /* page got truncated out from underneath us */
1971 goto out_unlock;
1972 }
1973
1974 /* page is wholly or partially inside EOF */
a52d9a80 1975 if (page_start + PAGE_CACHE_SIZE > size)
9ebefb18
CM
1976 end = size & ~PAGE_CACHE_MASK;
1977 else
1978 end = PAGE_CACHE_SIZE;
1979
b888db2b 1980 ret = btrfs_cow_one_page(inode, page, end);
9ebefb18
CM
1981
1982out_unlock:
011410bd 1983 up_read(&BTRFS_I(inode)->root->snap_sem);
9ebefb18
CM
1984 unlock_page(page);
1985 return ret;
1986}
1987
39279cc3
CM
1988static void btrfs_truncate(struct inode *inode)
1989{
1990 struct btrfs_root *root = BTRFS_I(inode)->root;
1991 int ret;
1992 struct btrfs_trans_handle *trans;
d3c2fdcf 1993 unsigned long nr;
39279cc3
CM
1994
1995 if (!S_ISREG(inode->i_mode))
1996 return;
1997 if (IS_APPEND(inode) || IS_IMMUTABLE(inode))
1998 return;
1999
2000 btrfs_truncate_page(inode->i_mapping, inode->i_size);
2001
2002 mutex_lock(&root->fs_info->fs_mutex);
2003 trans = btrfs_start_transaction(root, 1);
2004 btrfs_set_trans_block_group(trans, inode);
2005
2006 /* FIXME, add redo link to tree so we don't leak on crash */
2007 ret = btrfs_truncate_in_trans(trans, root, inode);
39279cc3 2008 btrfs_update_inode(trans, root, inode);
d3c2fdcf 2009 nr = trans->blocks_used;
5f39d397 2010
39279cc3
CM
2011 ret = btrfs_end_transaction(trans, root);
2012 BUG_ON(ret);
2013 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 2014 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
2015}
2016
2017int btrfs_commit_write(struct file *file, struct page *page,
2018 unsigned from, unsigned to)
2019{
e9906a98
CM
2020 loff_t pos = ((loff_t)page->index << PAGE_CACHE_SHIFT) + to;
2021 struct inode *inode = page->mapping->host;
2022
2023 btrfs_cow_one_page(inode, page, PAGE_CACHE_SIZE);
2024
e9906a98
CM
2025 if (pos > inode->i_size) {
2026 i_size_write(inode, pos);
2027 mark_inode_dirty(inode);
2028 }
2029 return 0;
39279cc3
CM
2030}
2031
2032static int create_subvol(struct btrfs_root *root, char *name, int namelen)
2033{
2034 struct btrfs_trans_handle *trans;
2035 struct btrfs_key key;
2036 struct btrfs_root_item root_item;
2037 struct btrfs_inode_item *inode_item;
5f39d397 2038 struct extent_buffer *leaf;
39279cc3
CM
2039 struct btrfs_root *new_root;
2040 struct inode *inode;
2041 struct inode *dir;
2042 int ret;
54aa1f4d 2043 int err;
39279cc3
CM
2044 u64 objectid;
2045 u64 new_dirid = BTRFS_FIRST_FREE_OBJECTID;
d3c2fdcf 2046 unsigned long nr = 1;
39279cc3
CM
2047
2048 mutex_lock(&root->fs_info->fs_mutex);
2049 trans = btrfs_start_transaction(root, 1);
2050 BUG_ON(!trans);
2051
7bb86316
CM
2052 ret = btrfs_find_free_objectid(trans, root->fs_info->tree_root,
2053 0, &objectid);
2054 if (ret)
2055 goto fail;
2056
2057 leaf = __btrfs_alloc_free_block(trans, root, root->leafsize,
2058 objectid, trans->transid, 0, 0,
2059 0, 0);
5f39d397
CM
2060 if (IS_ERR(leaf))
2061 return PTR_ERR(leaf);
2062
2063 btrfs_set_header_nritems(leaf, 0);
2064 btrfs_set_header_level(leaf, 0);
db94535d 2065 btrfs_set_header_bytenr(leaf, leaf->start);
5f39d397 2066 btrfs_set_header_generation(leaf, trans->transid);
7bb86316
CM
2067 btrfs_set_header_owner(leaf, objectid);
2068
5f39d397
CM
2069 write_extent_buffer(leaf, root->fs_info->fsid,
2070 (unsigned long)btrfs_header_fsid(leaf),
2071 BTRFS_FSID_SIZE);
2072 btrfs_mark_buffer_dirty(leaf);
39279cc3
CM
2073
2074 inode_item = &root_item.inode;
2075 memset(inode_item, 0, sizeof(*inode_item));
5f39d397
CM
2076 inode_item->generation = cpu_to_le64(1);
2077 inode_item->size = cpu_to_le64(3);
2078 inode_item->nlink = cpu_to_le32(1);
2079 inode_item->nblocks = cpu_to_le64(1);
2080 inode_item->mode = cpu_to_le32(S_IFDIR | 0755);
39279cc3 2081
db94535d
CM
2082 btrfs_set_root_bytenr(&root_item, leaf->start);
2083 btrfs_set_root_level(&root_item, 0);
39279cc3 2084 btrfs_set_root_refs(&root_item, 1);
5f39d397
CM
2085 btrfs_set_root_used(&root_item, 0);
2086
5eda7b5e
CM
2087 memset(&root_item.drop_progress, 0, sizeof(root_item.drop_progress));
2088 root_item.drop_level = 0;
5f39d397
CM
2089
2090 free_extent_buffer(leaf);
2091 leaf = NULL;
39279cc3 2092
39279cc3
CM
2093 btrfs_set_root_dirid(&root_item, new_dirid);
2094
2095 key.objectid = objectid;
2096 key.offset = 1;
39279cc3
CM
2097 btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY);
2098 ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key,
2099 &root_item);
54aa1f4d
CM
2100 if (ret)
2101 goto fail;
39279cc3
CM
2102
2103 /*
2104 * insert the directory item
2105 */
2106 key.offset = (u64)-1;
2107 dir = root->fs_info->sb->s_root->d_inode;
2108 ret = btrfs_insert_dir_item(trans, root->fs_info->tree_root,
2109 name, namelen, dir->i_ino, &key,
2110 BTRFS_FT_DIR);
54aa1f4d
CM
2111 if (ret)
2112 goto fail;
39279cc3 2113
3954401f
CM
2114 ret = btrfs_insert_inode_ref(trans, root->fs_info->tree_root,
2115 name, namelen, objectid,
2116 root->fs_info->sb->s_root->d_inode->i_ino);
2117 if (ret)
2118 goto fail;
2119
39279cc3 2120 ret = btrfs_commit_transaction(trans, root);
54aa1f4d
CM
2121 if (ret)
2122 goto fail_commit;
39279cc3 2123
58176a96 2124 new_root = btrfs_read_fs_root(root->fs_info, &key, name, namelen);
39279cc3
CM
2125 BUG_ON(!new_root);
2126
2127 trans = btrfs_start_transaction(new_root, 1);
2128 BUG_ON(!trans);
2129
2130 inode = btrfs_new_inode(trans, new_root, new_dirid,
2131 BTRFS_I(dir)->block_group, S_IFDIR | 0700);
54aa1f4d
CM
2132 if (IS_ERR(inode))
2133 goto fail;
39279cc3
CM
2134 inode->i_op = &btrfs_dir_inode_operations;
2135 inode->i_fop = &btrfs_dir_file_operations;
34088780 2136 new_root->inode = inode;
39279cc3 2137
3954401f
CM
2138 ret = btrfs_insert_inode_ref(trans, new_root, "..", 2, new_dirid,
2139 new_dirid);
39279cc3 2140 inode->i_nlink = 1;
3954401f 2141 inode->i_size = 0;
39279cc3 2142 ret = btrfs_update_inode(trans, new_root, inode);
54aa1f4d
CM
2143 if (ret)
2144 goto fail;
2145fail:
d3c2fdcf 2146 nr = trans->blocks_used;
54aa1f4d
CM
2147 err = btrfs_commit_transaction(trans, root);
2148 if (err && !ret)
2149 ret = err;
2150fail_commit:
39279cc3 2151 mutex_unlock(&root->fs_info->fs_mutex);
d3c2fdcf 2152 btrfs_btree_balance_dirty(root, nr);
54aa1f4d 2153 return ret;
39279cc3
CM
2154}
2155
2156static int create_snapshot(struct btrfs_root *root, char *name, int namelen)
2157{
2158 struct btrfs_trans_handle *trans;
2159 struct btrfs_key key;
2160 struct btrfs_root_item new_root_item;
5f39d397 2161 struct extent_buffer *tmp;
39279cc3 2162 int ret;
54aa1f4d 2163 int err;
39279cc3 2164 u64 objectid;
d3c2fdcf 2165 unsigned long nr;
39279cc3
CM
2166
2167 if (!root->ref_cows)
2168 return -EINVAL;
2169
011410bd
CM
2170 down_write(&root->snap_sem);
2171 freeze_bdev(root->fs_info->sb->s_bdev);
2172 thaw_bdev(root->fs_info->sb->s_bdev, root->fs_info->sb);
2173
39279cc3
CM
2174 mutex_lock(&root->fs_info->fs_mutex);
2175 trans = btrfs_start_transaction(root, 1);
2176 BUG_ON(!trans);
2177
2178 ret = btrfs_update_inode(trans, root, root->inode);
54aa1f4d
CM
2179 if (ret)
2180 goto fail;
39279cc3
CM
2181
2182 ret = btrfs_find_free_objectid(trans, root->fs_info->tree_root,
2183 0, &objectid);
54aa1f4d
CM
2184 if (ret)
2185 goto fail;
39279cc3
CM
2186
2187 memcpy(&new_root_item, &root->root_item,
2188 sizeof(new_root_item));
2189
2190 key.objectid = objectid;
2191 key.offset = 1;
39279cc3 2192 btrfs_set_key_type(&key, BTRFS_ROOT_ITEM_KEY);
be20aa9d 2193
9691975d 2194 extent_buffer_get(root->node);
83df7c1d 2195 btrfs_cow_block(trans, root, root->node, NULL, 0, &tmp);
9691975d 2196 free_extent_buffer(tmp);
be20aa9d
CM
2197
2198 btrfs_copy_root(trans, root, root->node, &tmp, objectid);
2199
2200 btrfs_set_root_bytenr(&new_root_item, tmp->start);
2201 btrfs_set_root_level(&new_root_item, btrfs_header_level(tmp));
39279cc3
CM
2202 ret = btrfs_insert_root(trans, root->fs_info->tree_root, &key,
2203 &new_root_item);
be20aa9d 2204 free_extent_buffer(tmp);
54aa1f4d
CM
2205 if (ret)
2206 goto fail;
39279cc3
CM
2207
2208 /*
2209 * insert the directory item
2210 */
2211 key.offset = (u64)-1;
2212 ret = btrfs_insert_dir_item(trans, root->fs_info->tree_root,
2213 name, namelen,
2214 root->fs_info->sb->s_root->d_inode->i_ino,
2215 &key, BTRFS_FT_DIR);
2216
54aa1f4d
CM
2217 if (ret)
2218 goto fail;
39279cc3 2219
3954401f
CM
2220 ret = btrfs_insert_inode_ref(trans, root->fs_info->tree_root,
2221 name, namelen, objectid,
2222 root->fs_info->sb->s_root->d_inode->i_ino);
2223
2224 if (ret)
2225 goto fail;
54aa1f4d 2226fail:
d3c2fdcf 2227 nr = trans->blocks_used;
54aa1f4d 2228 err = btrfs_commit_transaction(trans, root);
5f39d397 2229
54aa1f4d
CM
2230 if (err && !ret)
2231 ret = err;
5f39d397 2232
39279cc3 2233 mutex_unlock(&root->fs_info->fs_mutex);
011410bd 2234 up_write(&root->snap_sem);
d3c2fdcf 2235 btrfs_btree_balance_dirty(root, nr);
54aa1f4d 2236 return ret;
39279cc3
CM
2237}
2238
86479a04
CM
2239static unsigned long force_ra(struct address_space *mapping,
2240 struct file_ra_state *ra, struct file *file,
2241 pgoff_t offset, pgoff_t last_index)
2242{
2243 pgoff_t req_size;
2244
2245#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,23)
2246 req_size = last_index - offset + 1;
2247 offset = page_cache_readahead(mapping, ra, file, offset, req_size);
2248 return offset;
2249#else
2250 req_size = min(last_index - offset + 1, (pgoff_t)128);
2251 page_cache_sync_readahead(mapping, ra, file, offset, req_size);
2252 return offset + req_size;
2253#endif
2254}
2255
2256int btrfs_defrag_file(struct file *file) {
6da6abae 2257 struct inode *inode = fdentry(file)->d_inode;
86479a04
CM
2258 struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
2259 struct page *page;
2260 unsigned long last_index;
2261 unsigned long ra_index = 0;
2262 u64 page_start;
2263 u64 page_end;
2264 unsigned long i;
2265
2266 mutex_lock(&inode->i_mutex);
2267 last_index = inode->i_size >> PAGE_CACHE_SHIFT;
2268 for (i = 0; i <= last_index; i++) {
2269 if (i == ra_index) {
2270 ra_index = force_ra(inode->i_mapping, &file->f_ra,
2271 file, ra_index, last_index);
2272 }
2273 page = grab_cache_page(inode->i_mapping, i);
2274 if (!page)
2275 goto out_unlock;
2276 if (!PageUptodate(page)) {
2277 btrfs_readpage(NULL, page);
2278 lock_page(page);
2279 if (!PageUptodate(page)) {
2280 unlock_page(page);
2281 page_cache_release(page);
2282 goto out_unlock;
2283 }
2284 }
35ebb934 2285 page_start = (u64)page->index << PAGE_CACHE_SHIFT;
86479a04
CM
2286 page_end = page_start + PAGE_CACHE_SIZE - 1;
2287
2288 lock_extent(em_tree, page_start, page_end, GFP_NOFS);
2289 set_extent_delalloc(em_tree, page_start,
2290 page_end, GFP_NOFS);
2291 unlock_extent(em_tree, page_start, page_end, GFP_NOFS);
2292 set_page_dirty(page);
2293 unlock_page(page);
2294 page_cache_release(page);
2295 balance_dirty_pages_ratelimited_nr(inode->i_mapping, 1);
2296 }
2297
2298out_unlock:
2299 mutex_unlock(&inode->i_mutex);
2300 return 0;
2301}
2302
d03581f4 2303static int btrfs_ioctl_snap_create(struct btrfs_root *root, void __user *arg)
39279cc3 2304{
4aec2b52 2305 struct btrfs_ioctl_vol_args *vol_args;
39279cc3 2306 struct btrfs_dir_item *di;
39279cc3
CM
2307 struct btrfs_path *path;
2308 u64 root_dirid;
4aec2b52
CM
2309 int namelen;
2310 int ret;
39279cc3 2311
4aec2b52 2312 vol_args = kmalloc(sizeof(*vol_args), GFP_NOFS);
5f39d397 2313
4aec2b52
CM
2314 if (!vol_args)
2315 return -ENOMEM;
2316
2317 if (copy_from_user(vol_args, arg, sizeof(*vol_args))) {
2318 ret = -EFAULT;
2319 goto out;
2320 }
2321
2322 namelen = strlen(vol_args->name);
2323 if (namelen > BTRFS_VOL_NAME_MAX) {
2324 ret = -EINVAL;
2325 goto out;
2326 }
2327 if (strchr(vol_args->name, '/')) {
2328 ret = -EINVAL;
2329 goto out;
2330 }
d03581f4
CH
2331
2332 path = btrfs_alloc_path();
4aec2b52
CM
2333 if (!path) {
2334 ret = -ENOMEM;
2335 goto out;
2336 }
d03581f4
CH
2337
2338 root_dirid = root->fs_info->sb->s_root->d_inode->i_ino,
2339 mutex_lock(&root->fs_info->fs_mutex);
2340 di = btrfs_lookup_dir_item(NULL, root->fs_info->tree_root,
2341 path, root_dirid,
4aec2b52 2342 vol_args->name, namelen, 0);
d03581f4
CH
2343 mutex_unlock(&root->fs_info->fs_mutex);
2344 btrfs_free_path(path);
4aec2b52
CM
2345
2346 if (di && !IS_ERR(di)) {
2347 ret = -EEXIST;
2348 goto out;
2349 }
2350
2351 if (IS_ERR(di)) {
2352 ret = PTR_ERR(di);
2353 goto out;
2354 }
d03581f4
CH
2355
2356 if (root == root->fs_info->tree_root)
4aec2b52
CM
2357 ret = create_subvol(root, vol_args->name, namelen);
2358 else
2359 ret = create_snapshot(root, vol_args->name, namelen);
2360out:
2361 kfree(vol_args);
2362 return ret;
d03581f4
CH
2363}
2364
2365static int btrfs_ioctl_defrag(struct file *file)
2366{
6da6abae 2367 struct inode *inode = fdentry(file)->d_inode;
d03581f4
CH
2368 struct btrfs_root *root = BTRFS_I(inode)->root;
2369
2370 switch (inode->i_mode & S_IFMT) {
2371 case S_IFDIR:
39279cc3 2372 mutex_lock(&root->fs_info->fs_mutex);
d03581f4
CH
2373 btrfs_defrag_root(root, 0);
2374 btrfs_defrag_root(root->fs_info->extent_root, 0);
39279cc3 2375 mutex_unlock(&root->fs_info->fs_mutex);
39279cc3 2376 break;
d03581f4
CH
2377 case S_IFREG:
2378 btrfs_defrag_file(file);
2379 break;
2380 }
2381
2382 return 0;
2383}
6702ed49 2384
d03581f4
CH
2385long btrfs_ioctl(struct file *file, unsigned int
2386 cmd, unsigned long arg)
2387{
6da6abae 2388 struct btrfs_root *root = BTRFS_I(fdentry(file)->d_inode)->root;
d03581f4
CH
2389
2390 switch (cmd) {
2391 case BTRFS_IOC_SNAP_CREATE:
2392 return btrfs_ioctl_snap_create(root, (void __user *)arg);
6702ed49 2393 case BTRFS_IOC_DEFRAG:
d03581f4 2394 return btrfs_ioctl_defrag(file);
39279cc3 2395 }
d03581f4
CH
2396
2397 return -ENOTTY;
39279cc3
CM
2398}
2399
39279cc3
CM
2400/*
2401 * Called inside transaction, so use GFP_NOFS
2402 */
2403struct inode *btrfs_alloc_inode(struct super_block *sb)
2404{
2405 struct btrfs_inode *ei;
2406
2407 ei = kmem_cache_alloc(btrfs_inode_cachep, GFP_NOFS);
2408 if (!ei)
2409 return NULL;
15ee9bc7 2410 ei->last_trans = 0;
39279cc3
CM
2411 return &ei->vfs_inode;
2412}
2413
2414void btrfs_destroy_inode(struct inode *inode)
2415{
2416 WARN_ON(!list_empty(&inode->i_dentry));
2417 WARN_ON(inode->i_data.nrpages);
2418
2419 kmem_cache_free(btrfs_inode_cachep, BTRFS_I(inode));
2420}
2421
44ec0b71
CM
2422#if LINUX_VERSION_CODE > KERNEL_VERSION(2,6,23)
2423static void init_once(struct kmem_cache * cachep, void *foo)
2424#else
39279cc3
CM
2425static void init_once(void * foo, struct kmem_cache * cachep,
2426 unsigned long flags)
44ec0b71 2427#endif
39279cc3
CM
2428{
2429 struct btrfs_inode *ei = (struct btrfs_inode *) foo;
2430
2431 inode_init_once(&ei->vfs_inode);
2432}
2433
2434void btrfs_destroy_cachep(void)
2435{
2436 if (btrfs_inode_cachep)
2437 kmem_cache_destroy(btrfs_inode_cachep);
2438 if (btrfs_trans_handle_cachep)
2439 kmem_cache_destroy(btrfs_trans_handle_cachep);
2440 if (btrfs_transaction_cachep)
2441 kmem_cache_destroy(btrfs_transaction_cachep);
2442 if (btrfs_bit_radix_cachep)
2443 kmem_cache_destroy(btrfs_bit_radix_cachep);
2444 if (btrfs_path_cachep)
2445 kmem_cache_destroy(btrfs_path_cachep);
2446}
2447
86479a04 2448struct kmem_cache *btrfs_cache_create(const char *name, size_t size,
92fee66d 2449 unsigned long extra_flags,
44ec0b71
CM
2450#if LINUX_VERSION_CODE > KERNEL_VERSION(2,6,23)
2451 void (*ctor)(struct kmem_cache *, void *)
2452#else
92fee66d 2453 void (*ctor)(void *, struct kmem_cache *,
44ec0b71
CM
2454 unsigned long)
2455#endif
2456 )
92fee66d
CM
2457{
2458 return kmem_cache_create(name, size, 0, (SLAB_RECLAIM_ACCOUNT |
2459 SLAB_MEM_SPREAD | extra_flags), ctor
2460#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,23)
2461 ,NULL
2462#endif
2463 );
2464}
2465
39279cc3
CM
2466int btrfs_init_cachep(void)
2467{
86479a04 2468 btrfs_inode_cachep = btrfs_cache_create("btrfs_inode_cache",
92fee66d
CM
2469 sizeof(struct btrfs_inode),
2470 0, init_once);
39279cc3
CM
2471 if (!btrfs_inode_cachep)
2472 goto fail;
86479a04
CM
2473 btrfs_trans_handle_cachep =
2474 btrfs_cache_create("btrfs_trans_handle_cache",
2475 sizeof(struct btrfs_trans_handle),
2476 0, NULL);
39279cc3
CM
2477 if (!btrfs_trans_handle_cachep)
2478 goto fail;
86479a04 2479 btrfs_transaction_cachep = btrfs_cache_create("btrfs_transaction_cache",
39279cc3 2480 sizeof(struct btrfs_transaction),
92fee66d 2481 0, NULL);
39279cc3
CM
2482 if (!btrfs_transaction_cachep)
2483 goto fail;
86479a04 2484 btrfs_path_cachep = btrfs_cache_create("btrfs_path_cache",
23223584 2485 sizeof(struct btrfs_path),
92fee66d 2486 0, NULL);
39279cc3
CM
2487 if (!btrfs_path_cachep)
2488 goto fail;
86479a04 2489 btrfs_bit_radix_cachep = btrfs_cache_create("btrfs_radix", 256,
92fee66d 2490 SLAB_DESTROY_BY_RCU, NULL);
39279cc3
CM
2491 if (!btrfs_bit_radix_cachep)
2492 goto fail;
2493 return 0;
2494fail:
2495 btrfs_destroy_cachep();
2496 return -ENOMEM;
2497}
2498
2499static int btrfs_getattr(struct vfsmount *mnt,
2500 struct dentry *dentry, struct kstat *stat)
2501{
2502 struct inode *inode = dentry->d_inode;
2503 generic_fillattr(inode, stat);
2504 stat->blksize = 256 * 1024;
2505 return 0;
2506}
2507
2508static int btrfs_rename(struct inode * old_dir, struct dentry *old_dentry,
2509 struct inode * new_dir,struct dentry *new_dentry)
2510{
2511 struct btrfs_trans_handle *trans;
2512 struct btrfs_root *root = BTRFS_I(old_dir)->root;
2513 struct inode *new_inode = new_dentry->d_inode;
2514 struct inode *old_inode = old_dentry->d_inode;
2515 struct timespec ctime = CURRENT_TIME;
2516 struct btrfs_path *path;
39279cc3
CM
2517 int ret;
2518
2519 if (S_ISDIR(old_inode->i_mode) && new_inode &&
2520 new_inode->i_size > BTRFS_EMPTY_DIR_SIZE) {
2521 return -ENOTEMPTY;
2522 }
5f39d397 2523
39279cc3
CM
2524 mutex_lock(&root->fs_info->fs_mutex);
2525 trans = btrfs_start_transaction(root, 1);
5f39d397 2526
39279cc3
CM
2527 btrfs_set_trans_block_group(trans, new_dir);
2528 path = btrfs_alloc_path();
2529 if (!path) {
2530 ret = -ENOMEM;
2531 goto out_fail;
2532 }
2533
2534 old_dentry->d_inode->i_nlink++;
2535 old_dir->i_ctime = old_dir->i_mtime = ctime;
2536 new_dir->i_ctime = new_dir->i_mtime = ctime;
2537 old_inode->i_ctime = ctime;
5f39d397 2538
39279cc3
CM
2539 ret = btrfs_unlink_trans(trans, root, old_dir, old_dentry);
2540 if (ret)
2541 goto out_fail;
2542
2543 if (new_inode) {
2544 new_inode->i_ctime = CURRENT_TIME;
2545 ret = btrfs_unlink_trans(trans, root, new_dir, new_dentry);
2546 if (ret)
2547 goto out_fail;
39279cc3
CM
2548 }
2549 ret = btrfs_add_link(trans, new_dentry, old_inode);
2550 if (ret)
2551 goto out_fail;
2552
2553out_fail:
2554 btrfs_free_path(path);
2555 btrfs_end_transaction(trans, root);
2556 mutex_unlock(&root->fs_info->fs_mutex);
2557 return ret;
2558}
2559
2560static int btrfs_symlink(struct inode *dir, struct dentry *dentry,
2561 const char *symname)
2562{
2563 struct btrfs_trans_handle *trans;
2564 struct btrfs_root *root = BTRFS_I(dir)->root;
2565 struct btrfs_path *path;
2566 struct btrfs_key key;
2567 struct inode *inode;
2568 int err;
2569 int drop_inode = 0;
2570 u64 objectid;
2571 int name_len;
2572 int datasize;
5f39d397 2573 unsigned long ptr;
39279cc3 2574 struct btrfs_file_extent_item *ei;
5f39d397 2575 struct extent_buffer *leaf;
d3c2fdcf 2576 unsigned long nr;
39279cc3
CM
2577
2578 name_len = strlen(symname) + 1;
2579 if (name_len > BTRFS_MAX_INLINE_DATA_SIZE(root))
2580 return -ENAMETOOLONG;
2581 mutex_lock(&root->fs_info->fs_mutex);
2582 trans = btrfs_start_transaction(root, 1);
2583 btrfs_set_trans_block_group(trans, dir);
2584
2585 err = btrfs_find_free_objectid(trans, root, dir->i_ino, &objectid);
2586 if (err) {
2587 err = -ENOSPC;
2588 goto out_unlock;
2589 }
2590
2591 inode = btrfs_new_inode(trans, root, objectid,
2592 BTRFS_I(dir)->block_group, S_IFLNK|S_IRWXUGO);
2593 err = PTR_ERR(inode);
2594 if (IS_ERR(inode))
2595 goto out_unlock;
2596
2597 btrfs_set_trans_block_group(trans, inode);
2598 err = btrfs_add_nondir(trans, dentry, inode);
2599 if (err)
2600 drop_inode = 1;
2601 else {
2602 inode->i_mapping->a_ops = &btrfs_aops;
2603 inode->i_fop = &btrfs_file_operations;
2604 inode->i_op = &btrfs_file_inode_operations;
a52d9a80
CM
2605 extent_map_tree_init(&BTRFS_I(inode)->extent_tree,
2606 inode->i_mapping, GFP_NOFS);
07157aac 2607 BTRFS_I(inode)->extent_tree.ops = &btrfs_extent_map_ops;
39279cc3
CM
2608 }
2609 dir->i_sb->s_dirt = 1;
2610 btrfs_update_inode_block_group(trans, inode);
2611 btrfs_update_inode_block_group(trans, dir);
2612 if (drop_inode)
2613 goto out_unlock;
2614
2615 path = btrfs_alloc_path();
2616 BUG_ON(!path);
2617 key.objectid = inode->i_ino;
2618 key.offset = 0;
39279cc3
CM
2619 btrfs_set_key_type(&key, BTRFS_EXTENT_DATA_KEY);
2620 datasize = btrfs_file_extent_calc_inline_size(name_len);
2621 err = btrfs_insert_empty_item(trans, root, path, &key,
2622 datasize);
54aa1f4d
CM
2623 if (err) {
2624 drop_inode = 1;
2625 goto out_unlock;
2626 }
5f39d397
CM
2627 leaf = path->nodes[0];
2628 ei = btrfs_item_ptr(leaf, path->slots[0],
2629 struct btrfs_file_extent_item);
2630 btrfs_set_file_extent_generation(leaf, ei, trans->transid);
2631 btrfs_set_file_extent_type(leaf, ei,
39279cc3
CM
2632 BTRFS_FILE_EXTENT_INLINE);
2633 ptr = btrfs_file_extent_inline_start(ei);
5f39d397
CM
2634 write_extent_buffer(leaf, symname, ptr, name_len);
2635 btrfs_mark_buffer_dirty(leaf);
39279cc3 2636 btrfs_free_path(path);
5f39d397 2637
39279cc3
CM
2638 inode->i_op = &btrfs_symlink_inode_operations;
2639 inode->i_mapping->a_ops = &btrfs_symlink_aops;
2640 inode->i_size = name_len - 1;
54aa1f4d
CM
2641 err = btrfs_update_inode(trans, root, inode);
2642 if (err)
2643 drop_inode = 1;
39279cc3
CM
2644
2645out_unlock:
d3c2fdcf 2646 nr = trans->blocks_used;
39279cc3
CM
2647 btrfs_end_transaction(trans, root);
2648 mutex_unlock(&root->fs_info->fs_mutex);
39279cc3
CM
2649 if (drop_inode) {
2650 inode_dec_link_count(inode);
2651 iput(inode);
2652 }
d3c2fdcf 2653 btrfs_btree_balance_dirty(root, nr);
39279cc3
CM
2654 return err;
2655}
2656
2657static struct inode_operations btrfs_dir_inode_operations = {
2658 .lookup = btrfs_lookup,
2659 .create = btrfs_create,
2660 .unlink = btrfs_unlink,
2661 .link = btrfs_link,
2662 .mkdir = btrfs_mkdir,
2663 .rmdir = btrfs_rmdir,
2664 .rename = btrfs_rename,
2665 .symlink = btrfs_symlink,
2666 .setattr = btrfs_setattr,
618e21d5 2667 .mknod = btrfs_mknod,
5103e947
JB
2668 .setxattr = generic_setxattr,
2669 .getxattr = generic_getxattr,
2670 .listxattr = btrfs_listxattr,
2671 .removexattr = generic_removexattr,
39279cc3
CM
2672};
2673
2674static struct inode_operations btrfs_dir_ro_inode_operations = {
2675 .lookup = btrfs_lookup,
2676};
2677
2678static struct file_operations btrfs_dir_file_operations = {
2679 .llseek = generic_file_llseek,
2680 .read = generic_read_dir,
2681 .readdir = btrfs_readdir,
34287aa3 2682 .unlocked_ioctl = btrfs_ioctl,
39279cc3 2683#ifdef CONFIG_COMPAT
34287aa3 2684 .compat_ioctl = btrfs_ioctl,
39279cc3
CM
2685#endif
2686};
2687
07157aac
CM
2688static struct extent_map_ops btrfs_extent_map_ops = {
2689 .fill_delalloc = run_delalloc_range,
2690 .writepage_io_hook = btrfs_writepage_io_hook,
2691 .readpage_io_hook = btrfs_readpage_io_hook,
2692 .readpage_end_io_hook = btrfs_readpage_end_io_hook,
2693};
2694
39279cc3
CM
2695static struct address_space_operations btrfs_aops = {
2696 .readpage = btrfs_readpage,
2697 .writepage = btrfs_writepage,
b293f02e 2698 .writepages = btrfs_writepages,
3ab2fb5a 2699 .readpages = btrfs_readpages,
39279cc3
CM
2700 .sync_page = block_sync_page,
2701 .prepare_write = btrfs_prepare_write,
2702 .commit_write = btrfs_commit_write,
2703 .bmap = btrfs_bmap,
a52d9a80
CM
2704 .invalidatepage = btrfs_invalidatepage,
2705 .releasepage = btrfs_releasepage,
2706 .set_page_dirty = __set_page_dirty_nobuffers,
39279cc3
CM
2707};
2708
2709static struct address_space_operations btrfs_symlink_aops = {
2710 .readpage = btrfs_readpage,
2711 .writepage = btrfs_writepage,
2bf5a725
CM
2712 .invalidatepage = btrfs_invalidatepage,
2713 .releasepage = btrfs_releasepage,
39279cc3
CM
2714};
2715
2716static struct inode_operations btrfs_file_inode_operations = {
2717 .truncate = btrfs_truncate,
2718 .getattr = btrfs_getattr,
2719 .setattr = btrfs_setattr,
5103e947
JB
2720 .setxattr = generic_setxattr,
2721 .getxattr = generic_getxattr,
2722 .listxattr = btrfs_listxattr,
2723 .removexattr = generic_removexattr,
39279cc3
CM
2724};
2725
618e21d5
JB
2726static struct inode_operations btrfs_special_inode_operations = {
2727 .getattr = btrfs_getattr,
2728 .setattr = btrfs_setattr,
2729};
2730
39279cc3
CM
2731static struct inode_operations btrfs_symlink_inode_operations = {
2732 .readlink = generic_readlink,
2733 .follow_link = page_follow_link_light,
2734 .put_link = page_put_link,
2735};
This page took 0.210781 seconds and 5 git commands to generate.