Btrfs: extent_map optimizations to cut down on CPU usage
[deliverable/linux.git] / fs / btrfs / file.c
index 1734ca69555563621ed2b6c4662d4e7923825bd8..fe28404ae7f4c4ca68ec516a19bb3008b7e346e3 100644 (file)
@@ -82,8 +82,9 @@ static void btrfs_drop_pages(struct page **pages, size_t num_pages)
 
 static int insert_inline_extent(struct btrfs_trans_handle *trans,
                                struct btrfs_root *root, struct inode *inode,
-                               u64 offset, ssize_t size,
-                               struct page *page, size_t page_offset)
+                               u64 offset, size_t size,
+                               struct page **pages, size_t page_offset,
+                               int num_pages)
 {
        struct btrfs_key key;
        struct btrfs_path *path;
@@ -91,9 +92,12 @@ static int insert_inline_extent(struct btrfs_trans_handle *trans,
        char *kaddr;
        unsigned long ptr;
        struct btrfs_file_extent_item *ei;
+       struct page *page;
        u32 datasize;
        int err = 0;
        int ret;
+       int i;
+       ssize_t cur_size;
 
        path = btrfs_alloc_path();
        if (!path)
@@ -104,25 +108,97 @@ static int insert_inline_extent(struct btrfs_trans_handle *trans,
        key.objectid = inode->i_ino;
        key.offset = offset;
        btrfs_set_key_type(&key, BTRFS_EXTENT_DATA_KEY);
-       BUG_ON(size >= PAGE_CACHE_SIZE);
-       datasize = btrfs_file_extent_calc_inline_size(size);
+       datasize = btrfs_file_extent_calc_inline_size(offset + size);
 
-       ret = btrfs_insert_empty_item(trans, root, path, &key,
-                                     datasize);
-       if (ret) {
+       ret = btrfs_search_slot(trans, root, &key, path, 0, 1);
+       if (ret < 0) {
                err = ret;
                goto fail;
        }
-       leaf = path->nodes[0];
-       ei = btrfs_item_ptr(leaf, path->slots[0],
-                           struct btrfs_file_extent_item);
-       btrfs_set_file_extent_generation(leaf, ei, trans->transid);
-       btrfs_set_file_extent_type(leaf, ei, BTRFS_FILE_EXTENT_INLINE);
-       ptr = btrfs_file_extent_inline_start(ei);
-
-       kaddr = kmap_atomic(page, KM_USER0);
-       write_extent_buffer(leaf, kaddr + page_offset, ptr, size);
-       kunmap_atomic(kaddr, KM_USER0);
+       if (ret == 1) {
+               path->slots[0]--;
+               leaf = path->nodes[0];
+               ei = btrfs_item_ptr(leaf, path->slots[0],
+                                   struct btrfs_file_extent_item);
+
+               if (btrfs_file_extent_type(leaf, ei) !=
+                   BTRFS_FILE_EXTENT_INLINE) {
+                       goto insert;
+               }
+               btrfs_item_key_to_cpu(leaf, &key, path->slots[0]);
+               ret = 0;
+       }
+       if (ret == 0) {
+               u32 found_size;
+               u64 found_start;
+
+               leaf = path->nodes[0];
+               ei = btrfs_item_ptr(leaf, path->slots[0],
+                                   struct btrfs_file_extent_item);
+
+               if (btrfs_file_extent_type(leaf, ei) !=
+                   BTRFS_FILE_EXTENT_INLINE) {
+                       err = ret;
+                       btrfs_print_leaf(root, leaf);
+                       printk("found wasn't inline offset %Lu inode %lu\n",
+                              offset, inode->i_ino);
+                       goto fail;
+               }
+               found_start = key.offset;
+               found_size = btrfs_file_extent_inline_len(leaf,
+                                         btrfs_item_nr(leaf, path->slots[0]));
+
+               if (found_size < offset + size) {
+                       btrfs_release_path(root, path);
+                       ret = btrfs_search_slot(trans, root, &key, path,
+                                               offset + size - found_size -
+                                               found_start, 1);
+                       BUG_ON(ret != 0);
+                       ret = btrfs_extend_item(trans, root, path,
+                                               offset + size - found_size -
+                                               found_start);
+                       if (ret) {
+                               err = ret;
+                               goto fail;
+                       }
+                       leaf = path->nodes[0];
+                       ei = btrfs_item_ptr(leaf, path->slots[0],
+                                           struct btrfs_file_extent_item);
+               }
+       } else {
+insert:
+               btrfs_release_path(root, path);
+               ret = btrfs_insert_empty_item(trans, root, path, &key,
+                                             datasize);
+               if (ret) {
+                       err = ret;
+                       printk("got bad ret %d\n", ret);
+                       goto fail;
+               }
+               leaf = path->nodes[0];
+               ei = btrfs_item_ptr(leaf, path->slots[0],
+                                   struct btrfs_file_extent_item);
+               btrfs_set_file_extent_generation(leaf, ei, trans->transid);
+               btrfs_set_file_extent_type(leaf, ei, BTRFS_FILE_EXTENT_INLINE);
+       }
+       ptr = btrfs_file_extent_inline_start(ei) + offset;
+
+       cur_size = size;
+       i = 0;
+       while (size > 0) {
+               page = pages[i];
+               kaddr = kmap_atomic(page, KM_USER0);
+               cur_size = min(PAGE_CACHE_SIZE - page_offset, size);
+               write_extent_buffer(leaf, kaddr + page_offset, ptr, cur_size);
+               kunmap_atomic(kaddr, KM_USER0);
+               page_offset = 0;
+               ptr += cur_size;
+               size -= cur_size;
+               if (i >= num_pages) {
+                       printk("i %d num_pages %d\n", i, num_pages);
+               }
+               i++;
+       }
        btrfs_mark_buffer_dirty(leaf);
 fail:
        btrfs_free_path(path);
@@ -142,11 +218,12 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
        struct inode *inode = file->f_path.dentry->d_inode;
        struct extent_map *em;
        struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
-       u64 hint_block;
-       u64 num_blocks;
+       u64 hint_byte;
+       u64 num_bytes;
        u64 start_pos;
        u64 end_of_last_block;
        u64 end_pos = pos + write_bytes;
+       u32 inline_size;
        loff_t isize = i_size_read(inode);
 
        em = alloc_extent_map(GFP_NOFS);
@@ -156,11 +233,12 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
        em->bdev = inode->i_sb->s_bdev;
 
        start_pos = pos & ~((u64)root->sectorsize - 1);
-       num_blocks = (write_bytes + pos - start_pos + root->sectorsize - 1) >>
-                       inode->i_blkbits;
+       num_bytes = (write_bytes + pos - start_pos +
+                   root->sectorsize - 1) & ~((u64)root->sectorsize - 1);
 
        down_read(&BTRFS_I(inode)->root->snap_sem);
-       end_of_last_block = start_pos + (num_blocks << inode->i_blkbits) - 1;
+       end_of_last_block = start_pos + num_bytes - 1;
+
        lock_extent(em_tree, start_pos, end_of_last_block, GFP_NOFS);
        mutex_lock(&root->fs_info->fs_mutex);
        trans = btrfs_start_transaction(root, 1);
@@ -169,8 +247,8 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
                goto out_unlock;
        }
        btrfs_set_trans_block_group(trans, inode);
-       inode->i_blocks += num_blocks << 3;
-       hint_block = 0;
+       inode->i_blocks += num_bytes >> 9;
+       hint_byte = 0;
 
        if ((end_of_last_block & 4095) == 0) {
                printk("strange end of last %Lu %zu %Lu\n", start_pos, write_bytes, end_of_last_block);
@@ -191,11 +269,11 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
                        err = btrfs_drop_extents(trans, root, inode,
                                                 last_pos_in_file,
                                                 last_pos_in_file + hole_size,
-                                                &hint_block);
+                                                last_pos_in_file,
+                                                &hint_byte);
                        if (err)
                                goto failed;
 
-                       hole_size >>= inode->i_blkbits;
                        err = btrfs_insert_file_extent(trans, root,
                                                       inode->i_ino,
                                                       last_pos_in_file,
@@ -209,9 +287,11 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
         * either allocate an extent for the new bytes or setup the key
         * to show we are doing inline data in the extent
         */
-       if (isize >= PAGE_CACHE_SIZE || pos + write_bytes < inode->i_size ||
-           pos + write_bytes - start_pos > BTRFS_MAX_INLINE_DATA_SIZE(root)) {
+       inline_size = end_pos;
+       if (isize >= BTRFS_MAX_INLINE_DATA_SIZE(root) ||
+           inline_size >= BTRFS_MAX_INLINE_DATA_SIZE(root)) {
                u64 last_end;
+
                for (i = 0; i < num_pages; i++) {
                        struct page *p = pages[i];
                        SetPageUptodate(p);
@@ -222,23 +302,18 @@ static int dirty_and_release_pages(struct btrfs_trans_handle *trans,
                set_extent_delalloc(em_tree, start_pos, end_of_last_block,
                                 GFP_NOFS);
        } else {
-               struct page *p = pages[0];
+               u64 aligned_end;
                /* step one, delete the existing extents in this range */
-               /* FIXME blocksize != pagesize */
+               aligned_end = (pos + write_bytes + root->sectorsize - 1) &
+                       ~((u64)root->sectorsize - 1);
                err = btrfs_drop_extents(trans, root, inode, start_pos,
-                        (pos + write_bytes + root->sectorsize -1) &
-                        ~((u64)root->sectorsize - 1), &hint_block);
+                                        aligned_end, end_pos, &hint_byte);
                if (err)
                        goto failed;
-
                err = insert_inline_extent(trans, root, inode, start_pos,
-                                          end_pos - start_pos, p, 0);
+                                          end_pos - start_pos, pages, 0,
+                                          num_pages);
                BUG_ON(err);
-               em->start = start_pos;
-               em->end = end_pos - 1;
-               em->block_start = EXTENT_MAP_INLINE;
-               em->block_end = EXTENT_MAP_INLINE;
-               add_extent_mapping(em_tree, em);
        }
        if (end_pos > isize) {
                i_size_write(inode, end_pos);
@@ -283,7 +358,7 @@ int btrfs_drop_extent_cache(struct inode *inode, u64 start, u64 end)
  */
 int btrfs_drop_extents(struct btrfs_trans_handle *trans,
                       struct btrfs_root *root, struct inode *inode,
-                      u64 start, u64 end, u64 *hint_block)
+                      u64 start, u64 end, u64 inline_end, u64 *hint_byte)
 {
        int ret;
        struct btrfs_key key;
@@ -346,8 +421,7 @@ next_slot:
                        found_type = btrfs_file_extent_type(leaf, extent);
                        if (found_type == BTRFS_FILE_EXTENT_REG) {
                                extent_end = key.offset +
-                                (btrfs_file_extent_num_blocks(leaf, extent) <<
-                                        inode->i_blkbits);
+                                    btrfs_file_extent_num_bytes(leaf, extent);
                                found_extent = 1;
                        } else if (found_type == BTRFS_FILE_EXTENT_INLINE) {
                                struct btrfs_item *item;
@@ -386,22 +460,22 @@ next_slot:
 
                if (end < extent_end && end >= key.offset) {
                        if (found_extent) {
-                               u64 disk_blocknr =
-                                   btrfs_file_extent_disk_blocknr(leaf,extent);
-                               u64 disk_num_blocks =
-                                   btrfs_file_extent_disk_num_blocks(leaf,
+                               u64 disk_bytenr =
+                                   btrfs_file_extent_disk_bytenr(leaf, extent);
+                               u64 disk_num_bytes =
+                                   btrfs_file_extent_disk_num_bytes(leaf,
                                                                      extent);
                                read_extent_buffer(leaf, &old,
                                                   (unsigned long)extent,
                                                   sizeof(old));
-                               if (disk_blocknr != 0) {
+                               if (disk_bytenr != 0) {
                                        ret = btrfs_inc_extent_ref(trans, root,
-                                                disk_blocknr, disk_num_blocks);
+                                                disk_bytenr, disk_num_bytes);
                                        BUG_ON(ret);
                                }
                        }
-                       WARN_ON(found_inline);
-                       bookend = 1;
+                       if (!found_inline)
+                               bookend = 1;
                }
                /* truncate existing extent */
                if (start > key.offset) {
@@ -410,55 +484,58 @@ next_slot:
                        keep = 1;
                        WARN_ON(start & (root->sectorsize - 1));
                        if (found_extent) {
-                               new_num = (start - key.offset) >>
-                                       inode->i_blkbits;
-                               old_num = btrfs_file_extent_num_blocks(leaf,
-                                                                      extent);
-                               *hint_block =
-                                       btrfs_file_extent_disk_blocknr(leaf,
-                                                                      extent);
-                               if (btrfs_file_extent_disk_blocknr(leaf,
-                                                                  extent)) {
+                               new_num = start - key.offset;
+                               old_num = btrfs_file_extent_num_bytes(leaf,
+                                                                     extent);
+                               *hint_byte =
+                                       btrfs_file_extent_disk_bytenr(leaf,
+                                                                     extent);
+                               if (btrfs_file_extent_disk_bytenr(leaf,
+                                                                 extent)) {
                                        inode->i_blocks -=
-                                               (old_num - new_num) << 3;
+                                               (old_num - new_num) >> 9;
                                }
-                               btrfs_set_file_extent_num_blocks(leaf,
-                                                                extent,
-                                                                new_num);
+                               btrfs_set_file_extent_num_bytes(leaf, extent,
+                                                               new_num);
                                btrfs_mark_buffer_dirty(leaf);
-                       } else {
-                               WARN_ON(1);
+                       } else if (end > extent_end &&
+                                  key.offset < inline_end &&
+                                  inline_end < extent_end) {
+                               u32 new_size;
+                               new_size = btrfs_file_extent_calc_inline_size(
+                                                  inline_end - key.offset);
+                               btrfs_truncate_item(trans, root, path,
+                                                   new_size);
                        }
                }
                /* delete the entire extent */
                if (!keep) {
-                       u64 disk_blocknr = 0;
-                       u64 disk_num_blocks = 0;
-                       u64 extent_num_blocks = 0;
+                       u64 disk_bytenr = 0;
+                       u64 disk_num_bytes = 0;
+                       u64 extent_num_bytes = 0;
                        if (found_extent) {
-                               disk_blocknr =
-                                     btrfs_file_extent_disk_blocknr(leaf,
+                               disk_bytenr =
+                                     btrfs_file_extent_disk_bytenr(leaf,
                                                                     extent);
-                               disk_num_blocks =
-                                     btrfs_file_extent_disk_num_blocks(leaf,
-                                                                       extent);
-                               extent_num_blocks =
-                                     btrfs_file_extent_num_blocks(leaf,
-                                                                  extent);
-                               *hint_block =
-                                       btrfs_file_extent_disk_blocknr(leaf,
+                               disk_num_bytes =
+                                     btrfs_file_extent_disk_num_bytes(leaf,
                                                                       extent);
+                               extent_num_bytes =
+                                     btrfs_file_extent_num_bytes(leaf, extent);
+                               *hint_byte =
+                                       btrfs_file_extent_disk_bytenr(leaf,
+                                                                     extent);
                        }
                        ret = btrfs_del_item(trans, root, path);
                        /* TODO update progress marker and return */
                        BUG_ON(ret);
                        btrfs_release_path(root, path);
                        extent = NULL;
-                       if (found_extent && disk_blocknr != 0) {
-                               inode->i_blocks -= extent_num_blocks << 3;
+                       if (found_extent && disk_bytenr != 0) {
+                               inode->i_blocks -= extent_num_bytes >> 9;
                                ret = btrfs_free_extent(trans, root,
-                                                       disk_blocknr,
-                                                       disk_num_blocks, 0);
+                                                       disk_bytenr,
+                                                       disk_num_bytes, 0);
                        }
 
                        BUG_ON(ret);
@@ -491,20 +568,19 @@ next_slot:
                                            (unsigned long)extent, sizeof(old));
 
                        btrfs_set_file_extent_offset(leaf, extent,
-                                   le64_to_cpu(old.offset) +
-                                   ((end - key.offset) >> inode->i_blkbits));
-                       WARN_ON(le64_to_cpu(old.num_blocks) <
-                               (extent_end - end) >> inode->i_blkbits);
-                       btrfs_set_file_extent_num_blocks(leaf, extent,
-                                   (extent_end - end) >> inode->i_blkbits);
-
+                                   le64_to_cpu(old.offset) + end - key.offset);
+                       WARN_ON(le64_to_cpu(old.num_bytes) <
+                               (extent_end - end));
+                       btrfs_set_file_extent_num_bytes(leaf, extent,
+                                                       extent_end - end);
                        btrfs_set_file_extent_type(leaf, extent,
                                                   BTRFS_FILE_EXTENT_REG);
+
                        btrfs_mark_buffer_dirty(path->nodes[0]);
-                       if (le64_to_cpu(old.disk_blocknr) != 0) {
+                       if (le64_to_cpu(old.disk_bytenr) != 0) {
                                inode->i_blocks +=
-                                     btrfs_file_extent_num_blocks(leaf,
-                                                                  extent) << 3;
+                                     btrfs_file_extent_num_bytes(leaf,
+                                                                 extent) >> 9;
                        }
                        ret = 0;
                        goto out;
@@ -531,12 +607,9 @@ static int prepare_pages(struct btrfs_root *root,
        unsigned long index = pos >> PAGE_CACHE_SHIFT;
        struct inode *inode = file->f_path.dentry->d_inode;
        int err = 0;
-       u64 num_blocks;
        u64 start_pos;
 
        start_pos = pos & ~((u64)root->sectorsize - 1);
-       num_blocks = (write_bytes + pos - start_pos + root->sectorsize - 1) >>
-                       inode->i_blkbits;
 
        memset(pages, 0, num_pages * sizeof(struct page *));
 
This page took 0.033727 seconds and 5 git commands to generate.