summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
Diffstat (limited to 'sys-fs/btrfs/files/btrfs-0.16-hotfix-1.patch')
-rw-r--r--sys-fs/btrfs/files/btrfs-0.16-hotfix-1.patch992
1 files changed, 0 insertions, 992 deletions
diff --git a/sys-fs/btrfs/files/btrfs-0.16-hotfix-1.patch b/sys-fs/btrfs/files/btrfs-0.16-hotfix-1.patch
deleted file mode 100644
index dcd6c397cb9b..000000000000
--- a/sys-fs/btrfs/files/btrfs-0.16-hotfix-1.patch
+++ /dev/null
@@ -1,992 +0,0 @@
-diff -Nurp btrfs-0.16/async-thread.c btrfs-0.16.new/async-thread.c
---- btrfs-0.16/async-thread.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/async-thread.c 2008-08-20 17:43:19.211404694 -0600
-@@ -49,6 +49,8 @@ struct btrfs_worker_thread {
- /* number of things on the pending list */
- atomic_t num_pending;
-
-+ unsigned long sequence;
-+
- /* protects the pending list. */
- spinlock_t lock;
-
-@@ -153,7 +155,7 @@ int btrfs_stop_workers(struct btrfs_work
- /*
- * simple init on struct btrfs_workers
- */
--void btrfs_init_workers(struct btrfs_workers *workers, int max)
-+void btrfs_init_workers(struct btrfs_workers *workers, char *name, int max)
- {
- workers->num_workers = 0;
- INIT_LIST_HEAD(&workers->worker_list);
-@@ -161,6 +163,7 @@ void btrfs_init_workers(struct btrfs_wor
- spin_lock_init(&workers->lock);
- workers->max_workers = max;
- workers->idle_thresh = 32;
-+ workers->name = name;
- }
-
- /*
-@@ -184,7 +187,9 @@ int btrfs_start_workers(struct btrfs_wor
- INIT_LIST_HEAD(&worker->worker_list);
- spin_lock_init(&worker->lock);
- atomic_set(&worker->num_pending, 0);
-- worker->task = kthread_run(worker_loop, worker, "btrfs");
-+ worker->task = kthread_run(worker_loop, worker,
-+ "btrfs-%s-%d", workers->name,
-+ workers->num_workers + i);
- worker->workers = workers;
- if (IS_ERR(worker->task)) {
- kfree(worker);
-@@ -194,6 +199,7 @@ int btrfs_start_workers(struct btrfs_wor
-
- spin_lock_irq(&workers->lock);
- list_add_tail(&worker->worker_list, &workers->idle_list);
-+ worker->idle = 1;
- workers->num_workers++;
- spin_unlock_irq(&workers->lock);
- }
-@@ -235,7 +241,10 @@ static struct btrfs_worker_thread *next_
- */
- next = workers->worker_list.next;
- worker = list_entry(next, struct btrfs_worker_thread, worker_list);
-- list_move_tail(next, &workers->worker_list);
-+ atomic_inc(&worker->num_pending);
-+ worker->sequence++;
-+ if (worker->sequence % workers->idle_thresh == 0)
-+ list_move_tail(next, &workers->worker_list);
- return worker;
- }
-
-diff -Nurp btrfs-0.16/async-thread.h btrfs-0.16.new/async-thread.h
---- btrfs-0.16/async-thread.h 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/async-thread.h 2008-08-20 17:43:19.211404694 -0600
-@@ -69,11 +69,14 @@ struct btrfs_workers {
-
- /* lock for finding the next worker thread to queue on */
- spinlock_t lock;
-+
-+ /* extra name for this worker */
-+ char *name;
- };
-
- int btrfs_queue_worker(struct btrfs_workers *workers, struct btrfs_work *work);
- int btrfs_start_workers(struct btrfs_workers *workers, int num_workers);
- int btrfs_stop_workers(struct btrfs_workers *workers);
--void btrfs_init_workers(struct btrfs_workers *workers, int max);
-+void btrfs_init_workers(struct btrfs_workers *workers, char *name, int max);
- int btrfs_requeue_work(struct btrfs_work *work);
- #endif
-diff -Nurp btrfs-0.16/compat.h btrfs-0.16.new/compat.h
---- btrfs-0.16/compat.h 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/compat.h 2008-08-20 17:43:19.501402495 -0600
-@@ -1,6 +1,9 @@
- #ifndef _COMPAT_H_
- #define _COMPAT_H_
-
-+#if LINUX_VERSION_CODE <= KERNEL_VERSION(2,6,26)
-+#define trylock_page(page) (!TestSetPageLocked(page))
-+#endif
-
- /*
- * Even if AppArmor isn't enabled, it still has different prototypes.
-diff -Nurp btrfs-0.16/ctree.h btrfs-0.16.new/ctree.h
---- btrfs-0.16/ctree.h 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/ctree.h 2008-08-20 17:43:19.521406669 -0600
-@@ -526,6 +526,7 @@ struct btrfs_fs_info {
- struct btrfs_transaction *running_transaction;
- wait_queue_head_t transaction_throttle;
- wait_queue_head_t transaction_wait;
-+ wait_queue_head_t async_submit_wait;
- struct btrfs_super_block super_copy;
- struct btrfs_super_block super_for_commit;
- struct block_device *__bdev;
-@@ -544,6 +545,7 @@ struct btrfs_fs_info {
- struct list_head hashers;
- struct list_head dead_roots;
- atomic_t nr_async_submits;
-+ atomic_t nr_async_bios;
-
- /*
- * this is used by the balancing code to wait for all the pending
-@@ -1648,7 +1650,7 @@ int btrfs_csum_truncate(struct btrfs_tra
- /* inode.c */
-
- /* RHEL and EL kernels have a patch that renames PG_checked to FsMisc */
--#ifdef ClearPageFsMisc
-+#if defined(ClearPageFsMisc) && !defined(ClearPageChecked)
- #define ClearPageChecked ClearPageFsMisc
- #define SetPageChecked SetPageFsMisc
- #define PageChecked PageFsMisc
-diff -Nurp btrfs-0.16/disk-io.c btrfs-0.16.new/disk-io.c
---- btrfs-0.16/disk-io.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/disk-io.c 2008-08-20 17:43:19.541408335 -0600
-@@ -429,14 +429,38 @@ int btrfs_bio_wq_end_io(struct btrfs_fs_
- return 0;
- }
-
-+unsigned long btrfs_async_submit_limit(struct btrfs_fs_info *info)
-+{
-+ unsigned long limit = min_t(unsigned long,
-+ info->workers.max_workers,
-+ info->fs_devices->open_devices);
-+ return 256 * limit;
-+}
-+
-+int btrfs_congested_async(struct btrfs_fs_info *info, int iodone)
-+{
-+ return atomic_read(&info->nr_async_bios) >
-+ btrfs_async_submit_limit(info);
-+}
-+
- static void run_one_async_submit(struct btrfs_work *work)
- {
- struct btrfs_fs_info *fs_info;
- struct async_submit_bio *async;
-+ int limit;
-
- async = container_of(work, struct async_submit_bio, work);
- fs_info = BTRFS_I(async->inode)->root->fs_info;
-+
-+ limit = btrfs_async_submit_limit(fs_info);
-+ limit = limit * 2 / 3;
-+
- atomic_dec(&fs_info->nr_async_submits);
-+
-+ if (atomic_read(&fs_info->nr_async_submits) < limit &&
-+ waitqueue_active(&fs_info->async_submit_wait))
-+ wake_up(&fs_info->async_submit_wait);
-+
- async->submit_bio_hook(async->inode, async->rw, async->bio,
- async->mirror_num);
- kfree(async);
-@@ -447,6 +471,7 @@ int btrfs_wq_submit_bio(struct btrfs_fs_
- extent_submit_bio_hook_t *submit_bio_hook)
- {
- struct async_submit_bio *async;
-+ int limit = btrfs_async_submit_limit(fs_info);
-
- async = kmalloc(sizeof(*async), GFP_NOFS);
- if (!async)
-@@ -461,6 +486,10 @@ int btrfs_wq_submit_bio(struct btrfs_fs_
- async->work.flags = 0;
- atomic_inc(&fs_info->nr_async_submits);
- btrfs_queue_worker(&fs_info->workers, &async->work);
-+
-+ wait_event_timeout(fs_info->async_submit_wait,
-+ (atomic_read(&fs_info->nr_async_submits) < limit),
-+ HZ/10);
- return 0;
- }
-
-@@ -475,11 +504,11 @@ static int __btree_submit_bio_hook(struc
-
- /*
- * when we're called for a write, we're already in the async
-- * submission context. Just jump ingo btrfs_map_bio
-+ * submission context. Just jump into btrfs_map_bio
- */
- if (rw & (1 << BIO_RW)) {
- return btrfs_map_bio(BTRFS_I(inode)->root, rw, bio,
-- mirror_num, 0);
-+ mirror_num, 1);
- }
-
- /*
-@@ -511,6 +540,12 @@ static int btree_writepage(struct page *
- {
- struct extent_io_tree *tree;
- tree = &BTRFS_I(page->mapping->host)->io_tree;
-+
-+ if (current->flags & PF_MEMALLOC) {
-+ redirty_page_for_writepage(wbc, page);
-+ unlock_page(page);
-+ return 0;
-+ }
- return extent_write_full_page(tree, page, btree_get_extent, wbc);
- }
-
-@@ -522,16 +557,11 @@ static int btree_writepages(struct addre
- if (wbc->sync_mode == WB_SYNC_NONE) {
- u64 num_dirty;
- u64 start = 0;
-- unsigned long thresh = 96 * 1024 * 1024;
-+ unsigned long thresh = 8 * 1024 * 1024;
-
- if (wbc->for_kupdate)
- return 0;
-
-- if (current_is_pdflush()) {
-- thresh = 96 * 1024 * 1024;
-- } else {
-- thresh = 8 * 1024 * 1024;
-- }
- num_dirty = count_range_bits(tree, &start, (u64)-1,
- thresh, EXTENT_DIRTY);
- if (num_dirty < thresh) {
-@@ -938,15 +968,13 @@ static int btrfs_congested_fn(void *cong
- {
- struct btrfs_fs_info *info = (struct btrfs_fs_info *)congested_data;
- int ret = 0;
-- int limit = 256 * info->fs_devices->open_devices;
- struct list_head *cur;
- struct btrfs_device *device;
- struct backing_dev_info *bdi;
-
- if ((bdi_bits & (1 << BDI_write_congested)) &&
-- atomic_read(&info->nr_async_submits) > limit) {
-+ btrfs_congested_async(info, 0))
- return 1;
-- }
-
- list_for_each(cur, &info->fs_devices->devices) {
- device = list_entry(cur, struct btrfs_device, dev_list);
-@@ -1250,6 +1278,7 @@ struct btrfs_root *open_ctree(struct sup
- INIT_LIST_HEAD(&fs_info->space_info);
- btrfs_mapping_init(&fs_info->mapping_tree);
- atomic_set(&fs_info->nr_async_submits, 0);
-+ atomic_set(&fs_info->nr_async_bios, 0);
- atomic_set(&fs_info->throttles, 0);
- atomic_set(&fs_info->throttle_gen, 0);
- fs_info->sb = sb;
-@@ -1311,6 +1340,7 @@ struct btrfs_root *open_ctree(struct sup
- mutex_init(&fs_info->volume_mutex);
- init_waitqueue_head(&fs_info->transaction_throttle);
- init_waitqueue_head(&fs_info->transaction_wait);
-+ init_waitqueue_head(&fs_info->async_submit_wait);
-
- #if 0
- ret = add_hasher(fs_info, "crc32c");
-@@ -1347,8 +1377,11 @@ struct btrfs_root *open_ctree(struct sup
- * queue work function gets called at interrupt time, and so it
- * cannot dynamically grow.
- */
-- btrfs_init_workers(&fs_info->workers, fs_info->thread_pool_size);
-- btrfs_init_workers(&fs_info->submit_workers, fs_info->thread_pool_size);
-+ btrfs_init_workers(&fs_info->workers, "worker",
-+ fs_info->thread_pool_size);
-+ btrfs_init_workers(&fs_info->submit_workers, "submit",
-+ min_t(u64, fs_devices->num_devices,
-+ fs_info->thread_pool_size));
-
- /* a higher idle thresh on the submit workers makes it much more
- * likely that bios will be send down in a sane order to the
-@@ -1356,9 +1389,18 @@ struct btrfs_root *open_ctree(struct sup
- */
- fs_info->submit_workers.idle_thresh = 64;
-
-- btrfs_init_workers(&fs_info->fixup_workers, 1);
-- btrfs_init_workers(&fs_info->endio_workers, fs_info->thread_pool_size);
-- btrfs_init_workers(&fs_info->endio_write_workers,
-+ /* fs_info->workers is responsible for checksumming file data
-+ * blocks and metadata. Using a larger idle thresh allows each
-+ * worker thread to operate on things in roughly the order they
-+ * were sent by the writeback daemons, improving overall locality
-+ * of the IO going down the pipe.
-+ */
-+ fs_info->workers.idle_thresh = 128;
-+
-+ btrfs_init_workers(&fs_info->fixup_workers, "fixup", 1);
-+ btrfs_init_workers(&fs_info->endio_workers, "endio",
-+ fs_info->thread_pool_size);
-+ btrfs_init_workers(&fs_info->endio_write_workers, "endio-write",
- fs_info->thread_pool_size);
-
- /*
-@@ -1823,10 +1865,10 @@ void btrfs_btree_balance_dirty(struct bt
- struct extent_io_tree *tree;
- u64 num_dirty;
- u64 start = 0;
-- unsigned long thresh = 16 * 1024 * 1024;
-+ unsigned long thresh = 96 * 1024 * 1024;
- tree = &BTRFS_I(root->fs_info->btree_inode)->io_tree;
-
-- if (current_is_pdflush())
-+ if (current_is_pdflush() || current->flags & PF_MEMALLOC)
- return;
-
- num_dirty = count_range_bits(tree, &start, (u64)-1,
-diff -Nurp btrfs-0.16/disk-io.h btrfs-0.16.new/disk-io.h
---- btrfs-0.16/disk-io.h 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/disk-io.h 2008-08-20 17:43:19.541408335 -0600
-@@ -72,4 +72,6 @@ int btrfs_bio_wq_end_io(struct btrfs_fs_
- int btrfs_wq_submit_bio(struct btrfs_fs_info *fs_info, struct inode *inode,
- int rw, struct bio *bio, int mirror_num,
- extent_submit_bio_hook_t *submit_bio_hook);
-+int btrfs_congested_async(struct btrfs_fs_info *info, int iodone);
-+unsigned long btrfs_async_submit_limit(struct btrfs_fs_info *info);
- #endif
-diff -Nurp btrfs-0.16/extent_io.c btrfs-0.16.new/extent_io.c
---- btrfs-0.16/extent_io.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/extent_io.c 2008-08-20 17:43:19.561407722 -0600
-@@ -14,6 +14,9 @@
- #include <linux/pagevec.h>
- #include "extent_io.h"
- #include "extent_map.h"
-+#include "compat.h"
-+#include "ctree.h"
-+#include "btrfs_inode.h"
-
- /* temporary define until extent_map moves out of btrfs */
- struct kmem_cache *btrfs_cache_create(const char *name, size_t size,
-@@ -1393,15 +1396,11 @@ static int end_bio_extent_writepage(stru
- {
- int uptodate = err == 0;
- struct bio_vec *bvec = bio->bi_io_vec + bio->bi_vcnt - 1;
-- struct extent_state *state = bio->bi_private;
-- struct extent_io_tree *tree = state->tree;
-- struct rb_node *node;
-+ struct extent_io_tree *tree;
- u64 start;
- u64 end;
-- u64 cur;
- int whole_page;
- int ret;
-- unsigned long flags;
-
- #if LINUX_VERSION_CODE <= KERNEL_VERSION(2,6,23)
- if (bio->bi_size)
-@@ -1409,6 +1408,8 @@ static int end_bio_extent_writepage(stru
- #endif
- do {
- struct page *page = bvec->bv_page;
-+ tree = &BTRFS_I(page->mapping->host)->io_tree;
-+
- start = ((u64)page->index << PAGE_CACHE_SHIFT) +
- bvec->bv_offset;
- end = start + bvec->bv_len - 1;
-@@ -1422,7 +1423,7 @@ static int end_bio_extent_writepage(stru
- prefetchw(&bvec->bv_page->flags);
- if (tree->ops && tree->ops->writepage_end_io_hook) {
- ret = tree->ops->writepage_end_io_hook(page, start,
-- end, state, uptodate);
-+ end, NULL, uptodate);
- if (ret)
- uptodate = 0;
- }
-@@ -1430,9 +1431,8 @@ static int end_bio_extent_writepage(stru
- if (!uptodate && tree->ops &&
- tree->ops->writepage_io_failed_hook) {
- ret = tree->ops->writepage_io_failed_hook(bio, page,
-- start, end, state);
-+ start, end, NULL);
- if (ret == 0) {
-- state = NULL;
- uptodate = (err == 0);
- continue;
- }
-@@ -1444,68 +1444,7 @@ static int end_bio_extent_writepage(stru
- SetPageError(page);
- }
-
-- /*
-- * bios can get merged in funny ways, and so we need to
-- * be careful with the state variable. We know the
-- * state won't be merged with others because it has
-- * WRITEBACK set, but we can't be sure each biovec is
-- * sequential in the file. So, if our cached state
-- * doesn't match the expected end, search the tree
-- * for the correct one.
-- */
--
-- spin_lock_irqsave(&tree->lock, flags);
-- if (!state || state->end != end) {
-- state = NULL;
-- node = __etree_search(tree, start, NULL, NULL);
-- if (node) {
-- state = rb_entry(node, struct extent_state,
-- rb_node);
-- if (state->end != end ||
-- !(state->state & EXTENT_WRITEBACK))
-- state = NULL;
-- }
-- if (!state) {
-- spin_unlock_irqrestore(&tree->lock, flags);
-- clear_extent_writeback(tree, start,
-- end, GFP_ATOMIC);
-- goto next_io;
-- }
-- }
-- cur = end;
-- while(1) {
-- struct extent_state *clear = state;
-- cur = state->start;
-- node = rb_prev(&state->rb_node);
-- if (node) {
-- state = rb_entry(node,
-- struct extent_state,
-- rb_node);
-- } else {
-- state = NULL;
-- }
--
-- clear_state_bit(tree, clear, EXTENT_WRITEBACK,
-- 1, 0);
-- if (cur == start)
-- break;
-- if (cur < start) {
-- WARN_ON(1);
-- break;
-- }
-- if (!node)
-- break;
-- }
-- /* before releasing the lock, make sure the next state
-- * variable has the expected bits set and corresponds
-- * to the correct offsets in the file
-- */
-- if (state && (state->end + 1 != start ||
-- !(state->state & EXTENT_WRITEBACK))) {
-- state = NULL;
-- }
-- spin_unlock_irqrestore(&tree->lock, flags);
--next_io:
-+ clear_extent_writeback(tree, start, end, GFP_ATOMIC);
-
- if (whole_page)
- end_page_writeback(page);
-@@ -1538,13 +1477,9 @@ static int end_bio_extent_readpage(struc
- {
- int uptodate = test_bit(BIO_UPTODATE, &bio->bi_flags);
- struct bio_vec *bvec = bio->bi_io_vec + bio->bi_vcnt - 1;
-- struct extent_state *state = bio->bi_private;
-- struct extent_io_tree *tree = state->tree;
-- struct rb_node *node;
-+ struct extent_io_tree *tree;
- u64 start;
- u64 end;
-- u64 cur;
-- unsigned long flags;
- int whole_page;
- int ret;
-
-@@ -1555,6 +1490,8 @@ static int end_bio_extent_readpage(struc
-
- do {
- struct page *page = bvec->bv_page;
-+ tree = &BTRFS_I(page->mapping->host)->io_tree;
-+
- start = ((u64)page->index << PAGE_CACHE_SHIFT) +
- bvec->bv_offset;
- end = start + bvec->bv_len - 1;
-@@ -1569,80 +1506,26 @@ static int end_bio_extent_readpage(struc
-
- if (uptodate && tree->ops && tree->ops->readpage_end_io_hook) {
- ret = tree->ops->readpage_end_io_hook(page, start, end,
-- state);
-+ NULL);
- if (ret)
- uptodate = 0;
- }
- if (!uptodate && tree->ops &&
- tree->ops->readpage_io_failed_hook) {
- ret = tree->ops->readpage_io_failed_hook(bio, page,
-- start, end, state);
-+ start, end, NULL);
- if (ret == 0) {
-- state = NULL;
- uptodate =
- test_bit(BIO_UPTODATE, &bio->bi_flags);
- continue;
- }
- }
-
-- spin_lock_irqsave(&tree->lock, flags);
-- if (!state || state->end != end) {
-- state = NULL;
-- node = __etree_search(tree, start, NULL, NULL);
-- if (node) {
-- state = rb_entry(node, struct extent_state,
-- rb_node);
-- if (state->end != end ||
-- !(state->state & EXTENT_LOCKED))
-- state = NULL;
-- }
-- if (!state) {
-- spin_unlock_irqrestore(&tree->lock, flags);
-- if (uptodate)
-- set_extent_uptodate(tree, start, end,
-- GFP_ATOMIC);
-- unlock_extent(tree, start, end, GFP_ATOMIC);
-- goto next_io;
-- }
-- }
-+ if (uptodate)
-+ set_extent_uptodate(tree, start, end,
-+ GFP_ATOMIC);
-+ unlock_extent(tree, start, end, GFP_ATOMIC);
-
-- cur = end;
-- while(1) {
-- struct extent_state *clear = state;
-- cur = state->start;
-- node = rb_prev(&state->rb_node);
-- if (node) {
-- state = rb_entry(node,
-- struct extent_state,
-- rb_node);
-- } else {
-- state = NULL;
-- }
-- if (uptodate) {
-- set_state_cb(tree, clear, EXTENT_UPTODATE);
-- clear->state |= EXTENT_UPTODATE;
-- }
-- clear_state_bit(tree, clear, EXTENT_LOCKED,
-- 1, 0);
-- if (cur == start)
-- break;
-- if (cur < start) {
-- WARN_ON(1);
-- break;
-- }
-- if (!node)
-- break;
-- }
-- /* before releasing the lock, make sure the next state
-- * variable has the expected bits set and corresponds
-- * to the correct offsets in the file
-- */
-- if (state && (state->end + 1 != start ||
-- !(state->state & EXTENT_LOCKED))) {
-- state = NULL;
-- }
-- spin_unlock_irqrestore(&tree->lock, flags);
--next_io:
- if (whole_page) {
- if (uptodate) {
- SetPageUptodate(page);
-@@ -1682,8 +1565,7 @@ static int end_bio_extent_preparewrite(s
- {
- const int uptodate = test_bit(BIO_UPTODATE, &bio->bi_flags);
- struct bio_vec *bvec = bio->bi_io_vec + bio->bi_vcnt - 1;
-- struct extent_state *state = bio->bi_private;
-- struct extent_io_tree *tree = state->tree;
-+ struct extent_io_tree *tree;
- u64 start;
- u64 end;
-
-@@ -1694,6 +1576,8 @@ static int end_bio_extent_preparewrite(s
-
- do {
- struct page *page = bvec->bv_page;
-+ tree = &BTRFS_I(page->mapping->host)->io_tree;
-+
- start = ((u64)page->index << PAGE_CACHE_SHIFT) +
- bvec->bv_offset;
- end = start + bvec->bv_len - 1;
-@@ -1764,7 +1648,7 @@ static int submit_one_bio(int rw, struct
- BUG_ON(state->end != end);
- spin_unlock_irq(&tree->lock);
-
-- bio->bi_private = state;
-+ bio->bi_private = NULL;
-
- bio_get(bio);
-
-@@ -3055,7 +2939,7 @@ int read_extent_buffer_pages(struct exte
- for (i = start_i; i < num_pages; i++) {
- page = extent_buffer_page(eb, i);
- if (!wait) {
-- if (TestSetPageLocked(page))
-+ if (!trylock_page(page))
- goto unlock_exit;
- } else {
- lock_page(page);
-diff -Nurp btrfs-0.16/extent_map.c btrfs-0.16.new/extent_map.c
---- btrfs-0.16/extent_map.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/extent_map.c 2008-08-20 17:43:19.571405082 -0600
-@@ -207,7 +207,14 @@ int add_extent_mapping(struct extent_map
- int ret = 0;
- struct extent_map *merge = NULL;
- struct rb_node *rb;
-+ struct extent_map *exist;
-
-+ exist = lookup_extent_mapping(tree, em->start, em->len);
-+ if (exist) {
-+ free_extent_map(exist);
-+ ret = -EEXIST;
-+ goto out;
-+ }
- assert_spin_locked(&tree->lock);
- rb = tree_insert(&tree->map, em->start, &em->rb_node);
- if (rb) {
-diff -Nurp btrfs-0.16/file-item.c btrfs-0.16.new/file-item.c
---- btrfs-0.16/file-item.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/file-item.c 2008-08-20 17:43:19.571405082 -0600
-@@ -134,7 +134,6 @@ int btrfs_lookup_file_extent(struct btrf
- return ret;
- }
-
--#if 0 /* broken */
- int btrfs_lookup_bio_sums(struct btrfs_root *root, struct inode *inode,
- struct bio *bio)
- {
-@@ -151,6 +150,8 @@ int btrfs_lookup_bio_sums(struct btrfs_r
- struct extent_io_tree *io_tree = &BTRFS_I(inode)->io_tree;
-
- path = btrfs_alloc_path();
-+ if (bio->bi_size > PAGE_CACHE_SIZE * 8)
-+ path->reada = 2;
-
- WARN_ON(bio->bi_vcnt <= 0);
-
-@@ -211,7 +212,6 @@ found:
- btrfs_free_path(path);
- return 0;
- }
--#endif
-
- int btrfs_csum_one_bio(struct btrfs_root *root, struct inode *inode,
- struct bio *bio)
-@@ -321,6 +321,7 @@ again:
- file_key.offset = offset;
- btrfs_set_key_type(&file_key, BTRFS_CSUM_ITEM_KEY);
-
-+ mutex_lock(&BTRFS_I(inode)->csum_mutex);
- item = btrfs_lookup_csum(trans, root, path, objectid, offset, 1);
- if (!IS_ERR(item)) {
- leaf = path->nodes[0];
-@@ -367,7 +368,7 @@ again:
- ret = btrfs_search_slot(trans, root, &file_key, path,
- BTRFS_CRC32_SIZE, 1);
- if (ret < 0)
-- goto fail;
-+ goto fail_unlock;
- if (ret == 0) {
- BUG();
- }
-@@ -411,10 +412,10 @@ insert:
- ret = btrfs_insert_empty_item(trans, root, path, &file_key,
- ins_size);
- if (ret < 0)
-- goto fail;
-+ goto fail_unlock;
- if (ret != 0) {
- WARN_ON(1);
-- goto fail;
-+ goto fail_unlock;
- }
- csum:
- leaf = path->nodes[0];
-@@ -427,6 +428,8 @@ found:
- item_end = (struct btrfs_csum_item *)((unsigned char *)item_end +
- btrfs_item_size_nr(leaf, path->slots[0]));
- eb_token = NULL;
-+ mutex_unlock(&BTRFS_I(inode)->csum_mutex);
-+ cond_resched();
- next_sector:
-
- if (!eb_token ||
-@@ -467,13 +470,18 @@ next_sector:
- eb_token = NULL;
- }
- btrfs_mark_buffer_dirty(path->nodes[0]);
-+ cond_resched();
- if (total_bytes < sums->len) {
- btrfs_release_path(root, path);
- goto again;
- }
--fail:
-+out:
- btrfs_free_path(path);
- return ret;
-+
-+fail_unlock:
-+ mutex_unlock(&BTRFS_I(inode)->csum_mutex);
-+ goto out;
- }
-
- int btrfs_csum_truncate(struct btrfs_trans_handle *trans,
-diff -Nurp btrfs-0.16/inode.c btrfs-0.16.new/inode.c
---- btrfs-0.16/inode.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/inode.c 2008-08-20 17:43:19.601409609 -0600
-@@ -389,15 +389,15 @@ int btrfs_submit_bio_hook(struct inode *
- ret = btrfs_bio_wq_end_io(root->fs_info, bio, 0);
- BUG_ON(ret);
-
-- if (!(rw & (1 << BIO_RW))) {
-- goto mapit;
-- }
--
- if (btrfs_test_opt(root, NODATASUM) ||
- btrfs_test_flag(inode, NODATASUM)) {
- goto mapit;
- }
-
-+ if (!(rw & (1 << BIO_RW))) {
-+ btrfs_lookup_bio_sums(root, inode, bio);
-+ goto mapit;
-+ }
- return btrfs_wq_submit_bio(BTRFS_I(inode)->root->fs_info,
- inode, rw, bio, mirror_num,
- __btrfs_submit_bio_hook);
-@@ -415,10 +415,8 @@ static noinline int add_pending_csums(st
- btrfs_set_trans_block_group(trans, inode);
- list_for_each(cur, list) {
- sum = list_entry(cur, struct btrfs_ordered_sum, list);
-- mutex_lock(&BTRFS_I(inode)->csum_mutex);
- btrfs_csum_file_blocks(trans, BTRFS_I(inode)->root,
- inode, sum);
-- mutex_unlock(&BTRFS_I(inode)->csum_mutex);
- }
- return 0;
- }
-@@ -605,58 +603,6 @@ int btrfs_writepage_end_io_hook(struct p
- return btrfs_finish_ordered_io(page->mapping->host, start, end);
- }
-
--int btrfs_readpage_io_hook(struct page *page, u64 start, u64 end)
--{
-- int ret = 0;
-- struct inode *inode = page->mapping->host;
-- struct btrfs_root *root = BTRFS_I(inode)->root;
-- struct extent_io_tree *io_tree = &BTRFS_I(inode)->io_tree;
-- struct btrfs_csum_item *item;
-- struct btrfs_path *path = NULL;
-- u32 csum;
--
-- if (btrfs_test_opt(root, NODATASUM) ||
-- btrfs_test_flag(inode, NODATASUM))
-- return 0;
--
-- /*
-- * It is possible there is an ordered extent that has
-- * not yet finished for this range in the file. If so,
-- * that extent will have a csum cached, and it will insert
-- * the sum after all the blocks in the extent are fully
-- * on disk. So, look for an ordered extent and use the
-- * sum if found. We have to do this before looking in the
-- * btree because csum items are pre-inserted based on
-- * the file size. btrfs_lookup_csum might find an item
-- * that still hasn't been fully filled.
-- */
-- ret = btrfs_find_ordered_sum(inode, start, &csum);
-- if (ret == 0)
-- goto found;
--
-- ret = 0;
-- path = btrfs_alloc_path();
-- item = btrfs_lookup_csum(NULL, root, path, inode->i_ino, start, 0);
-- if (IS_ERR(item)) {
-- ret = PTR_ERR(item);
-- /* a csum that isn't present is a preallocated region. */
-- if (ret == -ENOENT || ret == -EFBIG)
-- ret = 0;
-- csum = 0;
-- printk("no csum found for inode %lu start %Lu\n", inode->i_ino,
-- start);
-- goto out;
-- }
-- read_extent_buffer(path->nodes[0], &csum, (unsigned long)item,
-- BTRFS_CRC32_SIZE);
--found:
-- set_state_private(io_tree, start, csum);
--out:
-- if (path)
-- btrfs_free_path(path);
-- return ret;
--}
--
- struct io_failure_record {
- struct page *page;
- u64 start;
-@@ -1655,8 +1601,20 @@ static int btrfs_setattr(struct dentry *
- btrfs_truncate_page(inode->i_mapping, inode->i_size);
-
- hole_size = block_end - hole_start;
-- btrfs_wait_ordered_range(inode, hole_start, hole_size);
-- lock_extent(io_tree, hole_start, block_end - 1, GFP_NOFS);
-+ while(1) {
-+ struct btrfs_ordered_extent *ordered;
-+ btrfs_wait_ordered_range(inode, hole_start, hole_size);
-+
-+ lock_extent(io_tree, hole_start, block_end - 1, GFP_NOFS);
-+ ordered = btrfs_lookup_ordered_extent(inode, hole_start);
-+ if (ordered) {
-+ unlock_extent(io_tree, hole_start,
-+ block_end - 1, GFP_NOFS);
-+ btrfs_put_ordered_extent(ordered);
-+ } else {
-+ break;
-+ }
-+ }
-
- trans = btrfs_start_transaction(root, 1);
- btrfs_set_trans_block_group(trans, inode);
-@@ -1833,6 +1791,7 @@ static int btrfs_init_locked_inode(struc
- inode->i_ino = args->ino;
- BTRFS_I(inode)->root = args->root;
- BTRFS_I(inode)->delalloc_bytes = 0;
-+ inode->i_mapping->writeback_index = 0;
- BTRFS_I(inode)->disk_i_size = 0;
- BTRFS_I(inode)->index_cnt = (u64)-1;
- extent_map_tree_init(&BTRFS_I(inode)->extent_tree, GFP_NOFS);
-@@ -2239,6 +2198,7 @@ static struct inode *btrfs_new_inode(str
- mutex_init(&BTRFS_I(inode)->csum_mutex);
- mutex_init(&BTRFS_I(inode)->extent_mutex);
- BTRFS_I(inode)->delalloc_bytes = 0;
-+ inode->i_mapping->writeback_index = 0;
- BTRFS_I(inode)->disk_i_size = 0;
- BTRFS_I(inode)->root = root;
-
-@@ -2486,6 +2446,7 @@ static int btrfs_create(struct inode *di
- mutex_init(&BTRFS_I(inode)->extent_mutex);
- BTRFS_I(inode)->delalloc_bytes = 0;
- BTRFS_I(inode)->disk_i_size = 0;
-+ inode->i_mapping->writeback_index = 0;
- BTRFS_I(inode)->io_tree.ops = &btrfs_extent_io_ops;
- btrfs_ordered_inode_tree_init(&BTRFS_I(inode)->ordered_tree);
- }
-@@ -3549,6 +3510,7 @@ static int btrfs_symlink(struct inode *d
- mutex_init(&BTRFS_I(inode)->extent_mutex);
- BTRFS_I(inode)->delalloc_bytes = 0;
- BTRFS_I(inode)->disk_i_size = 0;
-+ inode->i_mapping->writeback_index = 0;
- BTRFS_I(inode)->io_tree.ops = &btrfs_extent_io_ops;
- btrfs_ordered_inode_tree_init(&BTRFS_I(inode)->ordered_tree);
- }
-@@ -3654,7 +3616,6 @@ static struct extent_io_ops btrfs_extent
- .fill_delalloc = run_delalloc_range,
- .submit_bio_hook = btrfs_submit_bio_hook,
- .merge_bio_hook = btrfs_merge_bio_hook,
-- .readpage_io_hook = btrfs_readpage_io_hook,
- .readpage_end_io_hook = btrfs_readpage_end_io_hook,
- .writepage_end_io_hook = btrfs_writepage_end_io_hook,
- .writepage_start_hook = btrfs_writepage_start_hook,
-diff -Nurp btrfs-0.16/transaction.c btrfs-0.16.new/transaction.c
---- btrfs-0.16/transaction.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/transaction.c 2008-08-20 17:43:19.641404933 -0600
-@@ -303,12 +303,12 @@ int btrfs_write_and_wait_transaction(str
- struct btrfs_root *root)
- {
- int ret;
-- int err;
-+ int err = 0;
- int werr = 0;
- struct extent_io_tree *dirty_pages;
- struct page *page;
- struct inode *btree_inode = root->fs_info->btree_inode;
-- u64 start;
-+ u64 start = 0;
- u64 end;
- unsigned long index;
-
-@@ -317,12 +317,13 @@ int btrfs_write_and_wait_transaction(str
- }
- dirty_pages = &trans->transaction->dirty_pages;
- while(1) {
-- ret = find_first_extent_bit(dirty_pages, 0, &start, &end,
-+ ret = find_first_extent_bit(dirty_pages, start, &start, &end,
- EXTENT_DIRTY);
- if (ret)
- break;
-- clear_extent_dirty(dirty_pages, start, end, GFP_NOFS);
- while(start <= end) {
-+ cond_resched();
-+
- index = start >> PAGE_CACHE_SHIFT;
- start = (u64)(index + 1) << PAGE_CACHE_SHIFT;
- page = find_lock_page(btree_inode->i_mapping, index);
-@@ -343,7 +344,30 @@ int btrfs_write_and_wait_transaction(str
- page_cache_release(page);
- }
- }
-- err = filemap_fdatawait(btree_inode->i_mapping);
-+ while(1) {
-+ ret = find_first_extent_bit(dirty_pages, 0, &start, &end,
-+ EXTENT_DIRTY);
-+ if (ret)
-+ break;
-+
-+ clear_extent_dirty(dirty_pages, start, end, GFP_NOFS);
-+ while(start <= end) {
-+ index = start >> PAGE_CACHE_SHIFT;
-+ start = (u64)(index + 1) << PAGE_CACHE_SHIFT;
-+ page = find_get_page(btree_inode->i_mapping, index);
-+ if (!page)
-+ continue;
-+ if (PageDirty(page)) {
-+ lock_page(page);
-+ err = write_one_page(page, 0);
-+ if (err)
-+ werr = err;
-+ }
-+ wait_on_page_writeback(page);
-+ page_cache_release(page);
-+ cond_resched();
-+ }
-+ }
- if (err)
- werr = err;
- return werr;
-diff -Nurp btrfs-0.16/volumes.c btrfs-0.16.new/volumes.c
---- btrfs-0.16/volumes.c 2008-08-05 12:13:37.000000000 -0600
-+++ btrfs-0.16.new/volumes.c 2008-08-20 17:43:19.651405254 -0600
-@@ -138,12 +138,18 @@ int run_scheduled_bios(struct btrfs_devi
- {
- struct bio *pending;
- struct backing_dev_info *bdi;
-+ struct btrfs_fs_info *fs_info;
- struct bio *tail;
- struct bio *cur;
- int again = 0;
- unsigned long num_run = 0;
-+ unsigned long limit;
-
- bdi = device->bdev->bd_inode->i_mapping->backing_dev_info;
-+ fs_info = device->dev_root->fs_info;
-+ limit = btrfs_async_submit_limit(fs_info);
-+ limit = limit * 2 / 3;
-+
- loop:
- spin_lock(&device->io_lock);
-
-@@ -179,7 +185,11 @@ loop:
- cur = pending;
- pending = pending->bi_next;
- cur->bi_next = NULL;
-- atomic_dec(&device->dev_root->fs_info->nr_async_submits);
-+ atomic_dec(&fs_info->nr_async_bios);
-+
-+ if (atomic_read(&fs_info->nr_async_bios) < limit &&
-+ waitqueue_active(&fs_info->async_submit_wait))
-+ wake_up(&fs_info->async_submit_wait);
-
- BUG_ON(atomic_read(&cur->bi_cnt) == 0);
- bio_get(cur);
-@@ -2135,6 +2145,7 @@ int schedule_bio(struct btrfs_root *root
- int rw, struct bio *bio)
- {
- int should_queue = 1;
-+ unsigned long limit;
-
- /* don't bother with additional async steps for reads, right now */
- if (!(rw & (1 << BIO_RW))) {
-@@ -2145,12 +2156,12 @@ int schedule_bio(struct btrfs_root *root
- }
-
- /*
-- * nr_async_sumbits allows us to reliably return congestion to the
-+ * nr_async_bios allows us to reliably return congestion to the
- * higher layers. Otherwise, the async bio makes it appear we have
- * made progress against dirty pages when we've really just put it
- * on a queue for later
- */
-- atomic_inc(&root->fs_info->nr_async_submits);
-+ atomic_inc(&root->fs_info->nr_async_bios);
- WARN_ON(bio->bi_next);
- bio->bi_next = NULL;
- bio->bi_rw |= rw;
-@@ -2171,6 +2182,11 @@ int schedule_bio(struct btrfs_root *root
- if (should_queue)
- btrfs_queue_worker(&root->fs_info->submit_workers,
- &device->work);
-+
-+ limit = btrfs_async_submit_limit(root->fs_info);
-+ wait_event_timeout(root->fs_info->async_submit_wait,
-+ (atomic_read(&root->fs_info->nr_async_bios) < limit),
-+ HZ/10);
- return 0;
- }
-