Re: [PATCH] Btrfs: set page->private to the eb

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On 03/09/2012 02:37 AM, Josef Bacik wrote:
> We spend a lot of time looking up extent buffers from pages when we could just
> store the pointer to the eb the page is associated with in page->private.  This
> patch does just that, and it makes things a little simpler and reduces a bit of
> CPU overhead involved with doing metadata IO.  Thanks,
> 

Hi Josef,

This is not against the normal branch, so we must inform people that. :)

Have a quick look, and I guess it is for "Btrfs: allow metadata blocks larger than the page size", isn't it?

thanks,
liubo

> Signed-off-by: Josef Bacik <josef@xxxxxxxxxx>
> ---
>  fs/btrfs/disk-io.c   |   92 ++++++++++++-------------------------------------
>  fs/btrfs/extent_io.c |   92 ++++++++++++++++++++++++++++++++++++-------------
>  fs/btrfs/extent_io.h |    1 +
>  3 files changed, 91 insertions(+), 94 deletions(-)
> 
> diff --git a/fs/btrfs/disk-io.c b/fs/btrfs/disk-io.c
> index 33114bc..6f97129 100644
> --- a/fs/btrfs/disk-io.c
> +++ b/fs/btrfs/disk-io.c
> @@ -403,39 +403,28 @@ static int csum_dirty_buffer(struct btrfs_root *root, struct page *page)
>  	struct extent_io_tree *tree;
>  	u64 start = (u64)page->index << PAGE_CACHE_SHIFT;
>  	u64 found_start;
> -	unsigned long len;
>  	struct extent_buffer *eb;
>  
>  	tree = &BTRFS_I(page->mapping->host)->io_tree;
>  
> -	if (page->private == EXTENT_PAGE_PRIVATE)
> -		goto out;
> -	if (!page->private) {
> -		WARN_ON(1);
> -		goto out;
> -	}
> -	len = page->private >> 2;
> -	WARN_ON(len == 0);
> -
> -	eb = find_extent_buffer(tree, start, len);
> +	eb = (struct extent_buffer *)page->private;
> +	if (page != eb->pages[0])
> +		return 0;
>  
>  	found_start = btrfs_header_bytenr(eb);
>  	if (found_start != start) {
>  		WARN_ON(1);
> -		goto err;
> +		return 0;
>  	}
>  	if (eb->pages[0] != page) {
>  		WARN_ON(1);
> -		goto err;
> +		return 0;
>  	}
>  	if (!PageUptodate(page)) {
>  		WARN_ON(1);
> -		goto err;
> +		return 0;
>  	}
>  	csum_tree_block(root, eb, 0);
> -err:
> -	free_extent_buffer(eb);
> -out:
>  	return 0;
>  }
>  
> @@ -566,7 +555,6 @@ static int btree_readpage_end_io_hook(struct page *page, u64 start, u64 end,
>  	struct extent_io_tree *tree;
>  	u64 found_start;
>  	int found_level;
> -	unsigned long len;
>  	struct extent_buffer *eb;
>  	struct btrfs_root *root = BTRFS_I(page->mapping->host)->root;
>  	int ret = 0;
> @@ -576,13 +564,8 @@ static int btree_readpage_end_io_hook(struct page *page, u64 start, u64 end,
>  		goto out;
>  
>  	tree = &BTRFS_I(page->mapping->host)->io_tree;
> -	len = page->private >> 2;
> +	eb = (struct extent_buffer *)page->private;
>  
> -	eb = find_eb_for_page(tree, page, max(root->leafsize, root->nodesize));
> -	if (!eb) {
> -		ret = -EIO;
> -		goto out;
> -	}
>  	reads_done = atomic_dec_and_test(&eb->pages_reading);
>  	if (!reads_done)
>  		goto err;
> @@ -631,7 +614,6 @@ err:
>  
>  	if (ret && eb)
>  		clear_extent_buffer_uptodate(tree, eb, NULL);
> -	free_extent_buffer(eb);
>  out:
>  	return ret;
>  }
> @@ -640,31 +622,17 @@ static int btree_io_failed_hook(struct bio *failed_bio,
>  			 struct page *page, u64 start, u64 end,
>  			 int mirror_num, struct extent_state *state)
>  {
> -	struct extent_io_tree *tree;
> -	unsigned long len;
>  	struct extent_buffer *eb;
>  	struct btrfs_root *root = BTRFS_I(page->mapping->host)->root;
>  
> -	tree = &BTRFS_I(page->mapping->host)->io_tree;
> -	if (page->private == EXTENT_PAGE_PRIVATE)
> -		goto out;
> -	if (!page->private)
> -		goto out;
> -
> -	len = page->private >> 2;
> -	WARN_ON(len == 0);
> -
> -	eb = alloc_extent_buffer(tree, start, len);
> -	if (eb == NULL)
> -		goto out;
> +	eb = (struct extent_buffer *)page->private;
> +	if (page != eb->pages[0])
> +		return -EIO;
>  
>  	if (test_bit(EXTENT_BUFFER_READAHEAD, &eb->bflags)) {
>  		clear_bit(EXTENT_BUFFER_READAHEAD, &eb->bflags);
>  		btree_readahead_hook(root, eb, eb->start, -EIO);
>  	}
> -	free_extent_buffer(eb);
> -
> -out:
>  	return -EIO;	/* we fixed nothing */
>  }
>  
> @@ -955,10 +923,8 @@ static int btree_readpage(struct file *file, struct page *page)
>  
>  static int btree_releasepage(struct page *page, gfp_t gfp_flags)
>  {
> -	struct extent_io_tree *tree;
>  	struct extent_map_tree *map;
> -	struct extent_buffer *eb;
> -	struct btrfs_root *root;
> +	struct extent_io_tree *tree;
>  	int ret;
>  
>  	if (PageWriteback(page) || PageDirty(page))
> @@ -967,26 +933,11 @@ static int btree_releasepage(struct page *page, gfp_t gfp_flags)
>  	tree = &BTRFS_I(page->mapping->host)->io_tree;
>  	map = &BTRFS_I(page->mapping->host)->extent_tree;
>  
> -	root = BTRFS_I(page->mapping->host)->root;
> -	if (page->private == EXTENT_PAGE_PRIVATE) {
> -		eb = find_eb_for_page(tree, page, max(root->leafsize, root->nodesize));
> -		free_extent_buffer(eb);
> -		if (eb)
> -			return 0;
> -	}
> -
>  	ret = try_release_extent_state(map, tree, page, gfp_flags);
>  	if (!ret)
>  		return 0;
>  
> -	ret = try_release_extent_buffer(tree, page);
> -	if (ret == 1) {
> -		ClearPagePrivate(page);
> -		set_page_private(page, 0);
> -		page_cache_release(page);
> -	}
> -
> -	return ret;
> +	return try_release_extent_buffer(tree, page);
>  }
>  
>  static void btree_invalidatepage(struct page *page, unsigned long offset)
> @@ -3173,17 +3124,21 @@ static int btree_lock_page_hook(struct page *page, void *data,
>  {
>  	struct inode *inode = page->mapping->host;
>  	struct btrfs_root *root = BTRFS_I(inode)->root;
> -	struct extent_io_tree *io_tree = &BTRFS_I(inode)->io_tree;
>  	struct extent_buffer *eb;
> -	unsigned long len;
> -	u64 bytenr = page_offset(page);
>  
> -	if (page->private == EXTENT_PAGE_PRIVATE)
> +	/*
> +	 * We culled this eb but the page is still hanging out on the mapping,
> +	 * carry on.
> +	 */
> +	if (!PagePrivate(page))
>  		goto out;
>  
> -	len = page->private >> 2;
> -	eb = find_extent_buffer(io_tree, bytenr, len);
> -	if (!eb)
> +	eb = (struct extent_buffer *)page->private;
> +	if (!eb) {
> +		WARN_ON(1);
> +		goto out;
> +	}
> +	if (page != eb->pages[0])
>  		goto out;
>  
>  	if (!btrfs_try_tree_write_lock(eb)) {
> @@ -3202,7 +3157,6 @@ static int btree_lock_page_hook(struct page *page, void *data,
>  	}
>  
>  	btrfs_tree_unlock(eb);
> -	free_extent_buffer(eb);
>  out:
>  	if (!trylock_page(page)) {
>  		flush_fn(data);
> diff --git a/fs/btrfs/extent_io.c b/fs/btrfs/extent_io.c
> index d4795fc..197595a 100644
> --- a/fs/btrfs/extent_io.c
> +++ b/fs/btrfs/extent_io.c
> @@ -2462,19 +2462,24 @@ static int submit_extent_page(int rw, struct extent_io_tree *tree,
>  	return ret;
>  }
>  
> -void set_page_extent_mapped(struct page *page)
> +void attach_extent_buffer_page(struct extent_buffer *eb, struct page *page)
>  {
>  	if (!PagePrivate(page)) {
>  		SetPagePrivate(page);
>  		page_cache_get(page);
> -		set_page_private(page, EXTENT_PAGE_PRIVATE);
> +		set_page_private(page, (unsigned long)eb);
> +	} else {
> +		WARN_ON(page->private != (unsigned long)eb);
>  	}
>  }
>  
> -static void set_page_extent_head(struct page *page, unsigned long len)
> +void set_page_extent_mapped(struct page *page)
>  {
> -	WARN_ON(!PagePrivate(page));
> -	set_page_private(page, EXTENT_PAGE_PRIVATE_FIRST_PAGE | len << 2);
> +	if (!PagePrivate(page)) {
> +		SetPagePrivate(page);
> +		page_cache_get(page);
> +		set_page_private(page, EXTENT_PAGE_PRIVATE);
> +	}
>  }
>  
>  /*
> @@ -3567,6 +3572,7 @@ static struct extent_buffer *__alloc_extent_buffer(struct extent_io_tree *tree,
>  		return NULL;
>  	eb->start = start;
>  	eb->len = len;
> +	eb->tree = tree;
>  	rwlock_init(&eb->lock);
>  	atomic_set(&eb->write_locks, 0);
>  	atomic_set(&eb->read_locks, 0);
> @@ -3619,8 +3625,31 @@ static void btrfs_release_extent_buffer_page(struct extent_buffer *eb,
>  	do {
>  		index--;
>  		page = extent_buffer_page(eb, index);
> -		if (page)
> +		if (page) {
> +			spin_lock(&page->mapping->private_lock);
> +			/*
> +			 * We do this since we'll remove the pages after we've
> +			 * removed the eb from the radix tree, so we could race
> +			 * and have this page now attached to the new eb.  So
> +			 * only clear page_private if it's still connected to
> +			 * this eb.
> +			 */
> +			if (PagePrivate(page) &&
> +			    page->private == (unsigned long)eb) {
> +				/*
> +				 * We need to make sure we haven't be attached
> +				 * to a new eb.
> +				 */
> +				ClearPagePrivate(page);
> +				set_page_private(page, 0);
> +				/* One for the page private */
> +				page_cache_release(page);
> +			}
> +			spin_unlock(&page->mapping->private_lock);
> +
> +			/* One for when we alloced the page */
>  			page_cache_release(page);
> +		}
>  	} while (index != start_idx);
>  }
>  
> @@ -3665,6 +3694,32 @@ struct extent_buffer *alloc_extent_buffer(struct extent_io_tree *tree,
>  			WARN_ON(1);
>  			goto free_eb;
>  		}
> +
> +		spin_lock(&mapping->private_lock);
> +		if (PagePrivate(p)) {
> +			/*
> +			 * We could have already allocated an eb for this page
> +			 * and attached one so lets see if we can get a ref on
> +			 * the existing eb, and if we can we know it's good and
> +			 * we can just return that one, else we know we can just
> +			 * overwrite page->private.
> +			 */
> +			exists = (struct extent_buffer *)p->private;
> +			if (atomic_inc_not_zero(&exists->refs)) {
> +				spin_unlock(&mapping->private_lock);
> +				unlock_page(p);
> +				goto free_eb;
> +			}
> +
> +			/* 
> +			 * Do this so attach doesn't complain and we need to
> +			 * drop the ref the old guy had.
> +			 */
> +			ClearPagePrivate(p);
> +			page_cache_release(p);
> +		}
> +		attach_extent_buffer_page(eb, p);
> +		spin_unlock(&mapping->private_lock);
>  		mark_page_accessed(p);
>  		eb->pages[i] = p;
>  		if (!PageUptodate(p))
> @@ -3687,7 +3742,6 @@ struct extent_buffer *alloc_extent_buffer(struct extent_io_tree *tree,
>  	if (ret == -EEXIST) {
>  		exists = radix_tree_lookup(&tree->buffer,
>  						start >> PAGE_CACHE_SHIFT);
> -		/* add one reference for the caller */
>  		atomic_inc(&exists->refs);
>  		spin_unlock(&tree->buffer_lock);
>  		radix_tree_preload_end();
> @@ -3707,12 +3761,9 @@ struct extent_buffer *alloc_extent_buffer(struct extent_io_tree *tree,
>  	 * after the extent buffer is in the radix tree so
>  	 * it doesn't get lost
>  	 */
> -	set_page_extent_mapped(eb->pages[0]);
> -	set_page_extent_head(eb->pages[0], eb->len);
>  	SetPageChecked(eb->pages[0]);
>  	for (i = 1; i < num_pages; i++) {
>  		p = extent_buffer_page(eb, i);
> -		set_page_extent_mapped(p);
>  		ClearPageChecked(p);
>  		unlock_page(p);
>  	}
> @@ -3776,10 +3827,6 @@ int clear_extent_buffer_dirty(struct extent_io_tree *tree,
>  		lock_page(page);
>  		WARN_ON(!PagePrivate(page));
>  
> -		set_page_extent_mapped(page);
> -		if (i == 0)
> -			set_page_extent_head(page, eb->len);
> -
>  		clear_page_dirty_for_io(page);
>  		spin_lock_irq(&page->mapping->tree_lock);
>  		if (!PageDirty(page)) {
> @@ -3991,9 +4038,6 @@ int read_extent_buffer_pages(struct extent_io_tree *tree,
>  	atomic_set(&eb->pages_reading, num_reads);
>  	for (i = start_i; i < num_pages; i++) {
>  		page = extent_buffer_page(eb, i);
> -		set_page_extent_mapped(page);
> -		if (i == 0)
> -			set_page_extent_head(page, eb->len);
>  		if (!PageUptodate(page)) {
>  			ClearPageError(page);
>  			err = __extent_read_full_page(tree, page,
> @@ -4376,22 +4420,19 @@ static inline void btrfs_release_extent_buffer_rcu(struct rcu_head *head)
>  	struct extent_buffer *eb =
>  			container_of(head, struct extent_buffer, rcu_head);
>  
> -	btrfs_release_extent_buffer(eb);
> +	__free_extent_buffer(eb);
>  }
>  
>  int try_release_extent_buffer(struct extent_io_tree *tree, struct page *page)
>  {
>  	u64 start = page_offset(page);
> -	struct extent_buffer *eb;
> +	struct extent_buffer *eb = (struct extent_buffer *)page->private;
>  	int ret = 1;
>  
> -	spin_lock(&tree->buffer_lock);
> -	eb = radix_tree_lookup(&tree->buffer, start >> PAGE_CACHE_SHIFT);
> -	if (!eb) {
> -		spin_unlock(&tree->buffer_lock);
> -		return ret;
> -	}
> +	if (!PagePrivate(page) || !eb)
> +		return 1;
>  
> +	spin_lock(&tree->buffer_lock);
>  	if (atomic_read(&eb->refs) > 1 ||
>  	    test_bit(EXTENT_BUFFER_DIRTY, &eb->bflags)) {
>  		ret = 0;
> @@ -4407,6 +4448,7 @@ int try_release_extent_buffer(struct extent_io_tree *tree, struct page *page)
>  		goto out;
>  	}
>  	radix_tree_delete(&tree->buffer, start >> PAGE_CACHE_SHIFT);
> +	btrfs_release_extent_buffer_page(eb, 0);
>  out:
>  	spin_unlock(&tree->buffer_lock);
>  
> diff --git a/fs/btrfs/extent_io.h b/fs/btrfs/extent_io.h
> index 9b6c8f3..f030a2d 100644
> --- a/fs/btrfs/extent_io.h
> +++ b/fs/btrfs/extent_io.h
> @@ -127,6 +127,7 @@ struct extent_buffer {
>  	unsigned long map_start;
>  	unsigned long map_len;
>  	unsigned long bflags;
> +	struct extent_io_tree *tree;
>  	atomic_t refs;
>  	atomic_t pages_reading;
>  	struct list_head leak_list;

--
To unsubscribe from this list: send the line "unsubscribe linux-btrfs" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html


[Index of Archives]     [Linux Filesystem Development]     [Linux NFS]     [Linux NILFS]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux