<!-- MHonArc v2.6.19 -->
<!--X-Subject: [PATCH 41/52] vfs: add basic delayed allocation support -->
<!--X-From-R13: "Furbqber Ff'b" &#60;glgfbNzvg.rqh> -->
<!--X-Date: Sat, 5 Jul 2008 10:38:35 &#45;0700 -->
<!--X-Message-Id: 1215279378&#45;30504&#45;42&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Content-Type: text/plain -->
<!--X-Reference: 1215279378&#45;30504&#45;1&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;2&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;3&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;4&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;5&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;6&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;7&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;8&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;9&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;10&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;11&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;12&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;13&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;14&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;15&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;16&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;17&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;18&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;19&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;20&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;21&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;22&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;23&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;24&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;25&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;26&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;27&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;28&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;29&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;30&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;31&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;32&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;33&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;34&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;35&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;36&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;37&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;38&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;39&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;40&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Reference: 1215279378&#45;30504&#45;41&#45;git&#45;send&#45;email&#45;tytso@mit.edu -->
<!--X-Head-End-->
<!doctype html>
<html lang="en">
<head>
<script async src="//pagead2.googlesyndication.com/pagead/js/adsbygoogle.js"></script>
<script>
     (adsbygoogle = window.adsbygoogle || []).push({
          google_ad_client: "ca-pub-3422782820843221",
          enable_page_level_ads: true
     });
</script>
<meta name="viewport" content="width=device-width, initial-scale=1">
<meta name="description" content="Linux Ext4: [PATCH 41/52] vfs: add basic delayed allocation support">
<style>
<!--
 pre {white-space: pre-wrap;}
-->
</style>
<title>[PATCH 41/52] vfs: add basic delayed allocation support (Linux Ext4)</title>
<link rel="alternate" type="application/rss+xml" title="Linux Ext4" href="//feedproxy.google.com/LinuxExt4">
</head>
<body itemscope itemtype="https://schema.org/Article" vlink="green">
<!--X-Body-Begin-->
<!--X-User-Header-->
<!--X-User-Header-End-->
<!--X-TopPNI-->
<form action="//www.google.com" id="cse-search-box" target="_blank">
  <div>
    <input type="hidden" name="cx" value="partner-pub-3422782820843221:9580497365" />
    <input type="hidden" name="ie" value="UTF-8" />
    <input type="text" name="q" size="55" aria-label="Search the archive" />
    <input type="submit" name="sa" value="Search" />
  </div>
</form>
<script type="text/javascript" src="//www.google.com/coop/cse/brand?form=cse-search-box&amp;lang=en"></script>
<h1 itemprop="name">[PATCH 41/52] vfs: add basic delayed allocation support</h1>
[<a href="msg07652.html">Date Prev</a>][<a href="msg07654.html">Date Next</a>][<a href="msg07618.html">Thread Prev</a>][<a href="msg07654.html">Thread Next</a>][<a href="mail80.html#07653">Date Index</a>][<a href="thrd80.html#07653">Thread Index</a>]


<p>&nbsp;<br>
<script async src="//pagead2.googlesyndication.com/pagead/js/adsbygoogle.js"></script>
<!-- responsive test for archives -->
<ins class="adsbygoogle"
     style="display:block"
     data-ad-client="ca-pub-3422782820843221"
     data-ad-slot="6345952567"
     data-ad-format="auto"></ins>
<script>
(adsbygoogle = window.adsbygoogle || []).push({});
</script>

<!--X-TopPNI-End-->
<!--X-MsgBody-->
<!--X-Subject-Header-Begin-->
<hr>
<!--X-Subject-Header-End-->
<!--X-Head-of-Message-->
<ul>
<li><em>To</em>: Ext4 Developers List &lt;<a href="mailto:linux-ext4@DOMAIN.HIDDEN">linux-ext4@xxxxxxxxxxxxxxx</a>&gt;,   Linux Kernel Developers List &lt;<a href="mailto:linux-kernel@DOMAIN.HIDDEN">linux-kernel@xxxxxxxxxxxxxxx</a>&gt;</li>
<li><em>Subject</em>: [PATCH 41/52] vfs: add basic delayed allocation support</li>
<li><em>From</em>: &quot;Theodore Ts'o&quot; &lt;<a href="mailto:tytso@DOMAIN.HIDDEN">tytso@xxxxxxx</a>&gt;</li>
<li><em>Date</em>: Sat,  5 Jul 2008 13:36:07 -0400</li>
<li><em>Cc</em>: Alex Tomas &lt;<a href="mailto:alex@DOMAIN.HIDDEN">alex@xxxxxxxxxxxxx</a>&gt;, Mingming Cao &lt;<a href="mailto:cmm@DOMAIN.HIDDEN">cmm@xxxxxxxxxx</a>&gt;,   Dave Kleikamp &lt;<a href="mailto:shaggy@DOMAIN.HIDDEN">shaggy@xxxxxxxxxxxxxxxxxx</a>&gt;, &quot;Theodore Ts'o&quot; &lt;<a href="mailto:tytso@DOMAIN.HIDDEN">tytso@xxxxxxx</a>&gt;</li>
<li><em>In-reply-to</em>: &lt;<a href="mailto:1215279378-30504-41-git-send-email-tytso@DOMAIN.HIDDEN">1215279378-30504-41-git-send-email-tytso@xxxxxxx</a>&gt;</li>
</ul>
<!--X-Head-of-Message-End-->
<!--X-Head-Body-Sep-Begin-->
<!-- AddThis Button BEGIN -->
<div class="addthis_toolbox addthis_default_style ">
<a class="addthis_button_preferred_1"></a>
<a class="addthis_button_preferred_2"></a>
<a class="addthis_button_preferred_3"></a>
<a class="addthis_button_preferred_4"></a>
<a class="addthis_button_compact"></a>
<a class="addthis_counter addthis_bubble_style"></a>
</div>
<script type="text/javascript" src="//s7.addthis.com/js/300/addthis_widget.js#pubid=ra-5196c2ae1be43d18&amp;async=1&amp;domready=1"></script>
<!-- AddThis Button END -->
<hr>
<script async src="//pagead2.googlesyndication.com/pagead/js/adsbygoogle.js"></script>
<!-- responsive link 1 -->
<ins class="adsbygoogle"
     style="display:block"
     data-ad-client="ca-pub-3422782820843221"
     data-ad-slot="8681825769"
     data-ad-format="link"></ins>
<script>
(adsbygoogle = window.adsbygoogle || []).push({});
</script>
<p>
<div class="content" itemprop="articleBody">
<!--X-Head-Body-Sep-End-->
<!--X-Body-of-Message-->
<pre>From: Alex Tomas &lt;alex@xxxxxxxxxxxxx&gt;

* block_prepare_write() can be passed a special -&gt;get_block() which
   doesn't allocate blocks, but reserve them and mark bh delayed

* a filesystem can use mpage_da_writepages() with other -&gt;get_block()
  which doesn't defer allocation. mpage_da_writepages() finds all
  non-allocated blocks and try to allocate them with minimal calls
  to -&gt;get_block(), then submit IO using __mpage_writepage()

Updated fix from  Valerie Clement &lt;valerie.clement@xxxxxxxx&gt;
fixes a filesystem corruption issue when the filesystem is
mounted with the delalloc option and blocksize &lt; pagesize.

Updated fix from Mingming Cao &lt;cmm@xxxxxxxxxx&gt; to clear
buffer_delay in block_write_full_page() after allocation to those
delayed buffer.

Signed-off-by: Alex Tomas &lt;alex@xxxxxxxxxxxxx&gt;
Signed-off-by: Mingming Cao &lt;cmm@xxxxxxxxxx&gt;
Signed-off-by: Dave Kleikamp &lt;shaggy@xxxxxxxxxxxxxxxxxx&gt;
Signed-off-by: &quot;Theodore Ts'o&quot; &lt;tytso@xxxxxxx&gt;
---
 fs/buffer.c           |    7 +-
 fs/mpage.c            |  405 +++++++++++++++++++++++++++++++++++++++++++++++++
 include/linux/mpage.h |    2 +
 3 files changed, 412 insertions(+), 2 deletions(-)

diff --git a/fs/buffer.c b/fs/buffer.c
index a413008..7a2d909 100644
--- a/fs/buffer.c
+++ b/fs/buffer.c
@@ -1691,11 +1691,13 @@ static int __block_write_full_page(struct inode *inode, struct page *page,
 			 */
 			clear_buffer_dirty(bh);
 			set_buffer_uptodate(bh);
-		} else if (!buffer_mapped(bh) &amp;&amp; buffer_dirty(bh)) {
+		} else if ((!buffer_mapped(bh) || buffer_delay(bh))
+			    &amp;&amp; buffer_dirty(bh)) {
 			WARN_ON(bh-&gt;b_size != blocksize);
 			err = get_block(inode, block, bh, 1);
 			if (err)
 				goto recover;
+			clear_buffer_delay(bh);
 			if (buffer_new(bh)) {
 				/* blockdev mappings never come here */
 				clear_buffer_new(bh);
@@ -1774,7 +1776,8 @@ recover:
 	bh = head;
 	/* Recovery: lock and submit the mapped buffers */
 	do {
-		if (buffer_mapped(bh) &amp;&amp; buffer_dirty(bh)) {
+		if (buffer_mapped(bh) &amp;&amp; buffer_dirty(bh)
+			&amp;&amp; !buffer_delay(bh)) {
 			lock_buffer(bh);
 			mark_buffer_async_write(bh);
 		} else {
diff --git a/fs/mpage.c b/fs/mpage.c
index 235e4d3..cde7f11 100644
--- a/fs/mpage.c
+++ b/fs/mpage.c
@@ -10,6 +10,8 @@
  *		Initial version
  * 27Jun2002	axboe@xxxxxxx
  *		use bio_add_page() to build bio's just the right size
+ * 26Jul2007	alex@xxxxxxxxxxxxx AKA bzzz
+ *		basic delayed allocation support
  */
 
 #include &lt;linux/kernel.h&gt;
@@ -710,3 +712,406 @@ int mpage_writepage(struct page *page, get_block_t get_block,
 	return ret;
 }
 EXPORT_SYMBOL(mpage_writepage);
+
+/*
+ * Delayed allocation stuff
+ */
+
+struct mpage_da_data {
+	struct inode *inode;
+	struct buffer_head lbh;			/* extent of blocks */
+	unsigned long first_page, next_page;	/* extent of pages */
+	get_block_t *get_block;
+	struct writeback_control *wbc;
+};
+
+
+/*
+ * mpage_da_submit_io - walks through extent of pages and try to write
+ * them with __mpage_writepage()
+ *
+ * @mpd-&gt;inode: inode
+ * @mpd-&gt;first_page: first page of the extent
+ * @mpd-&gt;next_page: page after the last page of the extent
+ * @mpd-&gt;get_block: the filesystem's block mapper function
+ *
+ * By the time mpage_da_submit_io() is called we expect all blocks
+ * to be allocated. this may be wrong if allocation failed.
+ *
+ * As pages are already locked by write_cache_pages(), we can't use it
+ */
+static int mpage_da_submit_io(struct mpage_da_data *mpd)
+{
+	struct address_space *mapping = mpd-&gt;inode-&gt;i_mapping;
+	struct mpage_data mpd_pp = {
+		.bio = NULL,
+		.last_block_in_bio = 0,
+		.get_block = mpd-&gt;get_block,
+		.use_writepage = 1,
+	};
+	int ret = 0, err, nr_pages, i;
+	unsigned long index, end;
+	struct pagevec pvec;
+
+	BUG_ON(mpd-&gt;next_page &lt;= mpd-&gt;first_page);
+
+	pagevec_init(&amp;pvec, 0);
+	index = mpd-&gt;first_page;
+	end = mpd-&gt;next_page - 1;
+
+	while (index &lt;= end) {
+		/* XXX: optimize tail */
+		nr_pages = pagevec_lookup(&amp;pvec, mapping, index, PAGEVEC_SIZE);
+		if (nr_pages == 0)
+			break;
+		for (i = 0; i &lt; nr_pages; i++) {
+			struct page *page = pvec.pages[i];
+
+			index = page-&gt;index;
+			if (index &gt; end)
+				break;
+			index++;
+
+			err = __mpage_writepage(page, mpd-&gt;wbc, &amp;mpd_pp);
+
+			/*
+			 * In error case, we have to continue because
+			 * remaining pages are still locked
+			 * XXX: unlock and re-dirty them?
+			 */
+			if (ret == 0)
+				ret = err;
+		}
+		pagevec_release(&amp;pvec);
+	}
+	if (mpd_pp.bio)
+		mpage_bio_submit(WRITE, mpd_pp.bio);
+
+	return ret;
+}
+
+/*
+ * mpage_put_bnr_to_bhs - walk blocks and assign them actual numbers
+ *
+ * @mpd-&gt;inode - inode to walk through
+ * @exbh-&gt;b_blocknr - first block on a disk
+ * @exbh-&gt;b_size - amount of space in bytes
+ * @logical - first logical block to start assignment with
+ *
+ * the function goes through all passed space and put actual disk
+ * block numbers into buffer heads, dropping BH_Delay
+ */
+static void mpage_put_bnr_to_bhs(struct mpage_da_data *mpd, sector_t logical,
+				 struct buffer_head *exbh)
+{
+	struct inode *inode = mpd-&gt;inode;
+	struct address_space *mapping = inode-&gt;i_mapping;
+	int blocks = exbh-&gt;b_size &gt;&gt; inode-&gt;i_blkbits;
+	sector_t pblock = exbh-&gt;b_blocknr, cur_logical;
+	struct buffer_head *head, *bh;
+	unsigned long index, end;
+	struct pagevec pvec;
+	int nr_pages, i;
+
+	index = logical &gt;&gt; (PAGE_CACHE_SHIFT - inode-&gt;i_blkbits);
+	end = (logical + blocks - 1) &gt;&gt; (PAGE_CACHE_SHIFT - inode-&gt;i_blkbits);
+	cur_logical = index &lt;&lt; (PAGE_CACHE_SHIFT - inode-&gt;i_blkbits);
+
+	pagevec_init(&amp;pvec, 0);
+
+	while (index &lt;= end) {
+		/* XXX: optimize tail */
+		nr_pages = pagevec_lookup(&amp;pvec, mapping, index, PAGEVEC_SIZE);
+		if (nr_pages == 0)
+			break;
+		for (i = 0; i &lt; nr_pages; i++) {
+			struct page *page = pvec.pages[i];
+
+			index = page-&gt;index;
+			if (index &gt; end)
+				break;
+			index++;
+
+			BUG_ON(!PageLocked(page));
+			BUG_ON(PageWriteback(page));
+			BUG_ON(!page_has_buffers(page));
+
+			bh = page_buffers(page);
+			head = bh;
+
+			/* skip blocks out of the range */
+			do {
+				if (cur_logical &gt;= logical)
+					break;
+				cur_logical++;
+			} while ((bh = bh-&gt;b_this_page) != head);
+
+			do {
+				if (cur_logical &gt;= logical + blocks)
+					break;
+
+				if (buffer_delay(bh)) {
+					bh-&gt;b_blocknr = pblock;
+					clear_buffer_delay(bh);
+				} else if (buffer_mapped(bh)) {
+					BUG_ON(bh-&gt;b_blocknr != pblock);
+				}
+
+				cur_logical++;
+				pblock++;
+			} while ((bh = bh-&gt;b_this_page) != head);
+		}
+		pagevec_release(&amp;pvec);
+	}
+}
+
+
+/*
+ * __unmap_underlying_blocks - just a helper function to unmap
+ * set of blocks described by @bh
+ */
+static inline void __unmap_underlying_blocks(struct inode *inode,
+					     struct buffer_head *bh)
+{
+	struct block_device *bdev = inode-&gt;i_sb-&gt;s_bdev;
+	int blocks, i;
+
+	blocks = bh-&gt;b_size &gt;&gt; inode-&gt;i_blkbits;
+	for (i = 0; i &lt; blocks; i++)
+		unmap_underlying_metadata(bdev, bh-&gt;b_blocknr + i);
+}
+
+/*
+ * mpage_da_map_blocks - go through given space
+ *
+ * @mpd-&gt;lbh - bh describing space
+ * @mpd-&gt;get_block - the filesystem's block mapper function
+ *
+ * The function skips space we know is already mapped to disk blocks.
+ *
+ * The function ignores errors -&gt;get_block() returns, thus real
+ * error handling is postponed to __mpage_writepage()
+ */
+static void mpage_da_map_blocks(struct mpage_da_data *mpd)
+{
+	struct buffer_head *lbh = &amp;mpd-&gt;lbh;
+	int err = 0, remain = lbh-&gt;b_size;
+	sector_t next = lbh-&gt;b_blocknr;
+	struct buffer_head new;
+
+	/*
+	 * We consider only non-mapped and non-allocated blocks
+	 */
+	if (buffer_mapped(lbh) &amp;&amp; !buffer_delay(lbh))
+		return;
+
+	while (remain) {
+		new.b_state = lbh-&gt;b_state;
+		new.b_blocknr = 0;
+		new.b_size = remain;
+		err = mpd-&gt;get_block(mpd-&gt;inode, next, &amp;new, 1);
+		if (err) {
+			/*
+			 * Rather than implement own error handling
+			 * here, we just leave remaining blocks
+			 * unallocated and try again with -&gt;writepage()
+			 */
+			break;
+		}
+		BUG_ON(new.b_size == 0);
+
+		if (buffer_new(&amp;new))
+			__unmap_underlying_blocks(mpd-&gt;inode, &amp;new);
+
+		/*
+		 * If blocks are delayed marked, we need to
+		 * put actual blocknr and drop delayed bit
+		 */
+		if (buffer_delay(lbh))
+			mpage_put_bnr_to_bhs(mpd, next, &amp;new);
+
+			/* go for the remaining blocks */
+			next += new.b_size &gt;&gt; mpd-&gt;inode-&gt;i_blkbits;
+			remain -= new.b_size;
+		}
+}
+
+#define BH_FLAGS ((1 &lt;&lt; BH_Uptodate) | (1 &lt;&lt; BH_Mapped) | (1 &lt;&lt; BH_Delay))
+
+/*
+ * mpage_add_bh_to_extent - try to add one more block to extent of blocks
+ *
+ * @mpd-&gt;lbh - extent of blocks
+ * @logical - logical number of the block in the file
+ * @bh - bh of the block (used to access block's state)
+ *
+ * the function is used to collect contig. blocks in same state
+ */
+static void mpage_add_bh_to_extent(struct mpage_da_data *mpd,
+				   sector_t logical, struct buffer_head *bh)
+{
+	struct buffer_head *lbh = &amp;mpd-&gt;lbh;
+	sector_t next;
+
+	next = lbh-&gt;b_blocknr + (lbh-&gt;b_size &gt;&gt; mpd-&gt;inode-&gt;i_blkbits);
+
+	/*
+	 * First block in the extent
+	 */
+	if (lbh-&gt;b_size == 0) {
+		lbh-&gt;b_blocknr = logical;
+		lbh-&gt;b_size = bh-&gt;b_size;
+		lbh-&gt;b_state = bh-&gt;b_state &amp; BH_FLAGS;
+		return;
+	}
+
+	/*
+	 * Can we merge the block to our big extent?
+	 */
+	if (logical == next &amp;&amp; (bh-&gt;b_state &amp; BH_FLAGS) == lbh-&gt;b_state) {
+		lbh-&gt;b_size += bh-&gt;b_size;
+		return;
+	}
+
+	/*
+	 * We couldn't merge the block to our extent, so we
+	 * need to flush current  extent and start new one
+	 */
+	mpage_da_map_blocks(mpd);
+
+	/*
+	 * Now start a new extent
+	 */
+	lbh-&gt;b_size = bh-&gt;b_size;
+	lbh-&gt;b_state = bh-&gt;b_state &amp; BH_FLAGS;
+	lbh-&gt;b_blocknr = logical;
+}
+
+/*
+ * __mpage_da_writepage - finds extent of pages and blocks
+ *
+ * @page: page to consider
+ * @wbc: not used, we just follow rules
+ * @data: context
+ *
+ * The function finds extents of pages and scan them for all blocks.
+ */
+static int __mpage_da_writepage(struct page *page,
+				struct writeback_control *wbc, void *data)
+{
+	struct mpage_da_data *mpd = data;
+	struct inode *inode = mpd-&gt;inode;
+	struct buffer_head *bh, *head, fake;
+	sector_t logical;
+
+	/*
+	 * Can we merge this page to current extent?
+	 */
+	if (mpd-&gt;next_page != page-&gt;index) {
+		/*
+		 * Nope, we can't. So, we map non-allocated blocks
+		 * and start IO on them using __mpage_writepage()
+		 */
+		if (mpd-&gt;next_page != mpd-&gt;first_page) {
+			mpage_da_map_blocks(mpd);
+			mpage_da_submit_io(mpd);
+		}
+
+		/*
+		 * Start next extent of pages ...
+		 */
+		mpd-&gt;first_page = page-&gt;index;
+
+		/*
+		 * ... and blocks
+		 */
+		mpd-&gt;lbh.b_size = 0;
+		mpd-&gt;lbh.b_state = 0;
+		mpd-&gt;lbh.b_blocknr = 0;
+	}
+
+	mpd-&gt;next_page = page-&gt;index + 1;
+	logical = (sector_t) page-&gt;index &lt;&lt;
+		  (PAGE_CACHE_SHIFT - inode-&gt;i_blkbits);
+
+	if (!page_has_buffers(page)) {
+		/*
+		 * There is no attached buffer heads yet (mmap?)
+		 * we treat the page asfull of dirty blocks
+		 */
+		bh = &amp;fake;
+		bh-&gt;b_size = PAGE_CACHE_SIZE;
+		bh-&gt;b_state = 0;
+		set_buffer_dirty(bh);
+		set_buffer_uptodate(bh);
+		mpage_add_bh_to_extent(mpd, logical, bh);
+	} else {
+		/*
+		 * Page with regular buffer heads, just add all dirty ones
+		 */
+		head = page_buffers(page);
+		bh = head;
+		do {
+			BUG_ON(buffer_locked(bh));
+			if (buffer_dirty(bh))
+				mpage_add_bh_to_extent(mpd, logical, bh);
+			logical++;
+		} while ((bh = bh-&gt;b_this_page) != head);
+	}
+
+	return 0;
+}
+
+/*
+ * mpage_da_writepages - walk the list of dirty pages of the given
+ * address space, allocates non-allocated blocks, maps newly-allocated
+ * blocks to existing bhs and issue IO them
+ *
+ * @mapping: address space structure to write
+ * @wbc: subtract the number of written pages from *@wbc-&gt;nr_to_write
+ * @get_block: the filesystem's block mapper function.
+ *
+ * This is a library function, which implements the writepages()
+ * address_space_operation.
+ *
+ * In order to avoid duplication of logic that deals with partial pages,
+ * multiple bio per page, etc, we find non-allocated blocks, allocate
+ * them with minimal calls to -&gt;get_block() and re-use __mpage_writepage()
+ *
+ * It's important that we call __mpage_writepage() only once for each
+ * involved page, otherwise we'd have to implement more complicated logic
+ * to deal with pages w/o PG_lock or w/ PG_writeback and so on.
+ *
+ * See comments to mpage_writepages()
+ */
+int mpage_da_writepages(struct address_space *mapping,
+			struct writeback_control *wbc, get_block_t get_block)
+{
+	struct mpage_da_data mpd;
+	int ret;
+
+	if (!get_block)
+		return generic_writepages(mapping, wbc);
+
+	mpd.wbc = wbc;
+	mpd.inode = mapping-&gt;host;
+	mpd.lbh.b_size = 0;
+	mpd.lbh.b_state = 0;
+	mpd.lbh.b_blocknr = 0;
+	mpd.first_page = 0;
+	mpd.next_page = 0;
+	mpd.get_block = get_block;
+
+	ret = write_cache_pages(mapping, wbc, __mpage_da_writepage, &amp;mpd);
+
+	/*
+	 * Handle last extent of pages
+	 */
+	if (mpd.next_page != mpd.first_page) {
+		mpage_da_map_blocks(&amp;mpd);
+		mpage_da_submit_io(&amp;mpd);
+	}
+
+	return ret;
+}
+EXPORT_SYMBOL(mpage_da_writepages);
diff --git a/include/linux/mpage.h b/include/linux/mpage.h
index 068a0c9..1f67d34 100644
--- a/include/linux/mpage.h
+++ b/include/linux/mpage.h
@@ -18,6 +18,8 @@ int mpage_readpages(struct address_space *mapping, struct list_head *pages,
 int mpage_readpage(struct page *page, get_block_t get_block);
 int mpage_writepages(struct address_space *mapping,
 		struct writeback_control *wbc, get_block_t get_block);
+int mpage_da_writepages(struct address_space *mapping,
+		struct writeback_control *wbc, get_block_t get_block);
 int mpage_writepage(struct page *page, get_block_t *get_block,
 		struct writeback_control *wbc);
 
-- 
1.5.6.rc3.1.g36b7.dirty

--
To unsubscribe from this list: send the line &quot;unsubscribe linux-ext4&quot; in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  <a  rel="nofollow" href="http://vger.kernel.org/majordomo-info.html">http://vger.kernel.org/majordomo-info.html</a>
</pre>
<!--X-Body-of-Message-End-->
<!--X-MsgBody-End-->
<!--X-Follow-Ups-->
</div>
<hr>
<ul><li><strong>Follow-Ups</strong>:
<ul>
<li><strong><a name="07654" href="msg07654.html">[PATCH 42/52] ext4: Add basic delayed allocation support</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
</ul></li></ul>
<!--X-Follow-Ups-End-->
<!--X-References-->
<ul><li><strong>References</strong>:
<ul>
<li><strong><a name="07615" href="msg07615.html">Ext4 patches for the next merge window</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07647" href="msg07647.html">[PATCH 01/52] ext4: fix comments to say &quot;ext4&quot;</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07622" href="msg07622.html">[PATCH 02/52] ext4: start searching for the right extent from the goal group.</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07608" href="msg07608.html">[PATCH 03/52] ext4: Use BUG_ON() instead of BUG()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07621" href="msg07621.html">[PATCH 04/52] ext4: switch to seq_files</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07652" href="msg07652.html">[PATCH 05/52] ext4: improve some code in rb tree part of dir.c</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07614" href="msg07614.html">[PATCH 06/52] ext4: Fix ext4_mb_init_cache return error</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07659" href="msg07659.html">[PATCH 07/52] ext4: add error processing when calling ext4_mb_init_cache in mballoc</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07651" href="msg07651.html">[PATCH 08/52] ext4: miscellaneous error checks and coding cleanups for mballoc</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07658" href="msg07658.html">[PATCH 09/52] ext4: remove double definitions of xattr macros</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07609" href="msg07609.html">[PATCH 10/52] ext4: Rename read_block_bitmap() to ext4_read_block_bitmap()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07642" href="msg07642.html">[PATCH 11/52] ext4: Remove unused variable from ext4_show_options</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07610" href="msg07610.html">[PATCH 12/52] jbd2: Add commit time into the commit block</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07633" href="msg07633.html">[PATCH 13/52] ext4: New inode allocation for FLEX_BG meta-data groups.</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07643" href="msg07643.html">[PATCH 14/52] jbd2: fix race between jbd2_journal_try_to_free_buffers() and jbd2 commit transaction</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07649" href="msg07649.html">[PATCH 15/52] ext4: remove redundant code in ext4_fill_super()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07646" href="msg07646.html">[PATCH 16/52] ext4: remove quota allocation when ext4_mb_new_blocks fails</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07645" href="msg07645.html">[PATCH 17/52] ext4: Update i_disksize properly when allocating from fallocate area.</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07644" href="msg07644.html">[PATCH 18/52] ext4: return error when calling ext4_ext_split failed</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07660" href="msg07660.html">[PATCH 19/52] ext4: Make ext4_ext_find_extent fills ext_path completely</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07650" href="msg07650.html">[PATCH 20/52] ext4: Fix ext4_ext_journal_restart() to reflect errors up to the caller</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07648" href="msg07648.html">[PATCH 21/52] ext4: cleanup never-used magic numbers from htree code</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07641" href="msg07641.html">[PATCH 22/52] ext4: Fix sparse warning</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07655" href="msg07655.html">[PATCH 23/52] ext4: fix ext4_init_block_bitmap() for metablock block group</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07635" href="msg07635.html">[PATCH 24/52] ext4: Use inode preallocation with -o noextents</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07634" href="msg07634.html">[PATCH 25/52] ext4: cleanup block allocator</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07657" href="msg07657.html">[PATCH 26/52] ext4: call blkdev_issue_flush on fsync</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07630" href="msg07630.html">[PATCH 27/52] ext4: mballoc avoid use root reserved blocks for non root allocation</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07629" href="msg07629.html">[PATCH 28/52] ext4: Set journal pointer to NULL when journal is released</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07656" href="msg07656.html">[PATCH 29/52] ext4: use atomic functions to set bh_state</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07639" href="msg07639.html">[PATCH 30/52] ext4: Add missing unlock to an error path in ext4_quota_write()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07624" href="msg07624.html">[PATCH 31/52] ext4: fix online resize with mballoc</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07611" href="msg07611.html">[PATCH 32/52] ext4: Documentation updates.</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07623" href="msg07623.html">[PATCH 33/52] ext4: Use page_mkwrite vma_operations to get mmap write notification.</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07632" href="msg07632.html">[PATCH 34/52] vfs: Move mark_inode_dirty() from under page lock in generic_write_end()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07636" href="msg07636.html">[PATCH 35/52] ext4: Invert the locking order of page_lock and transaction start</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07620" href="msg07620.html">[PATCH 36/52] ext4: Fix lock inversion in ext4_ext_truncate()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07612" href="msg07612.html">[PATCH 37/52] vfs: export filemap_fdatawrite_range()</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07613" href="msg07613.html">[PATCH 38/52] jbd2: Implement data=ordered mode handling via inodes</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07640" href="msg07640.html">[PATCH 39/52] ext4: Use new framework for data=ordered mode in JBD2</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
<li><strong><a name="07618" href="msg07618.html">[PATCH 40/52] jbd2: Remove data=ordered mode support using jbd buffer heads</a></strong>
<ul><li><em>From:</em> Theodore Ts'o</li></ul></li>
</ul></li></ul>
<!--X-References-End-->
<!--X-BotPNI-->
<ul>
<li>Prev by Date:
<strong><a href="msg07652.html">[PATCH 05/52] ext4: improve some code in rb tree part of dir.c</a></strong>
</li>
<li>Next by Date:
<strong><a href="msg07654.html">[PATCH 42/52] ext4: Add basic delayed allocation support</a></strong>
</li>
<li>Previous by thread:
<strong><a href="msg07618.html">[PATCH 40/52] jbd2: Remove data=ordered mode support using jbd buffer heads</a></strong>
</li>
<li>Next by thread:
<strong><a href="msg07654.html">[PATCH 42/52] ext4: Add basic delayed allocation support</a></strong>
</li>
<li>Index(es):
<ul>
<li><a href="mail80.html#07653"><strong>Date</strong></a></li>
<li><a href="thrd80.html#07653"><strong>Thread</strong></a></li>
</ul>
</li>
</ul>

<!--X-BotPNI-End-->
<!--X-User-Footer-->
<center>
<font size=-1>
<a href=/lists/>[Index&nbsp;of&nbsp;Archives]</a>
&nbsp;
&nbsp;
<a href=/lists/reiserfs-devel/>[Reiser&nbsp;Filesystem&nbsp;Development]</a>
&nbsp;
&nbsp;
<a href=/lists/ceph-devel/>[Ceph&nbsp;FS]</a>
&nbsp;
&nbsp;
<a href=/lists/newbies/>[Kernel&nbsp;Newbies]</a>
&nbsp;
&nbsp;
<a href=/lists/security/>[Security]</a>
&nbsp;
&nbsp;
<a href=/lists/netfilter/>[Netfilter]</a>
&nbsp;
&nbsp;
<a href=/lists/bugtraq/>[Bugtraq]</a>
&nbsp;
&nbsp;
<a href=/lists/linux-fsdevel/>[Linux&nbsp;FS]</a>
&nbsp;
&nbsp;
<a href=https://yosemitenews.info/>[Yosemite&nbsp;National&nbsp;Park]</a>
&nbsp;
&nbsp;
<a href=/lists/mips/>[MIPS&nbsp;Linux]</a>
&nbsp;
&nbsp;
<a href=/lists/arm/>[ARM&nbsp;Linux]</a>
&nbsp;
&nbsp;
<a href=/lists/security/>[Linux&nbsp;Security]</a>
&nbsp;
&nbsp;
<a href=/lists/raid/>[Linux&nbsp;RAID]</a>
&nbsp;
&nbsp;
<a href=/lists/samba/>[Samba]</a>
&nbsp;
&nbsp;
<a href=/lists/dm-devel/>[Device&nbsp;Mapper]</a>
&nbsp;
&nbsp;
<a href=/lists/linux-media/>[Linux&nbsp;Media]</a>
</font>
</center>
<hr>
<p>
<div>
<script async src="//pagead2.googlesyndication.com/pagead/js/adsbygoogle.js"></script>
<ins class="adsbygoogle"
     style="display:block"
     data-ad-format="autorelaxed"
     data-ad-client="ca-pub-3422782820843221"
     data-ad-slot="1424524564"></ins>
<script>
     (adsbygoogle = window.adsbygoogle || []).push({});
</script>
</div>
<table width=100%>
<tr>
<td align=left>&nbsp;</td>
<td align=right><a href=/lists/><img src=/button_01.gif border=0 alt="Powered by Linux"></a></td>
</tr>
</table>
<!--X-User-Footer-End-->
<script type="text/javascript"> 
 function initAddThis() {
    addthis.init()
 }
initAddThis();
</script>
<script>
  (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
  (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
  m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
  })(window,document,'script','//www.google-analytics.com/analytics.js','ga');
  ga('create', 'UA-760190-1', 'auto');
  ga('send', 'pageview');
</script>
</body>
</html>