Placeholder pages allow DIO to use locking rules similar to that of writepage. DIO can now fill holes, and it can extend the file via get_block(). i_mutex can be dropped during writes if we are writing inside i_size. Signed-off-by: Chris Mason <chris.mason@xxxxxxxxxx> diff -r 5cd028318654 -r 1a7105ab9c19 fs/direct-io.c --- a/fs/direct-io.c Tue Feb 06 20:02:49 2007 -0500 +++ b/fs/direct-io.c Tue Feb 06 20:02:55 2007 -0500 @@ -1,3 +1,4 @@ + GFP_KERNEL, 1); /* * fs/direct-io.c * @@ -70,6 +71,7 @@ struct dio { int rw; loff_t i_size; /* i_size when submitted */ int lock_type; /* doesn't change */ + int reacquire_i_mutex; /* should we get i_mutex when done? */ unsigned blkbits; /* doesn't change */ unsigned blkfactor; /* When we're using an alignment which is finer than the filesystem's soft @@ -308,6 +310,9 @@ static int dio_complete(struct dio *dio, dio->map_bh.b_private); dio_unlock_page_range(dio); + if (dio->reacquire_i_mutex) + mutex_lock(&dio->inode->i_mutex); + if (ret == 0) ret = dio->page_errors; if (ret == 0) @@ -593,13 +598,8 @@ static int get_more_blocks(struct dio *d map_bh->b_size = fs_count << dio->inode->i_blkbits; create = dio->rw & WRITE; - if (dio->lock_type == DIO_LOCKING) { - if (dio->block_in_file < (i_size_read(dio->inode) >> - dio->blkbits)) - create = 0; - } else if (dio->lock_type == DIO_NO_LOCKING) { + if (dio->lock_type == DIO_NO_LOCKING) create = 0; - } index = fs_startblk >> (PAGE_CACHE_SHIFT - dio->inode->i_blkbits); end = (dio->final_block_in_request >> dio->blkfactor) >> @@ -1289,6 +1289,13 @@ __blockdev_direct_IO(int rw, struct kioc dio->is_async = !is_sync_kiocb(iocb) && !((rw & WRITE) && (end > i_size_read(inode))); + /* if our write is inside i_size, we can drop i_mutex */ + dio->reacquire_i_mutex = 0; + if ((rw & WRITE) && dio_lock_type == DIO_LOCKING && + end <= i_size_read(inode) && is_sync_kiocb(iocb)) { + dio->reacquire_i_mutex = 1; + mutex_unlock(&inode->i_mutex); + } retval = direct_io_worker(rw, iocb, inode, iov, offset, nr_segs, blkbits, get_block, end_io, dio); out: diff -r 5cd028318654 -r 1a7105ab9c19 mm/filemap.c --- a/mm/filemap.c Tue Feb 06 20:02:49 2007 -0500 +++ b/mm/filemap.c Tue Feb 06 20:02:55 2007 -0500 @@ -2840,10 +2840,19 @@ generic_file_direct_IO(int rw, struct ki retval = mapping->a_ops->direct_IO(rw, iocb, iov, offset, nr_segs); if (rw == WRITE && mapping->nrpages) { + int err; pgoff_t end = (offset + write_len - 1) >> PAGE_CACHE_SHIFT; - int err = invalidate_inode_pages2_range(mapping, - offset >> PAGE_CACHE_SHIFT, end); + + /* O_DIRECT is allowed to drop i_mutex, so more data + * could have been dirtied by others. Start io one more + * time + */ + err = filemap_fdatawrite_range(mapping, offset, + offset + write_len - 1); + if (!err) + err = invalidate_inode_pages2_range(mapping, + offset >> PAGE_CACHE_SHIFT, end); if (err) retval = err; } - To unsubscribe from this list: send the line "unsubscribe linux-fsdevel" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html