On Tue, Oct 10, 2017 at 03:42:08PM +0800, Eryu Guan wrote: > From: Zheng Liu <wenqing.lz@xxxxxxxxxx> > > In this commit a new test case is added to test that i_size races > don't occur under dio reads/writes. We add a program in /src dir, > which has a writer to issue some append dio writes. Meanwhile it > has a reader in this test to do some dio reads. As we expect, > reader should read nothing or data with 'a'. But it might read some > data with '0'. > > The bug can be reproduced by this test case [1]. > > 1. http://patchwork.ozlabs.org/patch/311761/ > > This ostensibly tests commit: > 9fe55eea7 Fix race when checking i_size on direct i/o read > > Update by Eric Sandeen: > - update to recent xfstests > - update commit log > > Update by Eryu Guan: > - add aio-dio support to the test and add 'aio' group > - add ability to test different alignments > - move test from src/ to src/aio-dio-regress/ > - add .gitignore entry > - rebase against latest xfstests with various minor fixes & cleanups > - update commit log > > Signed-off-by: Zheng Liu <wenqing.lz@xxxxxxxxxx> > Signed-off-by: Eric Sandeen <sandeen@xxxxxxxxxx> > Signed-off-by: Eryu Guan <eguan@xxxxxxxxxx> > --- > v2: > - start background reader in a thread first then start writer only after > reader starts issuing reads > > Confirmed that v2 still reproduces the bug reliably with unpatched > kernel and test passed with v4.14-rc3 kernel. > > Eric's original post > http://www.spinics.net/lists/fstests/msg06978.html > > .gitignore | 1 + > .../aio-dio-append-write-read-race.c | 230 +++++++++++++++++++++ > tests/generic/464 | 75 +++++++ > tests/generic/464.out | 3 + > tests/generic/group | 1 + > 5 files changed, 310 insertions(+) > create mode 100644 src/aio-dio-regress/aio-dio-append-write-read-race.c > create mode 100755 tests/generic/464 > create mode 100644 tests/generic/464.out > ... > diff --git a/src/aio-dio-regress/aio-dio-append-write-read-race.c b/src/aio-dio-regress/aio-dio-append-write-read-race.c > new file mode 100644 > index 000000000000..2956599c1474 > --- /dev/null > +++ b/src/aio-dio-regress/aio-dio-append-write-read-race.c > @@ -0,0 +1,230 @@ ... > +static void *reader(void *arg) > +{ > + struct io_data *data = (struct io_data *)arg; > + int ret; > + > + memset(data->buf, 'b', data->blksize); > + do { > + ret = pread(data->fd, data->buf, data->blksize, data->offset); > + if (ret < 0) > + perror("read file"); > + if (!reader_ready) > + reader_ready = 1; Hmm, this looks potentially racy with the associated reader_ready = 0 down in writer(). Once writer() executes, suppose it resets reader_read, then reader() reads the data, resets reader_ready = 1 and exits. ISTM reader_ready would incorrectly == 1 the next time around the loop. I think it's fine to set reader_ready = 1 after the memset(). Then just reinit it to 0 in main() before the reader thread is started (instead of down in writer())..? Brian > + } while (ret <= 0); > + > + return NULL; > +} > + > +static void *writer(struct io_data *data) > +{ > + int ret; > + > + while (!reader_ready) > + usleep(1); > + > + if (data->use_aio) { > + struct io_context *ctx = NULL; > + struct io_event evs[1]; > + struct iocb iocb; > + struct iocb *iocbs[] = { &iocb }; > + > + ret = io_setup(1, &ctx); > + if (ret) { > + fprintf(stderr, "error %s during io_setup\n", > + strerror(ret)); > + return NULL; > + } > + io_prep_pwrite(&iocb, data->fd, data->buf, data->blksize, data->offset); > + ret = io_submit(ctx, 1, iocbs); > + if (ret != 1) { > + fprintf(stderr, "error %s during io_submit\n", > + strerror(ret)); > + return NULL; > + } > + ret = io_getevents(ctx, 1, 1, evs, NULL); > + if (ret != 1) { > + fprintf(stderr, "error %s during io_getevents\n", > + strerror(ret)); > + return NULL; > + } > + } else { > + ret = pwrite(data->fd, data->buf, data->blksize, data->offset); > + if (ret < 0) > + perror("write file failed"); > + } > + > + reader_ready = 0; > + return NULL; > +} > + > +int main(int argc, char *argv[]) > +{ > + pthread_t tid; > + struct io_data wdata; > + struct io_data rdata; > + size_t max_blocks = 128; /* 128 */ > + size_t blksize = 1 * 1024 * 1024; /* 1M */ > + char *rbuf = NULL, *wbuf = NULL; > + int rfd = 0, wfd = 0; > + int i, j, c; > + int use_aio = 1; > + int ret = 0; > + int io_align = 4096; > + char *prog; > + char *testfile; > + > + > + prog = basename(argv[0]); > + > + while ((c = getopt(argc, argv, "a:d")) != -1) { > + switch (c) { > + case 'a': > + io_align = strtol(optarg, NULL, 0); > + break; > + case 'd': > + use_aio = 0; > + break; > + default: > + usage(prog); > + } > + } > + if (optind != argc - 1) > + usage(prog); > + testfile = argv[optind]; > + > + wfd = open(testfile, O_CREAT|O_DIRECT|O_WRONLY|O_TRUNC, 0644); > + if (wfd < 0) { > + perror("open for write"); > + exit(1); > + } > + > + rfd = open(testfile, O_DIRECT|O_RDONLY, 0644); > + if (rfd < 0) { > + perror("open for read"); > + ret = 1; > + goto err; > + } > + > + ret = posix_memalign((void **)&wbuf, io_align, blksize); > + if (ret) { > + fprintf(stderr, "failed to alloc memory: %s\n", strerror(ret)); > + ret = 1; > + goto err; > + } > + > + ret = posix_memalign((void **)&rbuf, io_align, blksize); > + if (ret) { > + fprintf(stderr, "failed to alloc memory: %s\n", strerror(ret)); > + ret = 1; > + goto err; > + } > + > + memset(wbuf, 'a', blksize); > + wdata.fd = wfd; > + wdata.blksize = blksize; > + wdata.buf = wbuf; > + wdata.use_aio = use_aio; > + rdata.fd = rfd; > + rdata.blksize = blksize; > + rdata.buf = rbuf; > + > + for (i = 0; i < max_blocks; i++) { > + wdata.offset = rdata.offset = i * blksize; > + > + ret = pthread_create(&tid, NULL, reader, &rdata); > + if (ret) { > + fprintf(stderr, "create reader thread failed: %s\n", > + strerror(ret)); > + ret = 1; > + goto err; > + } > + > + writer(&wdata); > + > + ret = pthread_join(tid, NULL); > + if (ret) { > + fprintf(stderr, "pthread join reader failed: %s\n", > + strerror(ret)); > + ret = 1; > + goto err; > + } > + > + for (j = 0; j < blksize; j++) { > + if (rdata.buf[j] != 'a') { > + fprintf(stderr, "encounter an error: " > + "block %d offset %d, content %x\n", > + i, j, rbuf[j]); > + ret = 1; > + goto err; > + } > + } > + } > + > +err: > + if (rfd) > + close(rfd); > + if (wfd) > + close(wfd); > + if (rbuf) > + free(rbuf); > + if (wbuf) > + free(wbuf); > + > + exit(ret); > +} > diff --git a/tests/generic/464 b/tests/generic/464 > new file mode 100755 > index 000000000000..b0423c91a7cf > --- /dev/null > +++ b/tests/generic/464 > @@ -0,0 +1,75 @@ > +#! /bin/bash > +# FS QA Test No. 464 > +# > +# Test i_size is updated properly under dio read/write > +# > +#----------------------------------------------------------------------- > +# Copyright (c) 2013 Alibaba Group. All Rights Reserved. > +# Copyright (c) 2017 Red Hat Inc. All Rights Reserved. > +# > +# This program is free software; you can redistribute it and/or > +# modify it under the terms of the GNU General Public License as > +# published by the Free Software Foundation. > +# > +# This program is distributed in the hope that it would be useful, > +# but WITHOUT ANY WARRANTY; without even the implied warranty of > +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the > +# GNU General Public License for more details. > +# > +# You should have received a copy of the GNU General Public License > +# along with this program; if not, write the Free Software Foundation, > +# Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA > +#----------------------------------------------------------------------- > +# > + > +seq=`basename $0` > +seqres=$RESULT_DIR/$seq > +echo "QA output created by $seq" > + > +here=`pwd` > +tmp=/tmp/$$ > +status=1 # failure is the default! > +trap "_cleanup; exit \$status" 0 1 2 3 15 > + > +_cleanup() > +{ > + cd / > + rm -f $tmp.* $testfile.* > +} > + > +# get standard environment, filters and checks > +. ./common/rc > +. ./common/filter > + > +# real QA test starts here > +_supported_fs generic > +_supported_os Linux > + > +_require_aiodio aio-dio-append-write-read-race > +_require_test_program "feature" > + > +testfile=$TEST_DIR/$seq.$$ > +min_dio_align=`_min_dio_alignment $TEST_DEV` > +page_size=`$here/src/feature -s` > + > +rm -f $seqres.full > + > +echo "non-aio dio test" > +align=$min_dio_align > +while [ $align -le $page_size ]; do > + echo "$AIO_TEST -a $align -d $testfile.$align" >> $seqres.full > + $AIO_TEST -a $align -d $testfile.$align 2>&1 | tee -a $seqres.full > + align=$((align * 2)) > +done > + > +echo "aio-dio test" > +align=$min_dio_align > +while [ $align -le $page_size ]; do > + echo "$AIO_TEST -a $align $testfile.$align" >> $seqres.full > + $AIO_TEST -a $align $testfile.$align 2>&1 | tee -a $seqres.full > + align=$((align * 2)) > +done > + > +# success, all done > +status=0 > +exit > diff --git a/tests/generic/464.out b/tests/generic/464.out > new file mode 100644 > index 000000000000..14e66fe7d778 > --- /dev/null > +++ b/tests/generic/464.out > @@ -0,0 +1,3 @@ > +QA output created by 464 > +non-aio dio test > +aio-dio test > diff --git a/tests/generic/group b/tests/generic/group > index 9f173e7a63c9..556add16286b 100644 > --- a/tests/generic/group > +++ b/tests/generic/group > @@ -466,3 +466,4 @@ > 461 auto shutdown stress > 462 auto quick dax > 463 auto rw > +464 auto rw quick aio > -- > 2.13.6 > > -- > To unsubscribe from this list: send the line "unsubscribe fstests" in > the body of a message to majordomo@xxxxxxxxxxxxxxx > More majordomo info at http://vger.kernel.org/majordomo-info.html -- To unsubscribe from this list: send the line "unsubscribe linux-xfs" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html