On Wed, Feb 08, 2017 at 03:09:07PM +0800, Xiong Zhou wrote:
> On Wed, Feb 08, 2017 at 02:56:51PM +0800, Xiong Zhou wrote:
> > On Tue, Feb 07, 2017 at 09:05:21PM -0800, Dan Williams wrote:
> > > On Tue, Feb 7, 2017 at 8:49 PM, Xiong Zhou <[email protected]> wrote:
> > > > On Tue, Feb 07, 2017 at 08:10:14PM -0800, Dan Williams wrote:
> > > >> On Tue, Feb 7, 2017 at 7:51 PM, Xiong Zhou <[email protected]> wrote:
> > > >> > On Fri, Jan 20, 2017 at 12:40:07PM +0800, Xiong Zhou wrote:
> > > >> >> Hi,
> > > >> >>
> > > >> >> At first, I am not sure whether this is an issue.
> > > >> >>
> > > >> >> mmap a file in a DAX mountpoint, open another file
> > > >> >> in a non-DAX mountpoint with O_DIRECT, write the
> > > >> >> mapped area to the other file.
> > > >> >>
> > > >> >> This write succeeds on a pmem ramdisk (e.g. memmap=2G!20G).
> > > >> >> This write fails (Bad address) on nvdimm pmem devices.
> > > >> >> This write fails (Bad address) on a brd-based ramdisk.
> > > >> >>
> > > >> >> If we skip the O_DIRECT flag, all tests pass.
> > > >> >>
> > > >> >> If we write from DAX to DAX, all tests pass.
> > > >> >> If we write from non-DAX to DAX, all tests pass.
> > > >> >>
> > > >> > snip..
> > > >> >
> > > >> > When the test files are initialized with falloc instead of
> > > >> > pwrite (thanks Ross! :), the write call returns success.
> > > >> > However, the following read back into the mmapped area
> > > >> > FAILED the same way:
> > > >> >
> > > >> > return (Bad address) on raw-mode nvdimm device;
> > > >> > return (Success)     on memory-mode nvdimm device;
> > > >> > return (Bad address) on brd based ramdisk.
> > > >> >
> > > >> > Also, this only happens with the O_DIRECT flag on.
> > > >> >
> > > >> > This smells like an issue to me, still looking into why
> > > >> > read can't get that page..
> > > >> >
> > > >>
> > > >> Why does it smell like an issue? Any path that calls get_user_pages()
> > > >
> > > > Because the write call gets its page and succeeds, while read back 
> > > > fails.
> > > > __get_user_pages on the same address first pass, then fail.
> > > 
> > > Ok, I might have misread your description. Can you tell me the exact
> > > reproduction steps so I can give it a try?
> > 
> > Reproducer attached.
> > 

The attachment did not go through, so the reproducer is inlined below.

You need root to run this, assuming your pmem device is /dev/pmem0.

Steps:
  sh test.sh /dev/pmem0

Thanks for your time!

----- test.sh --------------------------------------
#!/bin/bash
# Build t_mmap_dio.c and run it twice against a DAX-mounted XFS created on
# the block device given as $1: once with O_DIRECT on the destination file
# and once with buffered I/O (-b).
#
# WARNING: the device is wiped and reformatted.
#
# Exit status: 0 when both runs pass, 1 on a setup error or a failed run.
[ -z "$1" ] && { echo "$0 <dev>"; exit 1; }

DEV="$1"
MNT=/tbdmnt
SRC="$MNT/ts"           # source file, lives on the DAX mount
DST=/root/td            # destination file, outside the DAX mount
FILESZ=268435456        # bytes preallocated for each test file
IOLEN=16777216          # bytes mapped and transferred by each run
rc=0

# (Re)create both test files, fully preallocated with falloc.
prep_files() {
        rm -f "$SRC" "$DST"
        xfs_io -f -c "falloc 0 $FILESZ" "$SRC" > /dev/null && \
        xfs_io -f -c "falloc 0 $FILESZ" "$DST" > /dev/null
}

# Report a setup error that happened after the mount, undo the mount, exit.
abort_mounted() {
        echo "$1" >&2
        umount "$MNT"
        exit 1
}

# Without a fresh binary the results below would be meaningless.
cc t_mmap_dio.c || { echo "cannot build t_mmap_dio.c" >&2; exit 1; }

mkdir -p "$MNT"
wipefs -af "$DEV" > /dev/null
if ! { mkfs.xfs -fq "$DEV" && mount -o dax "$DEV" "$MNT"; }; then
        # Do not run the tests on a plain directory if the DAX mount failed.
        echo "cannot create/mount a DAX xfs on $DEV" >&2
        exit 1
fi

prep_files || abort_mounted "cannot preallocate test files"
if ./a.out "$SRC" "$DST" "$IOLEN" "$DEV" ; then
        echo dio PASS
else
        echo dio FAIL
        rc=1
fi

prep_files || abort_mounted "cannot preallocate test files"
if ./a.out -b "$SRC" "$DST" "$IOLEN" "$DEV" ; then
        echo buffered IO PASS
else
        echo buffered IO FAIL
        rc=1
fi
umount "$MNT"
exit $rc

--------------------------------------------------------


----- t_mmap_dio.c ----------------------------------
/*
 * This programme was originally written by
 *     Jeff Moyer <[email protected]>
 *
 * Copyright (C) 2016, Red Hat, Inc.
 */
#define _GNU_SOURCE 1
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <sys/mman.h>
#include <libaio.h>
#include <errno.h>
#include <sys/time.h>

/*
 * Print the command-line synopsis to stderr and terminate the process
 * with exit status 1.  Does not return.
 *
 * prog: program name to show in the synopsis.
 *
 * The synopsis lists the optional -b flag, which main() accepts via
 * getopt() to select buffered I/O instead of O_DIRECT.
 */
void usage(char *prog)
{
        fprintf(stderr,
                "usage: %s [-b] <src file> <dest file> <size> <msg>\n",
                prog);
        exit(1);
}

/*
 * Report a failed operation on stderr and terminate the process with
 * exit status 1.  Does not return.
 *
 * op:  name of the operation that failed
 * len: length associated with the operation, printed as-is
 * s:   caller-supplied tag appended to the line
 *
 * The reason text is taken from errno as it stands on entry, so callers
 * must invoke this before anything else can overwrite errno.
 */
void err_exit(char *op, unsigned long len, char *s)
{
        const char *reason = strerror(errno);

        fprintf(stderr, "%s(%s) len %lu %s\n", op, reason, len, s);
        exit(1);
}

/*
 * Exercise I/O between a mmap()ed source file and a destination file.
 *
 * Usage: <prog> [-b] <src file> <dest file> <size> [<msg>]
 *
 *   -b     open the destination without O_DIRECT (buffered I/O);
 *          the default is to open it with O_DIRECT
 *   size   number of bytes to map and transfer, in decimal
 *   msg    free-form tag appended to every error line (empty if omitted)
 *
 * The first <size> bytes of the source are mapped MAP_SHARED, written to
 * the destination, fsync()ed, and then read back from the destination into
 * the same mapping.  Any failing step is reported through err_exit(), which
 * exits with status 1; on success the process exits with status 0.
 */
int main(int argc, char **argv)
{
        int fd, fd2, opt, dio = 1;
        ssize_t nbytes;         /* write()/read() results; int would truncate */
        char *map;
        char *msg;
        char *sfile;
        char *dfile;
        char *end;
        unsigned long len;

        while ((opt = getopt(argc, argv, "b")) != -1) {
                /* Only -b is defined; do not let a typo disable O_DIRECT. */
                if (opt != 'b')
                        usage(basename(argv[0]));
                dio = 0;
        }

        /*
         * Count positional arguments only after option parsing, so that a
         * leading -b cannot make us index past the end of argv.
         */
        if (argc - optind < 3)
                usage(basename(argv[0]));

        sfile = argv[optind];
        dfile = argv[optind + 1];
        /* msg is only used in error output; never hand NULL to "%s". */
        msg = (argc - optind > 3) ? argv[optind + 3] : "";

        errno = 0;      /* strtoul() reports overflow only through errno */
        len = strtoul(argv[optind + 2], &end, 10);
        if (errno == ERANGE)
                err_exit("strtoul", 0, msg);
        if (end == argv[optind + 2] || *end != '\0') {
                errno = EINVAL;
                err_exit("strtoul", 0, msg);
        }

        /* Open source file and mmap */
        fd = open(sfile, O_RDWR, 0644);
        if (fd < 0)
                err_exit("open src", len, msg);

        map = (char *)mmap(NULL, len,
                PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
        if (map == MAP_FAILED)
                err_exit("mmap", len, msg);

        /* Open dest file, with O_DIRECT unless -b was given */
        fd2 = open(dfile, dio ? (O_RDWR|O_DIRECT) : O_RDWR, 0644);
        if (fd2 < 0)
                err_exit("open dest", len, msg);

        /* First, test storing to dest file from source mapping */
        nbytes = write(fd2, map, len);
        if (nbytes < 0 || (unsigned long)nbytes != len)
                err_exit("write", len, msg);

        if (fsync(fd2) != 0)
                err_exit("fsync", len, msg);

        if (lseek(fd2, 0, SEEK_SET) < 0)
                err_exit("lseek", len, msg);

        /* Next, test reading from dest file into source mapping */
        nbytes = read(fd2, map, len);
        if (nbytes < 0 || (unsigned long)nbytes != len)
                err_exit("read", len, msg);

        if (msync(map, len, MS_SYNC) < 0)
                err_exit("msync", len, msg);

        if (munmap(map, len) < 0)
                err_exit("munmap", len, msg);

        if (close(fd) < 0)
                err_exit("close fd", len, msg);

        if (close(fd2) < 0)
                err_exit("close fd2", len, msg);

        return 0;
}

----------------------------------------------
----- my log -------------
sh-4.2# uname -r
4.10.0-rc7-master-f7d6040+
sh-4.2# whoami 
root
sh-4.2# pwd
/root
sh-4.2# sh test.sh /dev/pmem0
dio PASS
buffered IO PASS
sh-4.2# sh test.sh /dev/pmem2
read(Bad address) len 16777216 /dev/pmem2
dio FAIL
buffered IO PASS
sh-4.2# modprobe brd rd_size=$((1*1024*1024))
sh-4.2# sh test.sh /dev/ram0
read(Bad address) len 16777216 /dev/ram0
dio FAIL
buffered IO PASS
sh-4.2# 
sh-4.2# ndctl list
[
  {
    "dev":"namespace1.0",
    "mode":"memory",
    "size":8453619712,
    "uuid":"0013265e-06ff-4397-b62a-3078c1346cbc",
    "blockdev":"pmem1"
  },
  {
    "dev":"namespace3.0",
    "mode":"raw",
    "size":8589934592,
    "blockdev":"pmem3"
  },
  {
    "dev":"namespace0.0",
    "mode":"memory",
    "size":8453619712,
    "uuid":"c31e0719-00b3-4ffd-848c-659a74350ae5",
    "blockdev":"pmem0"
  },
  {
    "dev":"namespace2.0",
    "mode":"raw",
    "size":8589934592,
    "blockdev":"pmem2"
  }
]
sh-4.2#
_______________________________________________
Linux-nvdimm mailing list
[email protected]
https://lists.01.org/mailman/listinfo/linux-nvdimm
_______________________________________________
Linux-nvdimm mailing list
[email protected]
https://lists.01.org/mailman/listinfo/linux-nvdimm

Reply via email to