Skip to content

Commit

Permalink
dax: update I/O path to do proper PMEM flushing
Browse files Browse the repository at this point in the history
Update the DAX I/O path so that all operations that store data (I/O
writes, zeroing blocks, punching holes, etc.) properly synchronize the
stores to media using the PMEM API.  This ensures that the data DAX is
writing is durable on media before the operation completes.

Signed-off-by: Ross Zwisler <ross.zwisler@linux.intel.com>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Dan Williams <dan.j.williams@intel.com>
  • Loading branch information
Ross Zwisler authored and Dan Williams committed Aug 20, 2015
1 parent 5de490d commit 2765cfb
Showing 1 changed file with 25 additions and 14 deletions.
39 changes: 25 additions & 14 deletions fs/dax.c
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,7 @@
#include <linux/memcontrol.h>
#include <linux/mm.h>
#include <linux/mutex.h>
#include <linux/pmem.h>
#include <linux/sched.h>
#include <linux/uio.h>
#include <linux/vmstat.h>
Expand All @@ -46,10 +47,7 @@ int dax_clear_blocks(struct inode *inode, sector_t block, long size)
unsigned pgsz = PAGE_SIZE - offset_in_page(addr);
if (pgsz > count)
pgsz = count;
if (pgsz < PAGE_SIZE)
memset(addr, 0, pgsz);
else
clear_page(addr);
clear_pmem((void __pmem *)addr, pgsz);
addr += pgsz;
size -= pgsz;
count -= pgsz;
Expand All @@ -59,6 +57,7 @@ int dax_clear_blocks(struct inode *inode, sector_t block, long size)
}
} while (size);

wmb_pmem();
return 0;
}
EXPORT_SYMBOL_GPL(dax_clear_blocks);
Expand All @@ -70,15 +69,16 @@ static long dax_get_addr(struct buffer_head *bh, void **addr, unsigned blkbits)
return bdev_direct_access(bh->b_bdev, sector, addr, &pfn, bh->b_size);
}

/* the clear_pmem() calls are ordered by a wmb_pmem() in the caller */
static void dax_new_buf(void *addr, unsigned size, unsigned first, loff_t pos,
loff_t end)
{
loff_t final = end - pos + first; /* The final byte of the buffer */

if (first > 0)
memset(addr, 0, first);
clear_pmem((void __pmem *)addr, first);
if (final < size)
memset(addr + final, 0, size - final);
clear_pmem((void __pmem *)addr + final, size - final);
}

static bool buffer_written(struct buffer_head *bh)
Expand Down Expand Up @@ -108,12 +108,13 @@ static ssize_t dax_io(struct inode *inode, struct iov_iter *iter,
loff_t bh_max = start;
void *addr;
bool hole = false;
bool need_wmb = false;

if (iov_iter_rw(iter) != WRITE)
end = min(end, i_size_read(inode));

while (pos < end) {
unsigned len;
size_t len;
if (pos == max) {
unsigned blkbits = inode->i_blkbits;
sector_t block = pos >> blkbits;
Expand Down Expand Up @@ -145,18 +146,22 @@ static ssize_t dax_io(struct inode *inode, struct iov_iter *iter,
retval = dax_get_addr(bh, &addr, blkbits);
if (retval < 0)
break;
if (buffer_unwritten(bh) || buffer_new(bh))
if (buffer_unwritten(bh) || buffer_new(bh)) {
dax_new_buf(addr, retval, first, pos,
end);
need_wmb = true;
}
addr += first;
size = retval - first;
}
max = min(pos + size, end);
}

if (iov_iter_rw(iter) == WRITE)
len = copy_from_iter_nocache(addr, max - pos, iter);
else if (!hole)
if (iov_iter_rw(iter) == WRITE) {
len = copy_from_iter_pmem((void __pmem *)addr,
max - pos, iter);
need_wmb = true;
} else if (!hole)
len = copy_to_iter(addr, max - pos, iter);
else
len = iov_iter_zero(max - pos, iter);
Expand All @@ -168,6 +173,9 @@ static ssize_t dax_io(struct inode *inode, struct iov_iter *iter,
addr += len;
}

if (need_wmb)
wmb_pmem();

return (pos == start) ? retval : pos - start;
}

Expand Down Expand Up @@ -303,8 +311,10 @@ static int dax_insert_mapping(struct inode *inode, struct buffer_head *bh,
goto out;
}

if (buffer_unwritten(bh) || buffer_new(bh))
clear_page(addr);
if (buffer_unwritten(bh) || buffer_new(bh)) {
clear_pmem((void __pmem *)addr, PAGE_SIZE);
wmb_pmem();
}

error = vm_insert_mixed(vma, vaddr, pfn);

Expand Down Expand Up @@ -542,7 +552,8 @@ int dax_zero_page_range(struct inode *inode, loff_t from, unsigned length,
err = dax_get_addr(&bh, &addr, inode->i_blkbits);
if (err < 0)
return err;
memset(addr + offset, 0, length);
clear_pmem((void __pmem *)addr + offset, length);
wmb_pmem();
}

return 0;
Expand Down

0 comments on commit 2765cfb

Please sign in to comment.