Skip to content

Commit 11e63f6

Browse files
committed
x86, pmem: fix broken __copy_user_nocache cache-bypass assumptions
Before we rework the "pmem api" to stop abusing __copy_user_nocache() for memcpy_to_pmem() we need to fix cases where we may strand dirty data in the cpu cache. The problem occurs when copy_from_iter_pmem() is used for arbitrary data transfers from userspace. There is no guarantee that these transfers, performed by dax_iomap_actor(), will have aligned destinations or aligned transfer lengths. Backstop the usage __copy_user_nocache() with explicit cache management in these unaligned cases. Yes, copy_from_iter_pmem() is now too big for an inline, but addressing that is saved for a later patch that moves the entirety of the "pmem api" into the pmem driver directly. Fixes: 5de490d ("pmem: add copy_from_iter_pmem() and clear_pmem()") Cc: <stable@vger.kernel.org> Cc: <x86@kernel.org> Cc: Jan Kara <jack@suse.cz> Cc: Jeff Moyer <jmoyer@redhat.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Christoph Hellwig <hch@lst.de> Cc: "H. Peter Anvin" <hpa@zytor.com> Cc: Al Viro <viro@zeniv.linux.org.uk> Cc: Thomas Gleixner <tglx@linutronix.de> Cc: Matthew Wilcox <mawilcox@microsoft.com> Reviewed-by: Ross Zwisler <ross.zwisler@linux.intel.com> Signed-off-by: Toshi Kani <toshi.kani@hpe.com> Signed-off-by: Dan Williams <dan.j.williams@intel.com>
1 parent 956a4cd commit 11e63f6

File tree

1 file changed

+31
-11
lines changed

1 file changed

+31
-11
lines changed

arch/x86/include/asm/pmem.h

Lines changed: 31 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,8 @@ static inline int arch_memcpy_from_pmem(void *dst, const void *src, size_t n)
5555
* @size: number of bytes to write back
5656
*
5757
* Write back a cache range using the CLWB (cache line write back)
58-
* instruction.
58+
* instruction. Note that @size is internally rounded up to be cache
59+
* line size aligned.
5960
*/
6061
static inline void arch_wb_cache_pmem(void *addr, size_t size)
6162
{
@@ -69,15 +70,6 @@ static inline void arch_wb_cache_pmem(void *addr, size_t size)
6970
clwb(p);
7071
}
7172

72-
/*
73-
* copy_from_iter_nocache() on x86 only uses non-temporal stores for iovec
74-
* iterators, so for other types (bvec & kvec) we must do a cache write-back.
75-
*/
76-
static inline bool __iter_needs_pmem_wb(struct iov_iter *i)
77-
{
78-
return iter_is_iovec(i) == false;
79-
}
80-
8173
/**
8274
* arch_copy_from_iter_pmem - copy data from an iterator to PMEM
8375
* @addr: PMEM destination address
@@ -94,7 +86,35 @@ static inline size_t arch_copy_from_iter_pmem(void *addr, size_t bytes,
9486
/* TODO: skip the write-back by always using non-temporal stores */
9587
len = copy_from_iter_nocache(addr, bytes, i);
9688

97-
if (__iter_needs_pmem_wb(i))
89+
/*
90+
* In the iovec case on x86_64 copy_from_iter_nocache() uses
91+
* non-temporal stores for the bulk of the transfer, but we need
92+
* to manually flush if the transfer is unaligned. A cached
93+
* memory copy is used when destination or size is not naturally
94+
* aligned. That is:
95+
* - Require 8-byte alignment when size is 8 bytes or larger.
96+
* - Require 4-byte alignment when size is 4 bytes.
97+
*
98+
* In the non-iovec case the entire destination needs to be
99+
* flushed.
100+
*/
101+
if (iter_is_iovec(i)) {
102+
unsigned long flushed, dest = (unsigned long) addr;
103+
104+
if (bytes < 8) {
105+
if (!IS_ALIGNED(dest, 4) || (bytes != 4))
106+
arch_wb_cache_pmem(addr, 1);
107+
} else {
108+
if (!IS_ALIGNED(dest, 8)) {
109+
dest = ALIGN(dest, boot_cpu_data.x86_clflush_size);
110+
arch_wb_cache_pmem(addr, 1);
111+
}
112+
113+
flushed = dest - (unsigned long) addr;
114+
if (bytes > flushed && !IS_ALIGNED(bytes - flushed, 8))
115+
arch_wb_cache_pmem(addr + bytes - 1, 1);
116+
}
117+
} else
98118
arch_wb_cache_pmem(addr, bytes);
99119

100120
return len;

0 commit comments

Comments
 (0)