// SPDX-License-Identifier: GPL-2.0-only
/*
 * User address space access functions.
 *
 * Copyright 1997 Andi Kleen <ak@muc.de>
 * Copyright 1997 Linus Torvalds
 * Copyright 2002 Andi Kleen <ak@suse.de>
 */
#include <linux/export.h>
#include <linux/uaccess.h>
#include <linux/highmem.h>

/*
 * Zero Userspace
 */

/**
 * __clear_user - zero a range of user memory, without an access check
 * @addr: user-space start address
 * @size: number of bytes to zero
 *
 * Stores zeroes in two phases: first @size / 8 quadword stores, then
 * @size & 7 single-byte stores.  This function does not call access_ok()
 * itself; clear_user() is the checked wrapper.
 *
 * Return: the value left in %rcx when the asm finishes.  That is 0 when
 * both loops ran to completion.  If a store faults, it is the number of
 * bytes that were not cleared: the quadword-loop fixup recomputes it as
 * size1 + 8 * (remaining quadwords), and a fault in the byte loop leaves
 * the remaining byte count in %rcx.
 *
 * NOTE(review): the semantics of _ASM_EXTABLE_UA() are defined outside
 * this file; it is read here as (faulting label, resume label) - confirm.
 *
 * NOTE(review): both loop counters are decremented with the 32-bit
 * "decl %ecx", so a quadword count that does not fit in 32 bits is not
 * counted as a full 64-bit value - confirm callers never pass such sizes.
 */
unsigned long __clear_user(void __user *addr, unsigned long size)
{
	long __d0;
	might_fault();
	/* no memory constraint because it doesn't change any memory gcc knows
	   about */
	/* presumably opens the user-access window; closed by clac() below */
	stac();
	asm volatile(
		/* skip the quadword loop when size / 8 == 0 */
		" testq %[size8],%[size8]\n"
		" jz 4f\n"
		" .align 16\n"
		/* quadword loop: %rcx counts remaining 8-byte stores */
		"0: movq $0,(%[dst])\n"
		" addq $8,%[dst]\n"
		" decl %%ecx ; jnz 0b\n"
		/* byte loop: reload %rcx with the size & 7 tail count */
		"4: movq %[size1],%%rcx\n"
		" testl %%ecx,%%ecx\n"
		" jz 2f\n"
		"1: movb $0,(%[dst])\n"
		" incq %[dst]\n"
		" decl %%ecx ; jnz 1b\n"
		"2:\n"
		".section .fixup,\"ax\"\n"
		/* fault in quadword loop: %rcx = tail bytes + 8 * quadwords left */
		"3: lea 0(%[size1],%[size8],8),%[size8]\n"
		" jmp 2b\n"
		".previous\n"
		_ASM_EXTABLE_UA(0b, 3b)
		_ASM_EXTABLE_UA(1b, 2b)
		/* size is bound to %rcx ("c"), the destination pointer to %rdi ("D") */
		: [size8] "=&c"(size), [dst] "=&D" (__d0)
		: [size1] "r"(size & 7), "[size8]" (size / 8), "[dst]"(addr));
	clac();
	return size;
}
EXPORT_SYMBOL(__clear_user);

/**
 * clear_user - zero a range of user memory, with an access check
 * @to: user-space start address
 * @n: number of bytes to zero
 *
 * Return: the result of __clear_user() when access_ok(@to, @n) succeeds;
 * otherwise @n, i.e. nothing was cleared.
 */
unsigned long clear_user(void __user *to, unsigned long n)
{
	if (access_ok(to, n))
		return __clear_user(to, n);
	return n;
}
EXPORT_SYMBOL(clear_user);

#ifdef CONFIG_ARCH_HAS_UACCESS_FLUSHCACHE
/**
 * clean_cache_range - write back a cache range with CLWB
 * @addr:	virtual start address
 * @size:	number of bytes to write back
 *
 * Write back a cache range using the CLWB (cache line write back)
 * instruction. Note that @size is internally rounded up to be cache
 * line size aligned.
 */
static void clean_cache_range(void *addr, size_t size)
{
	u16 x86_clflush_size = boot_cpu_data.x86_clflush_size;
	/* assumes the cache line size is a power of two - TODO confirm */
	unsigned long clflush_mask = x86_clflush_size - 1;
	void *vend = addr + size;
	void *p;

	/* start at the cache line containing @addr and step one line at a time */
	for (p = (void *)((unsigned long)addr & ~clflush_mask);
	     p < vend; p += x86_clflush_size)
		clwb(p);
}

/**
 * arch_wb_cache_pmem - write back the cache lines covering a range
 * @addr: virtual start address
 * @size: number of bytes to write back
 *
 * Thin exported wrapper around clean_cache_range().
 */
void arch_wb_cache_pmem(void *addr, size_t size)
{
	clean_cache_range(addr, size);
}
EXPORT_SYMBOL_GPL(arch_wb_cache_pmem);

/**
 * __copy_user_flushcache - copy from user space and flush unaligned edges
 * @dst: kernel destination address
 * @src: user-space source address
 * @size: number of bytes to copy
 *
 * Performs the copy with __copy_user_nocache() and then writes back the
 * cache lines at the head and/or tail of the destination according to
 * the alignment rules described in the body.  The flushes are issued
 * regardless of the copy's return value.
 *
 * Return: the value returned by __copy_user_nocache() (presumably the
 * number of bytes not copied - confirm against that helper).
 */
long __copy_user_flushcache(void *dst, const void __user *src, unsigned size)
{
	unsigned long flushed, dest = (unsigned long) dst;
	long rc = __copy_user_nocache(dst, src, size, 0);

	/*
	 * __copy_user_nocache() uses non-temporal stores for the bulk
	 * of the transfer, but we need to manually flush if the
	 * transfer is unaligned. A cached memory copy is used when
	 * destination or size is not naturally aligned. That is:
	 *   - Require 8-byte alignment when size is 8 bytes or larger.
	 *   - Require 4-byte alignment when size is 4 bytes.
	 */
	if (size < 8) {
		if (!IS_ALIGNED(dest, 4) || size != 4)
			clean_cache_range(dst, size);
	} else {
		if (!IS_ALIGNED(dest, 8)) {
			/* advance dest to the next cache line boundary ... */
			dest = ALIGN(dest, boot_cpu_data.x86_clflush_size);
			/* ... and write back the line that contains the head */
			clean_cache_range(dst, 1);
		}

		/* bytes between dst and dest; 0 when dst was already 8-byte aligned */
		flushed = dest - (unsigned long) dst;
		/* a tail that is not a multiple of 8: write back the last byte's line */
		if (size > flushed && !IS_ALIGNED(size - flushed, 8))
			clean_cache_range(dst + size - 1, 1);
	}

	return rc;
}

/**
 * __memcpy_flushcache - kernel-to-kernel copy that bypasses or flushes the cache
 * @_dst: destination address
 * @_src: source address
 * @size: number of bytes to copy
 *
 * Copies in stages: a cached memcpy() plus write-back to bring the
 * destination up to 8-byte alignment, then movnti stores in 32-, 8- and
 * 4-byte steps, and finally a cached memcpy() plus write-back for any
 * remaining bytes (fewer than 4).
 */
void __memcpy_flushcache(void *_dst, const void *_src, size_t size)
{
	unsigned long dest = (unsigned long) _dst;
	unsigned long source = (unsigned long) _src;

	/* cache copy and flush to align dest */
	if (!IS_ALIGNED(dest, 8)) {
		/* bytes up to the next 8-byte boundary, capped at the total size */
		size_t len = min_t(size_t, size, ALIGN(dest, 8) - dest);

		memcpy((void *) dest, (void *) source, len);
		clean_cache_range((void *) dest, len);
		dest += len;
		source += len;
		size -= len;
		if (!size)
			return;
	}

	/* 4x8 movnti loop */
	while (size >= 32) {
		/* load four quadwords into r8-r11, then store them with movnti */
		asm("movq (%0), %%r8\n"
		    "movq 8(%0), %%r9\n"
		    "movq 16(%0), %%r10\n"
		    "movq 24(%0), %%r11\n"
		    "movnti %%r8, (%1)\n"
		    "movnti %%r9, 8(%1)\n"
		    "movnti %%r10, 16(%1)\n"
		    "movnti %%r11, 24(%1)\n"
		    :: "r" (source), "r" (dest)
		    : "memory", "r8", "r9", "r10", "r11");
		dest += 32;
		source += 32;
		size -= 32;
	}

	/* 1x8 movnti loop */
	while (size >= 8) {
		asm("movq (%0), %%r8\n"
		    "movnti %%r8, (%1)\n"
		    :: "r" (source), "r" (dest)
		    : "memory", "r8");
		dest += 8;
		source += 8;
		size -= 8;
	}

	/* 1x4 movnti loop */
	while (size >= 4) {
		asm("movl (%0), %%r8d\n"
		    "movnti %%r8d, (%1)\n"
		    :: "r" (source), "r" (dest)
		    : "memory", "r8");
		dest += 4;
		source += 4;
		size -= 4;
	}

	/* cache copy for remaining bytes */
	if (size) {
		memcpy((void *) dest, (void *) source, size);
		clean_cache_range((void *) dest, size);
	}
}
EXPORT_SYMBOL_GPL(__memcpy_flushcache);

/**
 * memcpy_page_flushcache - copy out of a page using memcpy_flushcache()
 * @to: destination address
 * @page: source page
 * @offset: byte offset into @page at which the copy starts
 * @len: number of bytes to copy
 *
 * Maps @page with kmap_atomic(), copies @len bytes starting at @offset
 * to @to via memcpy_flushcache(), then drops the mapping.
 */
void memcpy_page_flushcache(char *to, struct page *page, size_t offset,
		size_t len)
{
	char *from = kmap_atomic(page);

	memcpy_flushcache(to, from + offset, len);
	kunmap_atomic(from);
}
#endif