18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 28c2ecf20Sopenharmony_ci#include <crypto/hash.h> 38c2ecf20Sopenharmony_ci#include <linux/export.h> 48c2ecf20Sopenharmony_ci#include <linux/bvec.h> 58c2ecf20Sopenharmony_ci#include <linux/fault-inject-usercopy.h> 68c2ecf20Sopenharmony_ci#include <linux/uio.h> 78c2ecf20Sopenharmony_ci#include <linux/pagemap.h> 88c2ecf20Sopenharmony_ci#include <linux/slab.h> 98c2ecf20Sopenharmony_ci#include <linux/vmalloc.h> 108c2ecf20Sopenharmony_ci#include <linux/splice.h> 118c2ecf20Sopenharmony_ci#include <linux/compat.h> 128c2ecf20Sopenharmony_ci#include <net/checksum.h> 138c2ecf20Sopenharmony_ci#include <linux/scatterlist.h> 148c2ecf20Sopenharmony_ci#include <linux/instrumented.h> 158c2ecf20Sopenharmony_ci 168c2ecf20Sopenharmony_ci#define PIPE_PARANOIA /* for now */ 178c2ecf20Sopenharmony_ci 188c2ecf20Sopenharmony_ci#define iterate_iovec(i, n, __v, __p, skip, STEP) { \ 198c2ecf20Sopenharmony_ci size_t left; \ 208c2ecf20Sopenharmony_ci size_t wanted = n; \ 218c2ecf20Sopenharmony_ci __p = i->iov; \ 228c2ecf20Sopenharmony_ci __v.iov_len = min(n, __p->iov_len - skip); \ 238c2ecf20Sopenharmony_ci if (likely(__v.iov_len)) { \ 248c2ecf20Sopenharmony_ci __v.iov_base = __p->iov_base + skip; \ 258c2ecf20Sopenharmony_ci left = (STEP); \ 268c2ecf20Sopenharmony_ci __v.iov_len -= left; \ 278c2ecf20Sopenharmony_ci skip += __v.iov_len; \ 288c2ecf20Sopenharmony_ci n -= __v.iov_len; \ 298c2ecf20Sopenharmony_ci } else { \ 308c2ecf20Sopenharmony_ci left = 0; \ 318c2ecf20Sopenharmony_ci } \ 328c2ecf20Sopenharmony_ci while (unlikely(!left && n)) { \ 338c2ecf20Sopenharmony_ci __p++; \ 348c2ecf20Sopenharmony_ci __v.iov_len = min(n, __p->iov_len); \ 358c2ecf20Sopenharmony_ci if (unlikely(!__v.iov_len)) \ 368c2ecf20Sopenharmony_ci continue; \ 378c2ecf20Sopenharmony_ci __v.iov_base = __p->iov_base; \ 388c2ecf20Sopenharmony_ci left = (STEP); \ 398c2ecf20Sopenharmony_ci __v.iov_len -= left; \ 408c2ecf20Sopenharmony_ci skip = __v.iov_len; \ 418c2ecf20Sopenharmony_ci n -= __v.iov_len; \ 428c2ecf20Sopenharmony_ci } \ 438c2ecf20Sopenharmony_ci n = wanted - n; \ 448c2ecf20Sopenharmony_ci} 458c2ecf20Sopenharmony_ci 468c2ecf20Sopenharmony_ci#define iterate_kvec(i, n, __v, __p, skip, STEP) { \ 478c2ecf20Sopenharmony_ci size_t wanted = n; \ 488c2ecf20Sopenharmony_ci __p = i->kvec; \ 498c2ecf20Sopenharmony_ci __v.iov_len = min(n, __p->iov_len - skip); \ 508c2ecf20Sopenharmony_ci if (likely(__v.iov_len)) { \ 518c2ecf20Sopenharmony_ci __v.iov_base = __p->iov_base + skip; \ 528c2ecf20Sopenharmony_ci (void)(STEP); \ 538c2ecf20Sopenharmony_ci skip += __v.iov_len; \ 548c2ecf20Sopenharmony_ci n -= __v.iov_len; \ 558c2ecf20Sopenharmony_ci } \ 568c2ecf20Sopenharmony_ci while (unlikely(n)) { \ 578c2ecf20Sopenharmony_ci __p++; \ 588c2ecf20Sopenharmony_ci __v.iov_len = min(n, __p->iov_len); \ 598c2ecf20Sopenharmony_ci if (unlikely(!__v.iov_len)) \ 608c2ecf20Sopenharmony_ci continue; \ 618c2ecf20Sopenharmony_ci __v.iov_base = __p->iov_base; \ 628c2ecf20Sopenharmony_ci (void)(STEP); \ 638c2ecf20Sopenharmony_ci skip = __v.iov_len; \ 648c2ecf20Sopenharmony_ci n -= __v.iov_len; \ 658c2ecf20Sopenharmony_ci } \ 668c2ecf20Sopenharmony_ci n = wanted; \ 678c2ecf20Sopenharmony_ci} 688c2ecf20Sopenharmony_ci 698c2ecf20Sopenharmony_ci#define iterate_bvec(i, n, __v, __bi, skip, STEP) { \ 708c2ecf20Sopenharmony_ci struct bvec_iter __start; \ 718c2ecf20Sopenharmony_ci __start.bi_size = n; \ 728c2ecf20Sopenharmony_ci __start.bi_bvec_done = skip; \ 738c2ecf20Sopenharmony_ci __start.bi_idx = 0; \ 748c2ecf20Sopenharmony_ci for_each_bvec(__v, i->bvec, __bi, __start) { \ 758c2ecf20Sopenharmony_ci if (!__v.bv_len) \ 768c2ecf20Sopenharmony_ci continue; \ 778c2ecf20Sopenharmony_ci (void)(STEP); \ 788c2ecf20Sopenharmony_ci } \ 798c2ecf20Sopenharmony_ci} 808c2ecf20Sopenharmony_ci 818c2ecf20Sopenharmony_ci#define iterate_all_kinds(i, n, v, I, B, K) { \ 828c2ecf20Sopenharmony_ci if (likely(n)) { \ 838c2ecf20Sopenharmony_ci size_t skip = i->iov_offset; \ 848c2ecf20Sopenharmony_ci if (unlikely(i->type & ITER_BVEC)) { \ 858c2ecf20Sopenharmony_ci struct bio_vec v; \ 868c2ecf20Sopenharmony_ci struct bvec_iter __bi; \ 878c2ecf20Sopenharmony_ci iterate_bvec(i, n, v, __bi, skip, (B)) \ 888c2ecf20Sopenharmony_ci } else if (unlikely(i->type & ITER_KVEC)) { \ 898c2ecf20Sopenharmony_ci const struct kvec *kvec; \ 908c2ecf20Sopenharmony_ci struct kvec v; \ 918c2ecf20Sopenharmony_ci iterate_kvec(i, n, v, kvec, skip, (K)) \ 928c2ecf20Sopenharmony_ci } else if (unlikely(i->type & ITER_DISCARD)) { \ 938c2ecf20Sopenharmony_ci } else { \ 948c2ecf20Sopenharmony_ci const struct iovec *iov; \ 958c2ecf20Sopenharmony_ci struct iovec v; \ 968c2ecf20Sopenharmony_ci iterate_iovec(i, n, v, iov, skip, (I)) \ 978c2ecf20Sopenharmony_ci } \ 988c2ecf20Sopenharmony_ci } \ 998c2ecf20Sopenharmony_ci} 1008c2ecf20Sopenharmony_ci 1018c2ecf20Sopenharmony_ci#define iterate_and_advance(i, n, v, I, B, K) { \ 1028c2ecf20Sopenharmony_ci if (unlikely(i->count < n)) \ 1038c2ecf20Sopenharmony_ci n = i->count; \ 1048c2ecf20Sopenharmony_ci if (i->count) { \ 1058c2ecf20Sopenharmony_ci size_t skip = i->iov_offset; \ 1068c2ecf20Sopenharmony_ci if (unlikely(i->type & ITER_BVEC)) { \ 1078c2ecf20Sopenharmony_ci const struct bio_vec *bvec = i->bvec; \ 1088c2ecf20Sopenharmony_ci struct bio_vec v; \ 1098c2ecf20Sopenharmony_ci struct bvec_iter __bi; \ 1108c2ecf20Sopenharmony_ci iterate_bvec(i, n, v, __bi, skip, (B)) \ 1118c2ecf20Sopenharmony_ci i->bvec = __bvec_iter_bvec(i->bvec, __bi); \ 1128c2ecf20Sopenharmony_ci i->nr_segs -= i->bvec - bvec; \ 1138c2ecf20Sopenharmony_ci skip = __bi.bi_bvec_done; \ 1148c2ecf20Sopenharmony_ci } else if (unlikely(i->type & ITER_KVEC)) { \ 1158c2ecf20Sopenharmony_ci const struct kvec *kvec; \ 1168c2ecf20Sopenharmony_ci struct kvec v; \ 1178c2ecf20Sopenharmony_ci iterate_kvec(i, n, v, kvec, skip, (K)) \ 1188c2ecf20Sopenharmony_ci if (skip == kvec->iov_len) { \ 1198c2ecf20Sopenharmony_ci kvec++; \ 1208c2ecf20Sopenharmony_ci skip = 0; \ 1218c2ecf20Sopenharmony_ci } \ 1228c2ecf20Sopenharmony_ci i->nr_segs -= kvec - i->kvec; \ 1238c2ecf20Sopenharmony_ci i->kvec = kvec; \ 1248c2ecf20Sopenharmony_ci } else if (unlikely(i->type & ITER_DISCARD)) { \ 1258c2ecf20Sopenharmony_ci skip += n; \ 1268c2ecf20Sopenharmony_ci } else { \ 1278c2ecf20Sopenharmony_ci const struct iovec *iov; \ 1288c2ecf20Sopenharmony_ci struct iovec v; \ 1298c2ecf20Sopenharmony_ci iterate_iovec(i, n, v, iov, skip, (I)) \ 1308c2ecf20Sopenharmony_ci if (skip == iov->iov_len) { \ 1318c2ecf20Sopenharmony_ci iov++; \ 1328c2ecf20Sopenharmony_ci skip = 0; \ 1338c2ecf20Sopenharmony_ci } \ 1348c2ecf20Sopenharmony_ci i->nr_segs -= iov - i->iov; \ 1358c2ecf20Sopenharmony_ci i->iov = iov; \ 1368c2ecf20Sopenharmony_ci } \ 1378c2ecf20Sopenharmony_ci i->count -= n; \ 1388c2ecf20Sopenharmony_ci i->iov_offset = skip; \ 1398c2ecf20Sopenharmony_ci } \ 1408c2ecf20Sopenharmony_ci} 1418c2ecf20Sopenharmony_ci 1428c2ecf20Sopenharmony_cistatic int copyout(void __user *to, const void *from, size_t n) 1438c2ecf20Sopenharmony_ci{ 1448c2ecf20Sopenharmony_ci if (should_fail_usercopy()) 1458c2ecf20Sopenharmony_ci return n; 1468c2ecf20Sopenharmony_ci if (access_ok(to, n)) { 1478c2ecf20Sopenharmony_ci instrument_copy_to_user(to, from, n); 1488c2ecf20Sopenharmony_ci n = raw_copy_to_user(to, from, n); 1498c2ecf20Sopenharmony_ci } 1508c2ecf20Sopenharmony_ci return n; 1518c2ecf20Sopenharmony_ci} 1528c2ecf20Sopenharmony_ci 1538c2ecf20Sopenharmony_cistatic int copyin(void *to, const void __user *from, size_t n) 1548c2ecf20Sopenharmony_ci{ 1558c2ecf20Sopenharmony_ci if (should_fail_usercopy()) 1568c2ecf20Sopenharmony_ci return n; 1578c2ecf20Sopenharmony_ci if (access_ok(from, n)) { 1588c2ecf20Sopenharmony_ci instrument_copy_from_user(to, from, n); 1598c2ecf20Sopenharmony_ci n = raw_copy_from_user(to, from, n); 1608c2ecf20Sopenharmony_ci } 1618c2ecf20Sopenharmony_ci return n; 1628c2ecf20Sopenharmony_ci} 1638c2ecf20Sopenharmony_ci 1648c2ecf20Sopenharmony_cistatic size_t copy_page_to_iter_iovec(struct page *page, size_t offset, size_t bytes, 1658c2ecf20Sopenharmony_ci struct iov_iter *i) 1668c2ecf20Sopenharmony_ci{ 1678c2ecf20Sopenharmony_ci size_t skip, copy, left, wanted; 1688c2ecf20Sopenharmony_ci const struct iovec *iov; 1698c2ecf20Sopenharmony_ci char __user *buf; 1708c2ecf20Sopenharmony_ci void *kaddr, *from; 1718c2ecf20Sopenharmony_ci 1728c2ecf20Sopenharmony_ci if (unlikely(bytes > i->count)) 1738c2ecf20Sopenharmony_ci bytes = i->count; 1748c2ecf20Sopenharmony_ci 1758c2ecf20Sopenharmony_ci if (unlikely(!bytes)) 1768c2ecf20Sopenharmony_ci return 0; 1778c2ecf20Sopenharmony_ci 1788c2ecf20Sopenharmony_ci might_fault(); 1798c2ecf20Sopenharmony_ci wanted = bytes; 1808c2ecf20Sopenharmony_ci iov = i->iov; 1818c2ecf20Sopenharmony_ci skip = i->iov_offset; 1828c2ecf20Sopenharmony_ci buf = iov->iov_base + skip; 1838c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len - skip); 1848c2ecf20Sopenharmony_ci 1858c2ecf20Sopenharmony_ci if (IS_ENABLED(CONFIG_HIGHMEM) && !fault_in_pages_writeable(buf, copy)) { 1868c2ecf20Sopenharmony_ci kaddr = kmap_atomic(page); 1878c2ecf20Sopenharmony_ci from = kaddr + offset; 1888c2ecf20Sopenharmony_ci 1898c2ecf20Sopenharmony_ci /* first chunk, usually the only one */ 1908c2ecf20Sopenharmony_ci left = copyout(buf, from, copy); 1918c2ecf20Sopenharmony_ci copy -= left; 1928c2ecf20Sopenharmony_ci skip += copy; 1938c2ecf20Sopenharmony_ci from += copy; 1948c2ecf20Sopenharmony_ci bytes -= copy; 1958c2ecf20Sopenharmony_ci 1968c2ecf20Sopenharmony_ci while (unlikely(!left && bytes)) { 1978c2ecf20Sopenharmony_ci iov++; 1988c2ecf20Sopenharmony_ci buf = iov->iov_base; 1998c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len); 2008c2ecf20Sopenharmony_ci left = copyout(buf, from, copy); 2018c2ecf20Sopenharmony_ci copy -= left; 2028c2ecf20Sopenharmony_ci skip = copy; 2038c2ecf20Sopenharmony_ci from += copy; 2048c2ecf20Sopenharmony_ci bytes -= copy; 2058c2ecf20Sopenharmony_ci } 2068c2ecf20Sopenharmony_ci if (likely(!bytes)) { 2078c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 2088c2ecf20Sopenharmony_ci goto done; 2098c2ecf20Sopenharmony_ci } 2108c2ecf20Sopenharmony_ci offset = from - kaddr; 2118c2ecf20Sopenharmony_ci buf += copy; 2128c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 2138c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len - skip); 2148c2ecf20Sopenharmony_ci } 2158c2ecf20Sopenharmony_ci /* Too bad - revert to non-atomic kmap */ 2168c2ecf20Sopenharmony_ci 2178c2ecf20Sopenharmony_ci kaddr = kmap(page); 2188c2ecf20Sopenharmony_ci from = kaddr + offset; 2198c2ecf20Sopenharmony_ci left = copyout(buf, from, copy); 2208c2ecf20Sopenharmony_ci copy -= left; 2218c2ecf20Sopenharmony_ci skip += copy; 2228c2ecf20Sopenharmony_ci from += copy; 2238c2ecf20Sopenharmony_ci bytes -= copy; 2248c2ecf20Sopenharmony_ci while (unlikely(!left && bytes)) { 2258c2ecf20Sopenharmony_ci iov++; 2268c2ecf20Sopenharmony_ci buf = iov->iov_base; 2278c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len); 2288c2ecf20Sopenharmony_ci left = copyout(buf, from, copy); 2298c2ecf20Sopenharmony_ci copy -= left; 2308c2ecf20Sopenharmony_ci skip = copy; 2318c2ecf20Sopenharmony_ci from += copy; 2328c2ecf20Sopenharmony_ci bytes -= copy; 2338c2ecf20Sopenharmony_ci } 2348c2ecf20Sopenharmony_ci kunmap(page); 2358c2ecf20Sopenharmony_ci 2368c2ecf20Sopenharmony_cidone: 2378c2ecf20Sopenharmony_ci if (skip == iov->iov_len) { 2388c2ecf20Sopenharmony_ci iov++; 2398c2ecf20Sopenharmony_ci skip = 0; 2408c2ecf20Sopenharmony_ci } 2418c2ecf20Sopenharmony_ci i->count -= wanted - bytes; 2428c2ecf20Sopenharmony_ci i->nr_segs -= iov - i->iov; 2438c2ecf20Sopenharmony_ci i->iov = iov; 2448c2ecf20Sopenharmony_ci i->iov_offset = skip; 2458c2ecf20Sopenharmony_ci return wanted - bytes; 2468c2ecf20Sopenharmony_ci} 2478c2ecf20Sopenharmony_ci 2488c2ecf20Sopenharmony_cistatic size_t copy_page_from_iter_iovec(struct page *page, size_t offset, size_t bytes, 2498c2ecf20Sopenharmony_ci struct iov_iter *i) 2508c2ecf20Sopenharmony_ci{ 2518c2ecf20Sopenharmony_ci size_t skip, copy, left, wanted; 2528c2ecf20Sopenharmony_ci const struct iovec *iov; 2538c2ecf20Sopenharmony_ci char __user *buf; 2548c2ecf20Sopenharmony_ci void *kaddr, *to; 2558c2ecf20Sopenharmony_ci 2568c2ecf20Sopenharmony_ci if (unlikely(bytes > i->count)) 2578c2ecf20Sopenharmony_ci bytes = i->count; 2588c2ecf20Sopenharmony_ci 2598c2ecf20Sopenharmony_ci if (unlikely(!bytes)) 2608c2ecf20Sopenharmony_ci return 0; 2618c2ecf20Sopenharmony_ci 2628c2ecf20Sopenharmony_ci might_fault(); 2638c2ecf20Sopenharmony_ci wanted = bytes; 2648c2ecf20Sopenharmony_ci iov = i->iov; 2658c2ecf20Sopenharmony_ci skip = i->iov_offset; 2668c2ecf20Sopenharmony_ci buf = iov->iov_base + skip; 2678c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len - skip); 2688c2ecf20Sopenharmony_ci 2698c2ecf20Sopenharmony_ci if (IS_ENABLED(CONFIG_HIGHMEM) && !fault_in_pages_readable(buf, copy)) { 2708c2ecf20Sopenharmony_ci kaddr = kmap_atomic(page); 2718c2ecf20Sopenharmony_ci to = kaddr + offset; 2728c2ecf20Sopenharmony_ci 2738c2ecf20Sopenharmony_ci /* first chunk, usually the only one */ 2748c2ecf20Sopenharmony_ci left = copyin(to, buf, copy); 2758c2ecf20Sopenharmony_ci copy -= left; 2768c2ecf20Sopenharmony_ci skip += copy; 2778c2ecf20Sopenharmony_ci to += copy; 2788c2ecf20Sopenharmony_ci bytes -= copy; 2798c2ecf20Sopenharmony_ci 2808c2ecf20Sopenharmony_ci while (unlikely(!left && bytes)) { 2818c2ecf20Sopenharmony_ci iov++; 2828c2ecf20Sopenharmony_ci buf = iov->iov_base; 2838c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len); 2848c2ecf20Sopenharmony_ci left = copyin(to, buf, copy); 2858c2ecf20Sopenharmony_ci copy -= left; 2868c2ecf20Sopenharmony_ci skip = copy; 2878c2ecf20Sopenharmony_ci to += copy; 2888c2ecf20Sopenharmony_ci bytes -= copy; 2898c2ecf20Sopenharmony_ci } 2908c2ecf20Sopenharmony_ci if (likely(!bytes)) { 2918c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 2928c2ecf20Sopenharmony_ci goto done; 2938c2ecf20Sopenharmony_ci } 2948c2ecf20Sopenharmony_ci offset = to - kaddr; 2958c2ecf20Sopenharmony_ci buf += copy; 2968c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 2978c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len - skip); 2988c2ecf20Sopenharmony_ci } 2998c2ecf20Sopenharmony_ci /* Too bad - revert to non-atomic kmap */ 3008c2ecf20Sopenharmony_ci 3018c2ecf20Sopenharmony_ci kaddr = kmap(page); 3028c2ecf20Sopenharmony_ci to = kaddr + offset; 3038c2ecf20Sopenharmony_ci left = copyin(to, buf, copy); 3048c2ecf20Sopenharmony_ci copy -= left; 3058c2ecf20Sopenharmony_ci skip += copy; 3068c2ecf20Sopenharmony_ci to += copy; 3078c2ecf20Sopenharmony_ci bytes -= copy; 3088c2ecf20Sopenharmony_ci while (unlikely(!left && bytes)) { 3098c2ecf20Sopenharmony_ci iov++; 3108c2ecf20Sopenharmony_ci buf = iov->iov_base; 3118c2ecf20Sopenharmony_ci copy = min(bytes, iov->iov_len); 3128c2ecf20Sopenharmony_ci left = copyin(to, buf, copy); 3138c2ecf20Sopenharmony_ci copy -= left; 3148c2ecf20Sopenharmony_ci skip = copy; 3158c2ecf20Sopenharmony_ci to += copy; 3168c2ecf20Sopenharmony_ci bytes -= copy; 3178c2ecf20Sopenharmony_ci } 3188c2ecf20Sopenharmony_ci kunmap(page); 3198c2ecf20Sopenharmony_ci 3208c2ecf20Sopenharmony_cidone: 3218c2ecf20Sopenharmony_ci if (skip == iov->iov_len) { 3228c2ecf20Sopenharmony_ci iov++; 3238c2ecf20Sopenharmony_ci skip = 0; 3248c2ecf20Sopenharmony_ci } 3258c2ecf20Sopenharmony_ci i->count -= wanted - bytes; 3268c2ecf20Sopenharmony_ci i->nr_segs -= iov - i->iov; 3278c2ecf20Sopenharmony_ci i->iov = iov; 3288c2ecf20Sopenharmony_ci i->iov_offset = skip; 3298c2ecf20Sopenharmony_ci return wanted - bytes; 3308c2ecf20Sopenharmony_ci} 3318c2ecf20Sopenharmony_ci 3328c2ecf20Sopenharmony_ci#ifdef PIPE_PARANOIA 3338c2ecf20Sopenharmony_cistatic bool sanity(const struct iov_iter *i) 3348c2ecf20Sopenharmony_ci{ 3358c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 3368c2ecf20Sopenharmony_ci unsigned int p_head = pipe->head; 3378c2ecf20Sopenharmony_ci unsigned int p_tail = pipe->tail; 3388c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 3398c2ecf20Sopenharmony_ci unsigned int p_occupancy = pipe_occupancy(p_head, p_tail); 3408c2ecf20Sopenharmony_ci unsigned int i_head = i->head; 3418c2ecf20Sopenharmony_ci unsigned int idx; 3428c2ecf20Sopenharmony_ci 3438c2ecf20Sopenharmony_ci if (i->iov_offset) { 3448c2ecf20Sopenharmony_ci struct pipe_buffer *p; 3458c2ecf20Sopenharmony_ci if (unlikely(p_occupancy == 0)) 3468c2ecf20Sopenharmony_ci goto Bad; // pipe must be non-empty 3478c2ecf20Sopenharmony_ci if (unlikely(i_head != p_head - 1)) 3488c2ecf20Sopenharmony_ci goto Bad; // must be at the last buffer... 3498c2ecf20Sopenharmony_ci 3508c2ecf20Sopenharmony_ci p = &pipe->bufs[i_head & p_mask]; 3518c2ecf20Sopenharmony_ci if (unlikely(p->offset + p->len != i->iov_offset)) 3528c2ecf20Sopenharmony_ci goto Bad; // ... at the end of segment 3538c2ecf20Sopenharmony_ci } else { 3548c2ecf20Sopenharmony_ci if (i_head != p_head) 3558c2ecf20Sopenharmony_ci goto Bad; // must be right after the last buffer 3568c2ecf20Sopenharmony_ci } 3578c2ecf20Sopenharmony_ci return true; 3588c2ecf20Sopenharmony_ciBad: 3598c2ecf20Sopenharmony_ci printk(KERN_ERR "idx = %d, offset = %zd\n", i_head, i->iov_offset); 3608c2ecf20Sopenharmony_ci printk(KERN_ERR "head = %d, tail = %d, buffers = %d\n", 3618c2ecf20Sopenharmony_ci p_head, p_tail, pipe->ring_size); 3628c2ecf20Sopenharmony_ci for (idx = 0; idx < pipe->ring_size; idx++) 3638c2ecf20Sopenharmony_ci printk(KERN_ERR "[%p %p %d %d]\n", 3648c2ecf20Sopenharmony_ci pipe->bufs[idx].ops, 3658c2ecf20Sopenharmony_ci pipe->bufs[idx].page, 3668c2ecf20Sopenharmony_ci pipe->bufs[idx].offset, 3678c2ecf20Sopenharmony_ci pipe->bufs[idx].len); 3688c2ecf20Sopenharmony_ci WARN_ON(1); 3698c2ecf20Sopenharmony_ci return false; 3708c2ecf20Sopenharmony_ci} 3718c2ecf20Sopenharmony_ci#else 3728c2ecf20Sopenharmony_ci#define sanity(i) true 3738c2ecf20Sopenharmony_ci#endif 3748c2ecf20Sopenharmony_ci 3758c2ecf20Sopenharmony_cistatic size_t copy_page_to_iter_pipe(struct page *page, size_t offset, size_t bytes, 3768c2ecf20Sopenharmony_ci struct iov_iter *i) 3778c2ecf20Sopenharmony_ci{ 3788c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 3798c2ecf20Sopenharmony_ci struct pipe_buffer *buf; 3808c2ecf20Sopenharmony_ci unsigned int p_tail = pipe->tail; 3818c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 3828c2ecf20Sopenharmony_ci unsigned int i_head = i->head; 3838c2ecf20Sopenharmony_ci size_t off; 3848c2ecf20Sopenharmony_ci 3858c2ecf20Sopenharmony_ci if (unlikely(bytes > i->count)) 3868c2ecf20Sopenharmony_ci bytes = i->count; 3878c2ecf20Sopenharmony_ci 3888c2ecf20Sopenharmony_ci if (unlikely(!bytes)) 3898c2ecf20Sopenharmony_ci return 0; 3908c2ecf20Sopenharmony_ci 3918c2ecf20Sopenharmony_ci if (!sanity(i)) 3928c2ecf20Sopenharmony_ci return 0; 3938c2ecf20Sopenharmony_ci 3948c2ecf20Sopenharmony_ci off = i->iov_offset; 3958c2ecf20Sopenharmony_ci buf = &pipe->bufs[i_head & p_mask]; 3968c2ecf20Sopenharmony_ci if (off) { 3978c2ecf20Sopenharmony_ci if (offset == off && buf->page == page) { 3988c2ecf20Sopenharmony_ci /* merge with the last one */ 3998c2ecf20Sopenharmony_ci buf->len += bytes; 4008c2ecf20Sopenharmony_ci i->iov_offset += bytes; 4018c2ecf20Sopenharmony_ci goto out; 4028c2ecf20Sopenharmony_ci } 4038c2ecf20Sopenharmony_ci i_head++; 4048c2ecf20Sopenharmony_ci buf = &pipe->bufs[i_head & p_mask]; 4058c2ecf20Sopenharmony_ci } 4068c2ecf20Sopenharmony_ci if (pipe_full(i_head, p_tail, pipe->max_usage)) 4078c2ecf20Sopenharmony_ci return 0; 4088c2ecf20Sopenharmony_ci 4098c2ecf20Sopenharmony_ci buf->ops = &page_cache_pipe_buf_ops; 4108c2ecf20Sopenharmony_ci buf->flags = 0; 4118c2ecf20Sopenharmony_ci get_page(page); 4128c2ecf20Sopenharmony_ci buf->page = page; 4138c2ecf20Sopenharmony_ci buf->offset = offset; 4148c2ecf20Sopenharmony_ci buf->len = bytes; 4158c2ecf20Sopenharmony_ci 4168c2ecf20Sopenharmony_ci pipe->head = i_head + 1; 4178c2ecf20Sopenharmony_ci i->iov_offset = offset + bytes; 4188c2ecf20Sopenharmony_ci i->head = i_head; 4198c2ecf20Sopenharmony_ciout: 4208c2ecf20Sopenharmony_ci i->count -= bytes; 4218c2ecf20Sopenharmony_ci return bytes; 4228c2ecf20Sopenharmony_ci} 4238c2ecf20Sopenharmony_ci 4248c2ecf20Sopenharmony_ci/* 4258c2ecf20Sopenharmony_ci * Fault in one or more iovecs of the given iov_iter, to a maximum length of 4268c2ecf20Sopenharmony_ci * bytes. For each iovec, fault in each page that constitutes the iovec. 4278c2ecf20Sopenharmony_ci * 4288c2ecf20Sopenharmony_ci * Return 0 on success, or non-zero if the memory could not be accessed (i.e. 4298c2ecf20Sopenharmony_ci * because it is an invalid address). 4308c2ecf20Sopenharmony_ci */ 4318c2ecf20Sopenharmony_ciint iov_iter_fault_in_readable(struct iov_iter *i, size_t bytes) 4328c2ecf20Sopenharmony_ci{ 4338c2ecf20Sopenharmony_ci size_t skip = i->iov_offset; 4348c2ecf20Sopenharmony_ci const struct iovec *iov; 4358c2ecf20Sopenharmony_ci int err; 4368c2ecf20Sopenharmony_ci struct iovec v; 4378c2ecf20Sopenharmony_ci 4388c2ecf20Sopenharmony_ci if (iter_is_iovec(i)) { 4398c2ecf20Sopenharmony_ci iterate_iovec(i, bytes, v, iov, skip, ({ 4408c2ecf20Sopenharmony_ci err = fault_in_pages_readable(v.iov_base, v.iov_len); 4418c2ecf20Sopenharmony_ci if (unlikely(err)) 4428c2ecf20Sopenharmony_ci return err; 4438c2ecf20Sopenharmony_ci 0;})) 4448c2ecf20Sopenharmony_ci } 4458c2ecf20Sopenharmony_ci return 0; 4468c2ecf20Sopenharmony_ci} 4478c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_fault_in_readable); 4488c2ecf20Sopenharmony_ci 4498c2ecf20Sopenharmony_civoid iov_iter_init(struct iov_iter *i, unsigned int direction, 4508c2ecf20Sopenharmony_ci const struct iovec *iov, unsigned long nr_segs, 4518c2ecf20Sopenharmony_ci size_t count) 4528c2ecf20Sopenharmony_ci{ 4538c2ecf20Sopenharmony_ci WARN_ON(direction & ~(READ | WRITE)); 4548c2ecf20Sopenharmony_ci direction &= READ | WRITE; 4558c2ecf20Sopenharmony_ci 4568c2ecf20Sopenharmony_ci /* It will get better. Eventually... */ 4578c2ecf20Sopenharmony_ci if (uaccess_kernel()) { 4588c2ecf20Sopenharmony_ci i->type = ITER_KVEC | direction; 4598c2ecf20Sopenharmony_ci i->kvec = (struct kvec *)iov; 4608c2ecf20Sopenharmony_ci } else { 4618c2ecf20Sopenharmony_ci i->type = ITER_IOVEC | direction; 4628c2ecf20Sopenharmony_ci i->iov = iov; 4638c2ecf20Sopenharmony_ci } 4648c2ecf20Sopenharmony_ci i->nr_segs = nr_segs; 4658c2ecf20Sopenharmony_ci i->iov_offset = 0; 4668c2ecf20Sopenharmony_ci i->count = count; 4678c2ecf20Sopenharmony_ci} 4688c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_init); 4698c2ecf20Sopenharmony_ci 4708c2ecf20Sopenharmony_cistatic void memzero_page(struct page *page, size_t offset, size_t len) 4718c2ecf20Sopenharmony_ci{ 4728c2ecf20Sopenharmony_ci char *addr = kmap_atomic(page); 4738c2ecf20Sopenharmony_ci memset(addr + offset, 0, len); 4748c2ecf20Sopenharmony_ci kunmap_atomic(addr); 4758c2ecf20Sopenharmony_ci} 4768c2ecf20Sopenharmony_ci 4778c2ecf20Sopenharmony_cistatic inline bool allocated(struct pipe_buffer *buf) 4788c2ecf20Sopenharmony_ci{ 4798c2ecf20Sopenharmony_ci return buf->ops == &default_pipe_buf_ops; 4808c2ecf20Sopenharmony_ci} 4818c2ecf20Sopenharmony_ci 4828c2ecf20Sopenharmony_cistatic inline void data_start(const struct iov_iter *i, 4838c2ecf20Sopenharmony_ci unsigned int *iter_headp, size_t *offp) 4848c2ecf20Sopenharmony_ci{ 4858c2ecf20Sopenharmony_ci unsigned int p_mask = i->pipe->ring_size - 1; 4868c2ecf20Sopenharmony_ci unsigned int iter_head = i->head; 4878c2ecf20Sopenharmony_ci size_t off = i->iov_offset; 4888c2ecf20Sopenharmony_ci 4898c2ecf20Sopenharmony_ci if (off && (!allocated(&i->pipe->bufs[iter_head & p_mask]) || 4908c2ecf20Sopenharmony_ci off == PAGE_SIZE)) { 4918c2ecf20Sopenharmony_ci iter_head++; 4928c2ecf20Sopenharmony_ci off = 0; 4938c2ecf20Sopenharmony_ci } 4948c2ecf20Sopenharmony_ci *iter_headp = iter_head; 4958c2ecf20Sopenharmony_ci *offp = off; 4968c2ecf20Sopenharmony_ci} 4978c2ecf20Sopenharmony_ci 4988c2ecf20Sopenharmony_cistatic size_t push_pipe(struct iov_iter *i, size_t size, 4998c2ecf20Sopenharmony_ci int *iter_headp, size_t *offp) 5008c2ecf20Sopenharmony_ci{ 5018c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 5028c2ecf20Sopenharmony_ci unsigned int p_tail = pipe->tail; 5038c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 5048c2ecf20Sopenharmony_ci unsigned int iter_head; 5058c2ecf20Sopenharmony_ci size_t off; 5068c2ecf20Sopenharmony_ci ssize_t left; 5078c2ecf20Sopenharmony_ci 5088c2ecf20Sopenharmony_ci if (unlikely(size > i->count)) 5098c2ecf20Sopenharmony_ci size = i->count; 5108c2ecf20Sopenharmony_ci if (unlikely(!size)) 5118c2ecf20Sopenharmony_ci return 0; 5128c2ecf20Sopenharmony_ci 5138c2ecf20Sopenharmony_ci left = size; 5148c2ecf20Sopenharmony_ci data_start(i, &iter_head, &off); 5158c2ecf20Sopenharmony_ci *iter_headp = iter_head; 5168c2ecf20Sopenharmony_ci *offp = off; 5178c2ecf20Sopenharmony_ci if (off) { 5188c2ecf20Sopenharmony_ci left -= PAGE_SIZE - off; 5198c2ecf20Sopenharmony_ci if (left <= 0) { 5208c2ecf20Sopenharmony_ci pipe->bufs[iter_head & p_mask].len += size; 5218c2ecf20Sopenharmony_ci return size; 5228c2ecf20Sopenharmony_ci } 5238c2ecf20Sopenharmony_ci pipe->bufs[iter_head & p_mask].len = PAGE_SIZE; 5248c2ecf20Sopenharmony_ci iter_head++; 5258c2ecf20Sopenharmony_ci } 5268c2ecf20Sopenharmony_ci while (!pipe_full(iter_head, p_tail, pipe->max_usage)) { 5278c2ecf20Sopenharmony_ci struct pipe_buffer *buf = &pipe->bufs[iter_head & p_mask]; 5288c2ecf20Sopenharmony_ci struct page *page = alloc_page(GFP_USER); 5298c2ecf20Sopenharmony_ci if (!page) 5308c2ecf20Sopenharmony_ci break; 5318c2ecf20Sopenharmony_ci 5328c2ecf20Sopenharmony_ci buf->ops = &default_pipe_buf_ops; 5338c2ecf20Sopenharmony_ci buf->flags = 0; 5348c2ecf20Sopenharmony_ci buf->page = page; 5358c2ecf20Sopenharmony_ci buf->offset = 0; 5368c2ecf20Sopenharmony_ci buf->len = min_t(ssize_t, left, PAGE_SIZE); 5378c2ecf20Sopenharmony_ci left -= buf->len; 5388c2ecf20Sopenharmony_ci iter_head++; 5398c2ecf20Sopenharmony_ci pipe->head = iter_head; 5408c2ecf20Sopenharmony_ci 5418c2ecf20Sopenharmony_ci if (left == 0) 5428c2ecf20Sopenharmony_ci return size; 5438c2ecf20Sopenharmony_ci } 5448c2ecf20Sopenharmony_ci return size - left; 5458c2ecf20Sopenharmony_ci} 5468c2ecf20Sopenharmony_ci 5478c2ecf20Sopenharmony_cistatic size_t copy_pipe_to_iter(const void *addr, size_t bytes, 5488c2ecf20Sopenharmony_ci struct iov_iter *i) 5498c2ecf20Sopenharmony_ci{ 5508c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 5518c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 5528c2ecf20Sopenharmony_ci unsigned int i_head; 5538c2ecf20Sopenharmony_ci size_t n, off; 5548c2ecf20Sopenharmony_ci 5558c2ecf20Sopenharmony_ci if (!sanity(i)) 5568c2ecf20Sopenharmony_ci return 0; 5578c2ecf20Sopenharmony_ci 5588c2ecf20Sopenharmony_ci bytes = n = push_pipe(i, bytes, &i_head, &off); 5598c2ecf20Sopenharmony_ci if (unlikely(!n)) 5608c2ecf20Sopenharmony_ci return 0; 5618c2ecf20Sopenharmony_ci do { 5628c2ecf20Sopenharmony_ci size_t chunk = min_t(size_t, n, PAGE_SIZE - off); 5638c2ecf20Sopenharmony_ci memcpy_to_page(pipe->bufs[i_head & p_mask].page, off, addr, chunk); 5648c2ecf20Sopenharmony_ci i->head = i_head; 5658c2ecf20Sopenharmony_ci i->iov_offset = off + chunk; 5668c2ecf20Sopenharmony_ci n -= chunk; 5678c2ecf20Sopenharmony_ci addr += chunk; 5688c2ecf20Sopenharmony_ci off = 0; 5698c2ecf20Sopenharmony_ci i_head++; 5708c2ecf20Sopenharmony_ci } while (n); 5718c2ecf20Sopenharmony_ci i->count -= bytes; 5728c2ecf20Sopenharmony_ci return bytes; 5738c2ecf20Sopenharmony_ci} 5748c2ecf20Sopenharmony_ci 5758c2ecf20Sopenharmony_cistatic __wsum csum_and_memcpy(void *to, const void *from, size_t len, 5768c2ecf20Sopenharmony_ci __wsum sum, size_t off) 5778c2ecf20Sopenharmony_ci{ 5788c2ecf20Sopenharmony_ci __wsum next = csum_partial_copy_nocheck(from, to, len); 5798c2ecf20Sopenharmony_ci return csum_block_add(sum, next, off); 5808c2ecf20Sopenharmony_ci} 5818c2ecf20Sopenharmony_ci 5828c2ecf20Sopenharmony_cistatic size_t csum_and_copy_to_pipe_iter(const void *addr, size_t bytes, 5838c2ecf20Sopenharmony_ci struct csum_state *csstate, 5848c2ecf20Sopenharmony_ci struct iov_iter *i) 5858c2ecf20Sopenharmony_ci{ 5868c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 5878c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 5888c2ecf20Sopenharmony_ci __wsum sum = csstate->csum; 5898c2ecf20Sopenharmony_ci size_t off = csstate->off; 5908c2ecf20Sopenharmony_ci unsigned int i_head; 5918c2ecf20Sopenharmony_ci size_t n, r; 5928c2ecf20Sopenharmony_ci 5938c2ecf20Sopenharmony_ci if (!sanity(i)) 5948c2ecf20Sopenharmony_ci return 0; 5958c2ecf20Sopenharmony_ci 5968c2ecf20Sopenharmony_ci bytes = n = push_pipe(i, bytes, &i_head, &r); 5978c2ecf20Sopenharmony_ci if (unlikely(!n)) 5988c2ecf20Sopenharmony_ci return 0; 5998c2ecf20Sopenharmony_ci do { 6008c2ecf20Sopenharmony_ci size_t chunk = min_t(size_t, n, PAGE_SIZE - r); 6018c2ecf20Sopenharmony_ci char *p = kmap_atomic(pipe->bufs[i_head & p_mask].page); 6028c2ecf20Sopenharmony_ci sum = csum_and_memcpy(p + r, addr, chunk, sum, off); 6038c2ecf20Sopenharmony_ci kunmap_atomic(p); 6048c2ecf20Sopenharmony_ci i->head = i_head; 6058c2ecf20Sopenharmony_ci i->iov_offset = r + chunk; 6068c2ecf20Sopenharmony_ci n -= chunk; 6078c2ecf20Sopenharmony_ci off += chunk; 6088c2ecf20Sopenharmony_ci addr += chunk; 6098c2ecf20Sopenharmony_ci r = 0; 6108c2ecf20Sopenharmony_ci i_head++; 6118c2ecf20Sopenharmony_ci } while (n); 6128c2ecf20Sopenharmony_ci i->count -= bytes; 6138c2ecf20Sopenharmony_ci csstate->csum = sum; 6148c2ecf20Sopenharmony_ci csstate->off = off; 6158c2ecf20Sopenharmony_ci return bytes; 6168c2ecf20Sopenharmony_ci} 6178c2ecf20Sopenharmony_ci 6188c2ecf20Sopenharmony_cisize_t _copy_to_iter(const void *addr, size_t bytes, struct iov_iter *i) 6198c2ecf20Sopenharmony_ci{ 6208c2ecf20Sopenharmony_ci const char *from = addr; 6218c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 6228c2ecf20Sopenharmony_ci return copy_pipe_to_iter(addr, bytes, i); 6238c2ecf20Sopenharmony_ci if (iter_is_iovec(i)) 6248c2ecf20Sopenharmony_ci might_fault(); 6258c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 6268c2ecf20Sopenharmony_ci copyout(v.iov_base, (from += v.iov_len) - v.iov_len, v.iov_len), 6278c2ecf20Sopenharmony_ci memcpy_to_page(v.bv_page, v.bv_offset, 6288c2ecf20Sopenharmony_ci (from += v.bv_len) - v.bv_len, v.bv_len), 6298c2ecf20Sopenharmony_ci memcpy(v.iov_base, (from += v.iov_len) - v.iov_len, v.iov_len) 6308c2ecf20Sopenharmony_ci ) 6318c2ecf20Sopenharmony_ci 6328c2ecf20Sopenharmony_ci return bytes; 6338c2ecf20Sopenharmony_ci} 6348c2ecf20Sopenharmony_ciEXPORT_SYMBOL(_copy_to_iter); 6358c2ecf20Sopenharmony_ci 6368c2ecf20Sopenharmony_ci#ifdef CONFIG_ARCH_HAS_COPY_MC 6378c2ecf20Sopenharmony_cistatic int copyout_mc(void __user *to, const void *from, size_t n) 6388c2ecf20Sopenharmony_ci{ 6398c2ecf20Sopenharmony_ci if (access_ok(to, n)) { 6408c2ecf20Sopenharmony_ci instrument_copy_to_user(to, from, n); 6418c2ecf20Sopenharmony_ci n = copy_mc_to_user((__force void *) to, from, n); 6428c2ecf20Sopenharmony_ci } 6438c2ecf20Sopenharmony_ci return n; 6448c2ecf20Sopenharmony_ci} 6458c2ecf20Sopenharmony_ci 6468c2ecf20Sopenharmony_cistatic unsigned long copy_mc_to_page(struct page *page, size_t offset, 6478c2ecf20Sopenharmony_ci const char *from, size_t len) 6488c2ecf20Sopenharmony_ci{ 6498c2ecf20Sopenharmony_ci unsigned long ret; 6508c2ecf20Sopenharmony_ci char *to; 6518c2ecf20Sopenharmony_ci 6528c2ecf20Sopenharmony_ci to = kmap_atomic(page); 6538c2ecf20Sopenharmony_ci ret = copy_mc_to_kernel(to + offset, from, len); 6548c2ecf20Sopenharmony_ci kunmap_atomic(to); 6558c2ecf20Sopenharmony_ci 6568c2ecf20Sopenharmony_ci return ret; 6578c2ecf20Sopenharmony_ci} 6588c2ecf20Sopenharmony_ci 6598c2ecf20Sopenharmony_cistatic size_t copy_mc_pipe_to_iter(const void *addr, size_t bytes, 6608c2ecf20Sopenharmony_ci struct iov_iter *i) 6618c2ecf20Sopenharmony_ci{ 6628c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 6638c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 6648c2ecf20Sopenharmony_ci unsigned int i_head; 6658c2ecf20Sopenharmony_ci size_t n, off, xfer = 0; 6668c2ecf20Sopenharmony_ci 6678c2ecf20Sopenharmony_ci if (!sanity(i)) 6688c2ecf20Sopenharmony_ci return 0; 6698c2ecf20Sopenharmony_ci 6708c2ecf20Sopenharmony_ci bytes = n = push_pipe(i, bytes, &i_head, &off); 6718c2ecf20Sopenharmony_ci if (unlikely(!n)) 6728c2ecf20Sopenharmony_ci return 0; 6738c2ecf20Sopenharmony_ci do { 6748c2ecf20Sopenharmony_ci size_t chunk = min_t(size_t, n, PAGE_SIZE - off); 6758c2ecf20Sopenharmony_ci unsigned long rem; 6768c2ecf20Sopenharmony_ci 6778c2ecf20Sopenharmony_ci rem = copy_mc_to_page(pipe->bufs[i_head & p_mask].page, 6788c2ecf20Sopenharmony_ci off, addr, chunk); 6798c2ecf20Sopenharmony_ci i->head = i_head; 6808c2ecf20Sopenharmony_ci i->iov_offset = off + chunk - rem; 6818c2ecf20Sopenharmony_ci xfer += chunk - rem; 6828c2ecf20Sopenharmony_ci if (rem) 6838c2ecf20Sopenharmony_ci break; 6848c2ecf20Sopenharmony_ci n -= chunk; 6858c2ecf20Sopenharmony_ci addr += chunk; 6868c2ecf20Sopenharmony_ci off = 0; 6878c2ecf20Sopenharmony_ci i_head++; 6888c2ecf20Sopenharmony_ci } while (n); 6898c2ecf20Sopenharmony_ci i->count -= xfer; 6908c2ecf20Sopenharmony_ci return xfer; 6918c2ecf20Sopenharmony_ci} 6928c2ecf20Sopenharmony_ci 6938c2ecf20Sopenharmony_ci/** 6948c2ecf20Sopenharmony_ci * _copy_mc_to_iter - copy to iter with source memory error exception handling 6958c2ecf20Sopenharmony_ci * @addr: source kernel address 6968c2ecf20Sopenharmony_ci * @bytes: total transfer length 6978c2ecf20Sopenharmony_ci * @iter: destination iterator 6988c2ecf20Sopenharmony_ci * 6998c2ecf20Sopenharmony_ci * The pmem driver deploys this for the dax operation 7008c2ecf20Sopenharmony_ci * (dax_copy_to_iter()) for dax reads (bypass page-cache and the 7018c2ecf20Sopenharmony_ci * block-layer). Upon #MC read(2) aborts and returns EIO or the bytes 7028c2ecf20Sopenharmony_ci * successfully copied. 7038c2ecf20Sopenharmony_ci * 7048c2ecf20Sopenharmony_ci * The main differences between this and typical _copy_to_iter(). 7058c2ecf20Sopenharmony_ci * 7068c2ecf20Sopenharmony_ci * * Typical tail/residue handling after a fault retries the copy 7078c2ecf20Sopenharmony_ci * byte-by-byte until the fault happens again. Re-triggering machine 7088c2ecf20Sopenharmony_ci * checks is potentially fatal so the implementation uses source 7098c2ecf20Sopenharmony_ci * alignment and poison alignment assumptions to avoid re-triggering 7108c2ecf20Sopenharmony_ci * hardware exceptions. 7118c2ecf20Sopenharmony_ci * 7128c2ecf20Sopenharmony_ci * * ITER_KVEC, ITER_PIPE, and ITER_BVEC can return short copies. 7138c2ecf20Sopenharmony_ci * Compare to copy_to_iter() where only ITER_IOVEC attempts might return 7148c2ecf20Sopenharmony_ci * a short copy. 7158c2ecf20Sopenharmony_ci */ 7168c2ecf20Sopenharmony_cisize_t _copy_mc_to_iter(const void *addr, size_t bytes, struct iov_iter *i) 7178c2ecf20Sopenharmony_ci{ 7188c2ecf20Sopenharmony_ci const char *from = addr; 7198c2ecf20Sopenharmony_ci unsigned long rem, curr_addr, s_addr = (unsigned long) addr; 7208c2ecf20Sopenharmony_ci 7218c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 7228c2ecf20Sopenharmony_ci return copy_mc_pipe_to_iter(addr, bytes, i); 7238c2ecf20Sopenharmony_ci if (iter_is_iovec(i)) 7248c2ecf20Sopenharmony_ci might_fault(); 7258c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 7268c2ecf20Sopenharmony_ci copyout_mc(v.iov_base, (from += v.iov_len) - v.iov_len, 7278c2ecf20Sopenharmony_ci v.iov_len), 7288c2ecf20Sopenharmony_ci ({ 7298c2ecf20Sopenharmony_ci rem = copy_mc_to_page(v.bv_page, v.bv_offset, 7308c2ecf20Sopenharmony_ci (from += v.bv_len) - v.bv_len, v.bv_len); 7318c2ecf20Sopenharmony_ci if (rem) { 7328c2ecf20Sopenharmony_ci curr_addr = (unsigned long) from; 7338c2ecf20Sopenharmony_ci bytes = curr_addr - s_addr - rem; 7348c2ecf20Sopenharmony_ci return bytes; 7358c2ecf20Sopenharmony_ci } 7368c2ecf20Sopenharmony_ci }), 7378c2ecf20Sopenharmony_ci ({ 7388c2ecf20Sopenharmony_ci rem = copy_mc_to_kernel(v.iov_base, (from += v.iov_len) 7398c2ecf20Sopenharmony_ci - v.iov_len, v.iov_len); 7408c2ecf20Sopenharmony_ci if (rem) { 7418c2ecf20Sopenharmony_ci curr_addr = (unsigned long) from; 7428c2ecf20Sopenharmony_ci bytes = curr_addr - s_addr - rem; 7438c2ecf20Sopenharmony_ci return bytes; 7448c2ecf20Sopenharmony_ci } 7458c2ecf20Sopenharmony_ci }) 7468c2ecf20Sopenharmony_ci ) 7478c2ecf20Sopenharmony_ci 7488c2ecf20Sopenharmony_ci return bytes; 7498c2ecf20Sopenharmony_ci} 7508c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(_copy_mc_to_iter); 7518c2ecf20Sopenharmony_ci#endif /* CONFIG_ARCH_HAS_COPY_MC */ 7528c2ecf20Sopenharmony_ci 7538c2ecf20Sopenharmony_cisize_t _copy_from_iter(void *addr, size_t bytes, struct iov_iter *i) 7548c2ecf20Sopenharmony_ci{ 7558c2ecf20Sopenharmony_ci char *to = addr; 7568c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 7578c2ecf20Sopenharmony_ci WARN_ON(1); 7588c2ecf20Sopenharmony_ci return 0; 7598c2ecf20Sopenharmony_ci } 7608c2ecf20Sopenharmony_ci if (iter_is_iovec(i)) 7618c2ecf20Sopenharmony_ci might_fault(); 7628c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 7638c2ecf20Sopenharmony_ci copyin((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len), 7648c2ecf20Sopenharmony_ci memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page, 7658c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 7668c2ecf20Sopenharmony_ci memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len) 7678c2ecf20Sopenharmony_ci ) 7688c2ecf20Sopenharmony_ci 7698c2ecf20Sopenharmony_ci return bytes; 7708c2ecf20Sopenharmony_ci} 7718c2ecf20Sopenharmony_ciEXPORT_SYMBOL(_copy_from_iter); 7728c2ecf20Sopenharmony_ci 7738c2ecf20Sopenharmony_cibool _copy_from_iter_full(void *addr, size_t bytes, struct iov_iter *i) 7748c2ecf20Sopenharmony_ci{ 7758c2ecf20Sopenharmony_ci char *to = addr; 7768c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 7778c2ecf20Sopenharmony_ci WARN_ON(1); 7788c2ecf20Sopenharmony_ci return false; 7798c2ecf20Sopenharmony_ci } 7808c2ecf20Sopenharmony_ci if (unlikely(i->count < bytes)) 7818c2ecf20Sopenharmony_ci return false; 7828c2ecf20Sopenharmony_ci 7838c2ecf20Sopenharmony_ci if (iter_is_iovec(i)) 7848c2ecf20Sopenharmony_ci might_fault(); 7858c2ecf20Sopenharmony_ci iterate_all_kinds(i, bytes, v, ({ 7868c2ecf20Sopenharmony_ci if (copyin((to += v.iov_len) - v.iov_len, 7878c2ecf20Sopenharmony_ci v.iov_base, v.iov_len)) 7888c2ecf20Sopenharmony_ci return false; 7898c2ecf20Sopenharmony_ci 0;}), 7908c2ecf20Sopenharmony_ci memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page, 7918c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 7928c2ecf20Sopenharmony_ci memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len) 7938c2ecf20Sopenharmony_ci ) 7948c2ecf20Sopenharmony_ci 7958c2ecf20Sopenharmony_ci iov_iter_advance(i, bytes); 7968c2ecf20Sopenharmony_ci return true; 7978c2ecf20Sopenharmony_ci} 7988c2ecf20Sopenharmony_ciEXPORT_SYMBOL(_copy_from_iter_full); 7998c2ecf20Sopenharmony_ci 8008c2ecf20Sopenharmony_cisize_t _copy_from_iter_nocache(void *addr, size_t bytes, struct iov_iter *i) 8018c2ecf20Sopenharmony_ci{ 8028c2ecf20Sopenharmony_ci char *to = addr; 8038c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 8048c2ecf20Sopenharmony_ci WARN_ON(1); 8058c2ecf20Sopenharmony_ci return 0; 8068c2ecf20Sopenharmony_ci } 8078c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 8088c2ecf20Sopenharmony_ci __copy_from_user_inatomic_nocache((to += v.iov_len) - v.iov_len, 8098c2ecf20Sopenharmony_ci v.iov_base, v.iov_len), 8108c2ecf20Sopenharmony_ci memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page, 8118c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 8128c2ecf20Sopenharmony_ci memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len) 8138c2ecf20Sopenharmony_ci ) 8148c2ecf20Sopenharmony_ci 8158c2ecf20Sopenharmony_ci return bytes; 8168c2ecf20Sopenharmony_ci} 8178c2ecf20Sopenharmony_ciEXPORT_SYMBOL(_copy_from_iter_nocache); 8188c2ecf20Sopenharmony_ci 8198c2ecf20Sopenharmony_ci#ifdef CONFIG_ARCH_HAS_UACCESS_FLUSHCACHE 8208c2ecf20Sopenharmony_ci/** 8218c2ecf20Sopenharmony_ci * _copy_from_iter_flushcache - write destination through cpu cache 8228c2ecf20Sopenharmony_ci * @addr: destination kernel address 8238c2ecf20Sopenharmony_ci * @bytes: total transfer length 8248c2ecf20Sopenharmony_ci * @iter: source iterator 8258c2ecf20Sopenharmony_ci * 8268c2ecf20Sopenharmony_ci * The pmem driver arranges for filesystem-dax to use this facility via 8278c2ecf20Sopenharmony_ci * dax_copy_from_iter() for ensuring that writes to persistent memory 8288c2ecf20Sopenharmony_ci * are flushed through the CPU cache. It is differentiated from 8298c2ecf20Sopenharmony_ci * _copy_from_iter_nocache() in that guarantees all data is flushed for 8308c2ecf20Sopenharmony_ci * all iterator types. The _copy_from_iter_nocache() only attempts to 8318c2ecf20Sopenharmony_ci * bypass the cache for the ITER_IOVEC case, and on some archs may use 8328c2ecf20Sopenharmony_ci * instructions that strand dirty-data in the cache. 8338c2ecf20Sopenharmony_ci */ 8348c2ecf20Sopenharmony_cisize_t _copy_from_iter_flushcache(void *addr, size_t bytes, struct iov_iter *i) 8358c2ecf20Sopenharmony_ci{ 8368c2ecf20Sopenharmony_ci char *to = addr; 8378c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 8388c2ecf20Sopenharmony_ci WARN_ON(1); 8398c2ecf20Sopenharmony_ci return 0; 8408c2ecf20Sopenharmony_ci } 8418c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 8428c2ecf20Sopenharmony_ci __copy_from_user_flushcache((to += v.iov_len) - v.iov_len, 8438c2ecf20Sopenharmony_ci v.iov_base, v.iov_len), 8448c2ecf20Sopenharmony_ci memcpy_page_flushcache((to += v.bv_len) - v.bv_len, v.bv_page, 8458c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 8468c2ecf20Sopenharmony_ci memcpy_flushcache((to += v.iov_len) - v.iov_len, v.iov_base, 8478c2ecf20Sopenharmony_ci v.iov_len) 8488c2ecf20Sopenharmony_ci ) 8498c2ecf20Sopenharmony_ci 8508c2ecf20Sopenharmony_ci return bytes; 8518c2ecf20Sopenharmony_ci} 8528c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(_copy_from_iter_flushcache); 8538c2ecf20Sopenharmony_ci#endif 8548c2ecf20Sopenharmony_ci 8558c2ecf20Sopenharmony_cibool _copy_from_iter_full_nocache(void *addr, size_t bytes, struct iov_iter *i) 8568c2ecf20Sopenharmony_ci{ 8578c2ecf20Sopenharmony_ci char *to = addr; 8588c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 8598c2ecf20Sopenharmony_ci WARN_ON(1); 8608c2ecf20Sopenharmony_ci return false; 8618c2ecf20Sopenharmony_ci } 8628c2ecf20Sopenharmony_ci if (unlikely(i->count < bytes)) 8638c2ecf20Sopenharmony_ci return false; 8648c2ecf20Sopenharmony_ci iterate_all_kinds(i, bytes, v, ({ 8658c2ecf20Sopenharmony_ci if (__copy_from_user_inatomic_nocache((to += v.iov_len) - v.iov_len, 8668c2ecf20Sopenharmony_ci v.iov_base, v.iov_len)) 8678c2ecf20Sopenharmony_ci return false; 8688c2ecf20Sopenharmony_ci 0;}), 8698c2ecf20Sopenharmony_ci memcpy_from_page((to += v.bv_len) - v.bv_len, v.bv_page, 8708c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 8718c2ecf20Sopenharmony_ci memcpy((to += v.iov_len) - v.iov_len, v.iov_base, v.iov_len) 8728c2ecf20Sopenharmony_ci ) 8738c2ecf20Sopenharmony_ci 8748c2ecf20Sopenharmony_ci iov_iter_advance(i, bytes); 8758c2ecf20Sopenharmony_ci return true; 8768c2ecf20Sopenharmony_ci} 8778c2ecf20Sopenharmony_ciEXPORT_SYMBOL(_copy_from_iter_full_nocache); 8788c2ecf20Sopenharmony_ci 8798c2ecf20Sopenharmony_cistatic inline bool page_copy_sane(struct page *page, size_t offset, size_t n) 8808c2ecf20Sopenharmony_ci{ 8818c2ecf20Sopenharmony_ci struct page *head; 8828c2ecf20Sopenharmony_ci size_t v = n + offset; 8838c2ecf20Sopenharmony_ci 8848c2ecf20Sopenharmony_ci /* 8858c2ecf20Sopenharmony_ci * The general case needs to access the page order in order 8868c2ecf20Sopenharmony_ci * to compute the page size. 8878c2ecf20Sopenharmony_ci * However, we mostly deal with order-0 pages and thus can 8888c2ecf20Sopenharmony_ci * avoid a possible cache line miss for requests that fit all 8898c2ecf20Sopenharmony_ci * page orders. 8908c2ecf20Sopenharmony_ci */ 8918c2ecf20Sopenharmony_ci if (n <= v && v <= PAGE_SIZE) 8928c2ecf20Sopenharmony_ci return true; 8938c2ecf20Sopenharmony_ci 8948c2ecf20Sopenharmony_ci head = compound_head(page); 8958c2ecf20Sopenharmony_ci v += (page - head) << PAGE_SHIFT; 8968c2ecf20Sopenharmony_ci 8978c2ecf20Sopenharmony_ci if (likely(n <= v && v <= (page_size(head)))) 8988c2ecf20Sopenharmony_ci return true; 8998c2ecf20Sopenharmony_ci WARN_ON(1); 9008c2ecf20Sopenharmony_ci return false; 9018c2ecf20Sopenharmony_ci} 9028c2ecf20Sopenharmony_ci 9038c2ecf20Sopenharmony_cisize_t copy_page_to_iter(struct page *page, size_t offset, size_t bytes, 9048c2ecf20Sopenharmony_ci struct iov_iter *i) 9058c2ecf20Sopenharmony_ci{ 9068c2ecf20Sopenharmony_ci if (unlikely(!page_copy_sane(page, offset, bytes))) 9078c2ecf20Sopenharmony_ci return 0; 9088c2ecf20Sopenharmony_ci if (i->type & (ITER_BVEC|ITER_KVEC)) { 9098c2ecf20Sopenharmony_ci void *kaddr = kmap_atomic(page); 9108c2ecf20Sopenharmony_ci size_t wanted = copy_to_iter(kaddr + offset, bytes, i); 9118c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 9128c2ecf20Sopenharmony_ci return wanted; 9138c2ecf20Sopenharmony_ci } else if (unlikely(iov_iter_is_discard(i))) { 9148c2ecf20Sopenharmony_ci if (unlikely(i->count < bytes)) 9158c2ecf20Sopenharmony_ci bytes = i->count; 9168c2ecf20Sopenharmony_ci i->count -= bytes; 9178c2ecf20Sopenharmony_ci return bytes; 9188c2ecf20Sopenharmony_ci } else if (likely(!iov_iter_is_pipe(i))) 9198c2ecf20Sopenharmony_ci return copy_page_to_iter_iovec(page, offset, bytes, i); 9208c2ecf20Sopenharmony_ci else 9218c2ecf20Sopenharmony_ci return copy_page_to_iter_pipe(page, offset, bytes, i); 9228c2ecf20Sopenharmony_ci} 9238c2ecf20Sopenharmony_ciEXPORT_SYMBOL(copy_page_to_iter); 9248c2ecf20Sopenharmony_ci 9258c2ecf20Sopenharmony_cisize_t copy_page_from_iter(struct page *page, size_t offset, size_t bytes, 9268c2ecf20Sopenharmony_ci struct iov_iter *i) 9278c2ecf20Sopenharmony_ci{ 9288c2ecf20Sopenharmony_ci if (unlikely(!page_copy_sane(page, offset, bytes))) 9298c2ecf20Sopenharmony_ci return 0; 9308c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i) || iov_iter_is_discard(i))) { 9318c2ecf20Sopenharmony_ci WARN_ON(1); 9328c2ecf20Sopenharmony_ci return 0; 9338c2ecf20Sopenharmony_ci } 9348c2ecf20Sopenharmony_ci if (i->type & (ITER_BVEC|ITER_KVEC)) { 9358c2ecf20Sopenharmony_ci void *kaddr = kmap_atomic(page); 9368c2ecf20Sopenharmony_ci size_t wanted = _copy_from_iter(kaddr + offset, bytes, i); 9378c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 9388c2ecf20Sopenharmony_ci return wanted; 9398c2ecf20Sopenharmony_ci } else 9408c2ecf20Sopenharmony_ci return copy_page_from_iter_iovec(page, offset, bytes, i); 9418c2ecf20Sopenharmony_ci} 9428c2ecf20Sopenharmony_ciEXPORT_SYMBOL(copy_page_from_iter); 9438c2ecf20Sopenharmony_ci 9448c2ecf20Sopenharmony_cistatic size_t pipe_zero(size_t bytes, struct iov_iter *i) 9458c2ecf20Sopenharmony_ci{ 9468c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 9478c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 9488c2ecf20Sopenharmony_ci unsigned int i_head; 9498c2ecf20Sopenharmony_ci size_t n, off; 9508c2ecf20Sopenharmony_ci 9518c2ecf20Sopenharmony_ci if (!sanity(i)) 9528c2ecf20Sopenharmony_ci return 0; 9538c2ecf20Sopenharmony_ci 9548c2ecf20Sopenharmony_ci bytes = n = push_pipe(i, bytes, &i_head, &off); 9558c2ecf20Sopenharmony_ci if (unlikely(!n)) 9568c2ecf20Sopenharmony_ci return 0; 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_ci do { 9598c2ecf20Sopenharmony_ci size_t chunk = min_t(size_t, n, PAGE_SIZE - off); 9608c2ecf20Sopenharmony_ci memzero_page(pipe->bufs[i_head & p_mask].page, off, chunk); 9618c2ecf20Sopenharmony_ci i->head = i_head; 9628c2ecf20Sopenharmony_ci i->iov_offset = off + chunk; 9638c2ecf20Sopenharmony_ci n -= chunk; 9648c2ecf20Sopenharmony_ci off = 0; 9658c2ecf20Sopenharmony_ci i_head++; 9668c2ecf20Sopenharmony_ci } while (n); 9678c2ecf20Sopenharmony_ci i->count -= bytes; 9688c2ecf20Sopenharmony_ci return bytes; 9698c2ecf20Sopenharmony_ci} 9708c2ecf20Sopenharmony_ci 9718c2ecf20Sopenharmony_cisize_t iov_iter_zero(size_t bytes, struct iov_iter *i) 9728c2ecf20Sopenharmony_ci{ 9738c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 9748c2ecf20Sopenharmony_ci return pipe_zero(bytes, i); 9758c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, 9768c2ecf20Sopenharmony_ci clear_user(v.iov_base, v.iov_len), 9778c2ecf20Sopenharmony_ci memzero_page(v.bv_page, v.bv_offset, v.bv_len), 9788c2ecf20Sopenharmony_ci memset(v.iov_base, 0, v.iov_len) 9798c2ecf20Sopenharmony_ci ) 9808c2ecf20Sopenharmony_ci 9818c2ecf20Sopenharmony_ci return bytes; 9828c2ecf20Sopenharmony_ci} 9838c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_zero); 9848c2ecf20Sopenharmony_ci 9858c2ecf20Sopenharmony_cisize_t iov_iter_copy_from_user_atomic(struct page *page, 9868c2ecf20Sopenharmony_ci struct iov_iter *i, unsigned long offset, size_t bytes) 9878c2ecf20Sopenharmony_ci{ 9888c2ecf20Sopenharmony_ci char *kaddr = kmap_atomic(page), *p = kaddr + offset; 9898c2ecf20Sopenharmony_ci if (unlikely(!page_copy_sane(page, offset, bytes))) { 9908c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 9918c2ecf20Sopenharmony_ci return 0; 9928c2ecf20Sopenharmony_ci } 9938c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i) || iov_iter_is_discard(i))) { 9948c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 9958c2ecf20Sopenharmony_ci WARN_ON(1); 9968c2ecf20Sopenharmony_ci return 0; 9978c2ecf20Sopenharmony_ci } 9988c2ecf20Sopenharmony_ci iterate_all_kinds(i, bytes, v, 9998c2ecf20Sopenharmony_ci copyin((p += v.iov_len) - v.iov_len, v.iov_base, v.iov_len), 10008c2ecf20Sopenharmony_ci memcpy_from_page((p += v.bv_len) - v.bv_len, v.bv_page, 10018c2ecf20Sopenharmony_ci v.bv_offset, v.bv_len), 10028c2ecf20Sopenharmony_ci memcpy((p += v.iov_len) - v.iov_len, v.iov_base, v.iov_len) 10038c2ecf20Sopenharmony_ci ) 10048c2ecf20Sopenharmony_ci kunmap_atomic(kaddr); 10058c2ecf20Sopenharmony_ci return bytes; 10068c2ecf20Sopenharmony_ci} 10078c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_copy_from_user_atomic); 10088c2ecf20Sopenharmony_ci 10098c2ecf20Sopenharmony_cistatic inline void pipe_truncate(struct iov_iter *i) 10108c2ecf20Sopenharmony_ci{ 10118c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 10128c2ecf20Sopenharmony_ci unsigned int p_tail = pipe->tail; 10138c2ecf20Sopenharmony_ci unsigned int p_head = pipe->head; 10148c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 10158c2ecf20Sopenharmony_ci 10168c2ecf20Sopenharmony_ci if (!pipe_empty(p_head, p_tail)) { 10178c2ecf20Sopenharmony_ci struct pipe_buffer *buf; 10188c2ecf20Sopenharmony_ci unsigned int i_head = i->head; 10198c2ecf20Sopenharmony_ci size_t off = i->iov_offset; 10208c2ecf20Sopenharmony_ci 10218c2ecf20Sopenharmony_ci if (off) { 10228c2ecf20Sopenharmony_ci buf = &pipe->bufs[i_head & p_mask]; 10238c2ecf20Sopenharmony_ci buf->len = off - buf->offset; 10248c2ecf20Sopenharmony_ci i_head++; 10258c2ecf20Sopenharmony_ci } 10268c2ecf20Sopenharmony_ci while (p_head != i_head) { 10278c2ecf20Sopenharmony_ci p_head--; 10288c2ecf20Sopenharmony_ci pipe_buf_release(pipe, &pipe->bufs[p_head & p_mask]); 10298c2ecf20Sopenharmony_ci } 10308c2ecf20Sopenharmony_ci 10318c2ecf20Sopenharmony_ci pipe->head = p_head; 10328c2ecf20Sopenharmony_ci } 10338c2ecf20Sopenharmony_ci} 10348c2ecf20Sopenharmony_ci 10358c2ecf20Sopenharmony_cistatic void pipe_advance(struct iov_iter *i, size_t size) 10368c2ecf20Sopenharmony_ci{ 10378c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 10388c2ecf20Sopenharmony_ci if (unlikely(i->count < size)) 10398c2ecf20Sopenharmony_ci size = i->count; 10408c2ecf20Sopenharmony_ci if (size) { 10418c2ecf20Sopenharmony_ci struct pipe_buffer *buf; 10428c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 10438c2ecf20Sopenharmony_ci unsigned int i_head = i->head; 10448c2ecf20Sopenharmony_ci size_t off = i->iov_offset, left = size; 10458c2ecf20Sopenharmony_ci 10468c2ecf20Sopenharmony_ci if (off) /* make it relative to the beginning of buffer */ 10478c2ecf20Sopenharmony_ci left += off - pipe->bufs[i_head & p_mask].offset; 10488c2ecf20Sopenharmony_ci while (1) { 10498c2ecf20Sopenharmony_ci buf = &pipe->bufs[i_head & p_mask]; 10508c2ecf20Sopenharmony_ci if (left <= buf->len) 10518c2ecf20Sopenharmony_ci break; 10528c2ecf20Sopenharmony_ci left -= buf->len; 10538c2ecf20Sopenharmony_ci i_head++; 10548c2ecf20Sopenharmony_ci } 10558c2ecf20Sopenharmony_ci i->head = i_head; 10568c2ecf20Sopenharmony_ci i->iov_offset = buf->offset + left; 10578c2ecf20Sopenharmony_ci } 10588c2ecf20Sopenharmony_ci i->count -= size; 10598c2ecf20Sopenharmony_ci /* ... and discard everything past that point */ 10608c2ecf20Sopenharmony_ci pipe_truncate(i); 10618c2ecf20Sopenharmony_ci} 10628c2ecf20Sopenharmony_ci 10638c2ecf20Sopenharmony_civoid iov_iter_advance(struct iov_iter *i, size_t size) 10648c2ecf20Sopenharmony_ci{ 10658c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 10668c2ecf20Sopenharmony_ci pipe_advance(i, size); 10678c2ecf20Sopenharmony_ci return; 10688c2ecf20Sopenharmony_ci } 10698c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) { 10708c2ecf20Sopenharmony_ci i->count -= size; 10718c2ecf20Sopenharmony_ci return; 10728c2ecf20Sopenharmony_ci } 10738c2ecf20Sopenharmony_ci iterate_and_advance(i, size, v, 0, 0, 0) 10748c2ecf20Sopenharmony_ci} 10758c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_advance); 10768c2ecf20Sopenharmony_ci 10778c2ecf20Sopenharmony_civoid iov_iter_revert(struct iov_iter *i, size_t unroll) 10788c2ecf20Sopenharmony_ci{ 10798c2ecf20Sopenharmony_ci if (!unroll) 10808c2ecf20Sopenharmony_ci return; 10818c2ecf20Sopenharmony_ci if (WARN_ON(unroll > MAX_RW_COUNT)) 10828c2ecf20Sopenharmony_ci return; 10838c2ecf20Sopenharmony_ci i->count += unroll; 10848c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 10858c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 10868c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 10878c2ecf20Sopenharmony_ci unsigned int i_head = i->head; 10888c2ecf20Sopenharmony_ci size_t off = i->iov_offset; 10898c2ecf20Sopenharmony_ci while (1) { 10908c2ecf20Sopenharmony_ci struct pipe_buffer *b = &pipe->bufs[i_head & p_mask]; 10918c2ecf20Sopenharmony_ci size_t n = off - b->offset; 10928c2ecf20Sopenharmony_ci if (unroll < n) { 10938c2ecf20Sopenharmony_ci off -= unroll; 10948c2ecf20Sopenharmony_ci break; 10958c2ecf20Sopenharmony_ci } 10968c2ecf20Sopenharmony_ci unroll -= n; 10978c2ecf20Sopenharmony_ci if (!unroll && i_head == i->start_head) { 10988c2ecf20Sopenharmony_ci off = 0; 10998c2ecf20Sopenharmony_ci break; 11008c2ecf20Sopenharmony_ci } 11018c2ecf20Sopenharmony_ci i_head--; 11028c2ecf20Sopenharmony_ci b = &pipe->bufs[i_head & p_mask]; 11038c2ecf20Sopenharmony_ci off = b->offset + b->len; 11048c2ecf20Sopenharmony_ci } 11058c2ecf20Sopenharmony_ci i->iov_offset = off; 11068c2ecf20Sopenharmony_ci i->head = i_head; 11078c2ecf20Sopenharmony_ci pipe_truncate(i); 11088c2ecf20Sopenharmony_ci return; 11098c2ecf20Sopenharmony_ci } 11108c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) 11118c2ecf20Sopenharmony_ci return; 11128c2ecf20Sopenharmony_ci if (unroll <= i->iov_offset) { 11138c2ecf20Sopenharmony_ci i->iov_offset -= unroll; 11148c2ecf20Sopenharmony_ci return; 11158c2ecf20Sopenharmony_ci } 11168c2ecf20Sopenharmony_ci unroll -= i->iov_offset; 11178c2ecf20Sopenharmony_ci if (iov_iter_is_bvec(i)) { 11188c2ecf20Sopenharmony_ci const struct bio_vec *bvec = i->bvec; 11198c2ecf20Sopenharmony_ci while (1) { 11208c2ecf20Sopenharmony_ci size_t n = (--bvec)->bv_len; 11218c2ecf20Sopenharmony_ci i->nr_segs++; 11228c2ecf20Sopenharmony_ci if (unroll <= n) { 11238c2ecf20Sopenharmony_ci i->bvec = bvec; 11248c2ecf20Sopenharmony_ci i->iov_offset = n - unroll; 11258c2ecf20Sopenharmony_ci return; 11268c2ecf20Sopenharmony_ci } 11278c2ecf20Sopenharmony_ci unroll -= n; 11288c2ecf20Sopenharmony_ci } 11298c2ecf20Sopenharmony_ci } else { /* same logics for iovec and kvec */ 11308c2ecf20Sopenharmony_ci const struct iovec *iov = i->iov; 11318c2ecf20Sopenharmony_ci while (1) { 11328c2ecf20Sopenharmony_ci size_t n = (--iov)->iov_len; 11338c2ecf20Sopenharmony_ci i->nr_segs++; 11348c2ecf20Sopenharmony_ci if (unroll <= n) { 11358c2ecf20Sopenharmony_ci i->iov = iov; 11368c2ecf20Sopenharmony_ci i->iov_offset = n - unroll; 11378c2ecf20Sopenharmony_ci return; 11388c2ecf20Sopenharmony_ci } 11398c2ecf20Sopenharmony_ci unroll -= n; 11408c2ecf20Sopenharmony_ci } 11418c2ecf20Sopenharmony_ci } 11428c2ecf20Sopenharmony_ci} 11438c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_revert); 11448c2ecf20Sopenharmony_ci 11458c2ecf20Sopenharmony_ci/* 11468c2ecf20Sopenharmony_ci * Return the count of just the current iov_iter segment. 11478c2ecf20Sopenharmony_ci */ 11488c2ecf20Sopenharmony_cisize_t iov_iter_single_seg_count(const struct iov_iter *i) 11498c2ecf20Sopenharmony_ci{ 11508c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 11518c2ecf20Sopenharmony_ci return i->count; // it is a silly place, anyway 11528c2ecf20Sopenharmony_ci if (i->nr_segs == 1) 11538c2ecf20Sopenharmony_ci return i->count; 11548c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) 11558c2ecf20Sopenharmony_ci return i->count; 11568c2ecf20Sopenharmony_ci else if (iov_iter_is_bvec(i)) 11578c2ecf20Sopenharmony_ci return min(i->count, i->bvec->bv_len - i->iov_offset); 11588c2ecf20Sopenharmony_ci else 11598c2ecf20Sopenharmony_ci return min(i->count, i->iov->iov_len - i->iov_offset); 11608c2ecf20Sopenharmony_ci} 11618c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_single_seg_count); 11628c2ecf20Sopenharmony_ci 11638c2ecf20Sopenharmony_civoid iov_iter_kvec(struct iov_iter *i, unsigned int direction, 11648c2ecf20Sopenharmony_ci const struct kvec *kvec, unsigned long nr_segs, 11658c2ecf20Sopenharmony_ci size_t count) 11668c2ecf20Sopenharmony_ci{ 11678c2ecf20Sopenharmony_ci WARN_ON(direction & ~(READ | WRITE)); 11688c2ecf20Sopenharmony_ci i->type = ITER_KVEC | (direction & (READ | WRITE)); 11698c2ecf20Sopenharmony_ci i->kvec = kvec; 11708c2ecf20Sopenharmony_ci i->nr_segs = nr_segs; 11718c2ecf20Sopenharmony_ci i->iov_offset = 0; 11728c2ecf20Sopenharmony_ci i->count = count; 11738c2ecf20Sopenharmony_ci} 11748c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_kvec); 11758c2ecf20Sopenharmony_ci 11768c2ecf20Sopenharmony_civoid iov_iter_bvec(struct iov_iter *i, unsigned int direction, 11778c2ecf20Sopenharmony_ci const struct bio_vec *bvec, unsigned long nr_segs, 11788c2ecf20Sopenharmony_ci size_t count) 11798c2ecf20Sopenharmony_ci{ 11808c2ecf20Sopenharmony_ci WARN_ON(direction & ~(READ | WRITE)); 11818c2ecf20Sopenharmony_ci i->type = ITER_BVEC | (direction & (READ | WRITE)); 11828c2ecf20Sopenharmony_ci i->bvec = bvec; 11838c2ecf20Sopenharmony_ci i->nr_segs = nr_segs; 11848c2ecf20Sopenharmony_ci i->iov_offset = 0; 11858c2ecf20Sopenharmony_ci i->count = count; 11868c2ecf20Sopenharmony_ci} 11878c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_bvec); 11888c2ecf20Sopenharmony_ci 11898c2ecf20Sopenharmony_civoid iov_iter_pipe(struct iov_iter *i, unsigned int direction, 11908c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe, 11918c2ecf20Sopenharmony_ci size_t count) 11928c2ecf20Sopenharmony_ci{ 11938c2ecf20Sopenharmony_ci BUG_ON(direction != READ); 11948c2ecf20Sopenharmony_ci WARN_ON(pipe_full(pipe->head, pipe->tail, pipe->ring_size)); 11958c2ecf20Sopenharmony_ci i->type = ITER_PIPE | READ; 11968c2ecf20Sopenharmony_ci i->pipe = pipe; 11978c2ecf20Sopenharmony_ci i->head = pipe->head; 11988c2ecf20Sopenharmony_ci i->iov_offset = 0; 11998c2ecf20Sopenharmony_ci i->count = count; 12008c2ecf20Sopenharmony_ci i->start_head = i->head; 12018c2ecf20Sopenharmony_ci} 12028c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_pipe); 12038c2ecf20Sopenharmony_ci 12048c2ecf20Sopenharmony_ci/** 12058c2ecf20Sopenharmony_ci * iov_iter_discard - Initialise an I/O iterator that discards data 12068c2ecf20Sopenharmony_ci * @i: The iterator to initialise. 12078c2ecf20Sopenharmony_ci * @direction: The direction of the transfer. 12088c2ecf20Sopenharmony_ci * @count: The size of the I/O buffer in bytes. 12098c2ecf20Sopenharmony_ci * 12108c2ecf20Sopenharmony_ci * Set up an I/O iterator that just discards everything that's written to it. 12118c2ecf20Sopenharmony_ci * It's only available as a READ iterator. 12128c2ecf20Sopenharmony_ci */ 12138c2ecf20Sopenharmony_civoid iov_iter_discard(struct iov_iter *i, unsigned int direction, size_t count) 12148c2ecf20Sopenharmony_ci{ 12158c2ecf20Sopenharmony_ci BUG_ON(direction != READ); 12168c2ecf20Sopenharmony_ci i->type = ITER_DISCARD | READ; 12178c2ecf20Sopenharmony_ci i->count = count; 12188c2ecf20Sopenharmony_ci i->iov_offset = 0; 12198c2ecf20Sopenharmony_ci} 12208c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_discard); 12218c2ecf20Sopenharmony_ci 12228c2ecf20Sopenharmony_ciunsigned long iov_iter_alignment(const struct iov_iter *i) 12238c2ecf20Sopenharmony_ci{ 12248c2ecf20Sopenharmony_ci unsigned long res = 0; 12258c2ecf20Sopenharmony_ci size_t size = i->count; 12268c2ecf20Sopenharmony_ci 12278c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 12288c2ecf20Sopenharmony_ci unsigned int p_mask = i->pipe->ring_size - 1; 12298c2ecf20Sopenharmony_ci 12308c2ecf20Sopenharmony_ci if (size && i->iov_offset && allocated(&i->pipe->bufs[i->head & p_mask])) 12318c2ecf20Sopenharmony_ci return size | i->iov_offset; 12328c2ecf20Sopenharmony_ci return size; 12338c2ecf20Sopenharmony_ci } 12348c2ecf20Sopenharmony_ci iterate_all_kinds(i, size, v, 12358c2ecf20Sopenharmony_ci (res |= (unsigned long)v.iov_base | v.iov_len, 0), 12368c2ecf20Sopenharmony_ci res |= v.bv_offset | v.bv_len, 12378c2ecf20Sopenharmony_ci res |= (unsigned long)v.iov_base | v.iov_len 12388c2ecf20Sopenharmony_ci ) 12398c2ecf20Sopenharmony_ci return res; 12408c2ecf20Sopenharmony_ci} 12418c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_alignment); 12428c2ecf20Sopenharmony_ci 12438c2ecf20Sopenharmony_ciunsigned long iov_iter_gap_alignment(const struct iov_iter *i) 12448c2ecf20Sopenharmony_ci{ 12458c2ecf20Sopenharmony_ci unsigned long res = 0; 12468c2ecf20Sopenharmony_ci size_t size = i->count; 12478c2ecf20Sopenharmony_ci 12488c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i) || iov_iter_is_discard(i))) { 12498c2ecf20Sopenharmony_ci WARN_ON(1); 12508c2ecf20Sopenharmony_ci return ~0U; 12518c2ecf20Sopenharmony_ci } 12528c2ecf20Sopenharmony_ci 12538c2ecf20Sopenharmony_ci iterate_all_kinds(i, size, v, 12548c2ecf20Sopenharmony_ci (res |= (!res ? 0 : (unsigned long)v.iov_base) | 12558c2ecf20Sopenharmony_ci (size != v.iov_len ? size : 0), 0), 12568c2ecf20Sopenharmony_ci (res |= (!res ? 0 : (unsigned long)v.bv_offset) | 12578c2ecf20Sopenharmony_ci (size != v.bv_len ? size : 0)), 12588c2ecf20Sopenharmony_ci (res |= (!res ? 0 : (unsigned long)v.iov_base) | 12598c2ecf20Sopenharmony_ci (size != v.iov_len ? size : 0)) 12608c2ecf20Sopenharmony_ci ); 12618c2ecf20Sopenharmony_ci return res; 12628c2ecf20Sopenharmony_ci} 12638c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_gap_alignment); 12648c2ecf20Sopenharmony_ci 12658c2ecf20Sopenharmony_cistatic inline ssize_t __pipe_get_pages(struct iov_iter *i, 12668c2ecf20Sopenharmony_ci size_t maxsize, 12678c2ecf20Sopenharmony_ci struct page **pages, 12688c2ecf20Sopenharmony_ci int iter_head, 12698c2ecf20Sopenharmony_ci size_t *start) 12708c2ecf20Sopenharmony_ci{ 12718c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 12728c2ecf20Sopenharmony_ci unsigned int p_mask = pipe->ring_size - 1; 12738c2ecf20Sopenharmony_ci ssize_t n = push_pipe(i, maxsize, &iter_head, start); 12748c2ecf20Sopenharmony_ci if (!n) 12758c2ecf20Sopenharmony_ci return -EFAULT; 12768c2ecf20Sopenharmony_ci 12778c2ecf20Sopenharmony_ci maxsize = n; 12788c2ecf20Sopenharmony_ci n += *start; 12798c2ecf20Sopenharmony_ci while (n > 0) { 12808c2ecf20Sopenharmony_ci get_page(*pages++ = pipe->bufs[iter_head & p_mask].page); 12818c2ecf20Sopenharmony_ci iter_head++; 12828c2ecf20Sopenharmony_ci n -= PAGE_SIZE; 12838c2ecf20Sopenharmony_ci } 12848c2ecf20Sopenharmony_ci 12858c2ecf20Sopenharmony_ci return maxsize; 12868c2ecf20Sopenharmony_ci} 12878c2ecf20Sopenharmony_ci 12888c2ecf20Sopenharmony_cistatic ssize_t pipe_get_pages(struct iov_iter *i, 12898c2ecf20Sopenharmony_ci struct page **pages, size_t maxsize, unsigned maxpages, 12908c2ecf20Sopenharmony_ci size_t *start) 12918c2ecf20Sopenharmony_ci{ 12928c2ecf20Sopenharmony_ci unsigned int iter_head, npages; 12938c2ecf20Sopenharmony_ci size_t capacity; 12948c2ecf20Sopenharmony_ci 12958c2ecf20Sopenharmony_ci if (!maxsize) 12968c2ecf20Sopenharmony_ci return 0; 12978c2ecf20Sopenharmony_ci 12988c2ecf20Sopenharmony_ci if (!sanity(i)) 12998c2ecf20Sopenharmony_ci return -EFAULT; 13008c2ecf20Sopenharmony_ci 13018c2ecf20Sopenharmony_ci data_start(i, &iter_head, start); 13028c2ecf20Sopenharmony_ci /* Amount of free space: some of this one + all after this one */ 13038c2ecf20Sopenharmony_ci npages = pipe_space_for_user(iter_head, i->pipe->tail, i->pipe); 13048c2ecf20Sopenharmony_ci capacity = min(npages, maxpages) * PAGE_SIZE - *start; 13058c2ecf20Sopenharmony_ci 13068c2ecf20Sopenharmony_ci return __pipe_get_pages(i, min(maxsize, capacity), pages, iter_head, start); 13078c2ecf20Sopenharmony_ci} 13088c2ecf20Sopenharmony_ci 13098c2ecf20Sopenharmony_cissize_t iov_iter_get_pages(struct iov_iter *i, 13108c2ecf20Sopenharmony_ci struct page **pages, size_t maxsize, unsigned maxpages, 13118c2ecf20Sopenharmony_ci size_t *start) 13128c2ecf20Sopenharmony_ci{ 13138c2ecf20Sopenharmony_ci if (maxsize > i->count) 13148c2ecf20Sopenharmony_ci maxsize = i->count; 13158c2ecf20Sopenharmony_ci 13168c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 13178c2ecf20Sopenharmony_ci return pipe_get_pages(i, pages, maxsize, maxpages, start); 13188c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) 13198c2ecf20Sopenharmony_ci return -EFAULT; 13208c2ecf20Sopenharmony_ci 13218c2ecf20Sopenharmony_ci iterate_all_kinds(i, maxsize, v, ({ 13228c2ecf20Sopenharmony_ci unsigned long addr = (unsigned long)v.iov_base; 13238c2ecf20Sopenharmony_ci size_t len = v.iov_len + (*start = addr & (PAGE_SIZE - 1)); 13248c2ecf20Sopenharmony_ci int n; 13258c2ecf20Sopenharmony_ci int res; 13268c2ecf20Sopenharmony_ci 13278c2ecf20Sopenharmony_ci if (len > maxpages * PAGE_SIZE) 13288c2ecf20Sopenharmony_ci len = maxpages * PAGE_SIZE; 13298c2ecf20Sopenharmony_ci addr &= ~(PAGE_SIZE - 1); 13308c2ecf20Sopenharmony_ci n = DIV_ROUND_UP(len, PAGE_SIZE); 13318c2ecf20Sopenharmony_ci res = get_user_pages_fast(addr, n, 13328c2ecf20Sopenharmony_ci iov_iter_rw(i) != WRITE ? FOLL_WRITE : 0, 13338c2ecf20Sopenharmony_ci pages); 13348c2ecf20Sopenharmony_ci if (unlikely(res <= 0)) 13358c2ecf20Sopenharmony_ci return res; 13368c2ecf20Sopenharmony_ci return (res == n ? len : res * PAGE_SIZE) - *start; 13378c2ecf20Sopenharmony_ci 0;}),({ 13388c2ecf20Sopenharmony_ci /* can't be more than PAGE_SIZE */ 13398c2ecf20Sopenharmony_ci *start = v.bv_offset; 13408c2ecf20Sopenharmony_ci get_page(*pages = v.bv_page); 13418c2ecf20Sopenharmony_ci return v.bv_len; 13428c2ecf20Sopenharmony_ci }),({ 13438c2ecf20Sopenharmony_ci return -EFAULT; 13448c2ecf20Sopenharmony_ci }) 13458c2ecf20Sopenharmony_ci ) 13468c2ecf20Sopenharmony_ci return 0; 13478c2ecf20Sopenharmony_ci} 13488c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_get_pages); 13498c2ecf20Sopenharmony_ci 13508c2ecf20Sopenharmony_cistatic struct page **get_pages_array(size_t n) 13518c2ecf20Sopenharmony_ci{ 13528c2ecf20Sopenharmony_ci return kvmalloc_array(n, sizeof(struct page *), GFP_KERNEL); 13538c2ecf20Sopenharmony_ci} 13548c2ecf20Sopenharmony_ci 13558c2ecf20Sopenharmony_cistatic ssize_t pipe_get_pages_alloc(struct iov_iter *i, 13568c2ecf20Sopenharmony_ci struct page ***pages, size_t maxsize, 13578c2ecf20Sopenharmony_ci size_t *start) 13588c2ecf20Sopenharmony_ci{ 13598c2ecf20Sopenharmony_ci struct page **p; 13608c2ecf20Sopenharmony_ci unsigned int iter_head, npages; 13618c2ecf20Sopenharmony_ci ssize_t n; 13628c2ecf20Sopenharmony_ci 13638c2ecf20Sopenharmony_ci if (!maxsize) 13648c2ecf20Sopenharmony_ci return 0; 13658c2ecf20Sopenharmony_ci 13668c2ecf20Sopenharmony_ci if (!sanity(i)) 13678c2ecf20Sopenharmony_ci return -EFAULT; 13688c2ecf20Sopenharmony_ci 13698c2ecf20Sopenharmony_ci data_start(i, &iter_head, start); 13708c2ecf20Sopenharmony_ci /* Amount of free space: some of this one + all after this one */ 13718c2ecf20Sopenharmony_ci npages = pipe_space_for_user(iter_head, i->pipe->tail, i->pipe); 13728c2ecf20Sopenharmony_ci n = npages * PAGE_SIZE - *start; 13738c2ecf20Sopenharmony_ci if (maxsize > n) 13748c2ecf20Sopenharmony_ci maxsize = n; 13758c2ecf20Sopenharmony_ci else 13768c2ecf20Sopenharmony_ci npages = DIV_ROUND_UP(maxsize + *start, PAGE_SIZE); 13778c2ecf20Sopenharmony_ci p = get_pages_array(npages); 13788c2ecf20Sopenharmony_ci if (!p) 13798c2ecf20Sopenharmony_ci return -ENOMEM; 13808c2ecf20Sopenharmony_ci n = __pipe_get_pages(i, maxsize, p, iter_head, start); 13818c2ecf20Sopenharmony_ci if (n > 0) 13828c2ecf20Sopenharmony_ci *pages = p; 13838c2ecf20Sopenharmony_ci else 13848c2ecf20Sopenharmony_ci kvfree(p); 13858c2ecf20Sopenharmony_ci return n; 13868c2ecf20Sopenharmony_ci} 13878c2ecf20Sopenharmony_ci 13888c2ecf20Sopenharmony_cissize_t iov_iter_get_pages_alloc(struct iov_iter *i, 13898c2ecf20Sopenharmony_ci struct page ***pages, size_t maxsize, 13908c2ecf20Sopenharmony_ci size_t *start) 13918c2ecf20Sopenharmony_ci{ 13928c2ecf20Sopenharmony_ci struct page **p; 13938c2ecf20Sopenharmony_ci 13948c2ecf20Sopenharmony_ci if (maxsize > i->count) 13958c2ecf20Sopenharmony_ci maxsize = i->count; 13968c2ecf20Sopenharmony_ci 13978c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 13988c2ecf20Sopenharmony_ci return pipe_get_pages_alloc(i, pages, maxsize, start); 13998c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) 14008c2ecf20Sopenharmony_ci return -EFAULT; 14018c2ecf20Sopenharmony_ci 14028c2ecf20Sopenharmony_ci iterate_all_kinds(i, maxsize, v, ({ 14038c2ecf20Sopenharmony_ci unsigned long addr = (unsigned long)v.iov_base; 14048c2ecf20Sopenharmony_ci size_t len = v.iov_len + (*start = addr & (PAGE_SIZE - 1)); 14058c2ecf20Sopenharmony_ci int n; 14068c2ecf20Sopenharmony_ci int res; 14078c2ecf20Sopenharmony_ci 14088c2ecf20Sopenharmony_ci addr &= ~(PAGE_SIZE - 1); 14098c2ecf20Sopenharmony_ci n = DIV_ROUND_UP(len, PAGE_SIZE); 14108c2ecf20Sopenharmony_ci p = get_pages_array(n); 14118c2ecf20Sopenharmony_ci if (!p) 14128c2ecf20Sopenharmony_ci return -ENOMEM; 14138c2ecf20Sopenharmony_ci res = get_user_pages_fast(addr, n, 14148c2ecf20Sopenharmony_ci iov_iter_rw(i) != WRITE ? FOLL_WRITE : 0, p); 14158c2ecf20Sopenharmony_ci if (unlikely(res <= 0)) { 14168c2ecf20Sopenharmony_ci kvfree(p); 14178c2ecf20Sopenharmony_ci *pages = NULL; 14188c2ecf20Sopenharmony_ci return res; 14198c2ecf20Sopenharmony_ci } 14208c2ecf20Sopenharmony_ci *pages = p; 14218c2ecf20Sopenharmony_ci return (res == n ? len : res * PAGE_SIZE) - *start; 14228c2ecf20Sopenharmony_ci 0;}),({ 14238c2ecf20Sopenharmony_ci /* can't be more than PAGE_SIZE */ 14248c2ecf20Sopenharmony_ci *start = v.bv_offset; 14258c2ecf20Sopenharmony_ci *pages = p = get_pages_array(1); 14268c2ecf20Sopenharmony_ci if (!p) 14278c2ecf20Sopenharmony_ci return -ENOMEM; 14288c2ecf20Sopenharmony_ci get_page(*p = v.bv_page); 14298c2ecf20Sopenharmony_ci return v.bv_len; 14308c2ecf20Sopenharmony_ci }),({ 14318c2ecf20Sopenharmony_ci return -EFAULT; 14328c2ecf20Sopenharmony_ci }) 14338c2ecf20Sopenharmony_ci ) 14348c2ecf20Sopenharmony_ci return 0; 14358c2ecf20Sopenharmony_ci} 14368c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_get_pages_alloc); 14378c2ecf20Sopenharmony_ci 14388c2ecf20Sopenharmony_cisize_t csum_and_copy_from_iter(void *addr, size_t bytes, __wsum *csum, 14398c2ecf20Sopenharmony_ci struct iov_iter *i) 14408c2ecf20Sopenharmony_ci{ 14418c2ecf20Sopenharmony_ci char *to = addr; 14428c2ecf20Sopenharmony_ci __wsum sum, next; 14438c2ecf20Sopenharmony_ci size_t off = 0; 14448c2ecf20Sopenharmony_ci sum = *csum; 14458c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i) || iov_iter_is_discard(i))) { 14468c2ecf20Sopenharmony_ci WARN_ON(1); 14478c2ecf20Sopenharmony_ci return 0; 14488c2ecf20Sopenharmony_ci } 14498c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, ({ 14508c2ecf20Sopenharmony_ci next = csum_and_copy_from_user(v.iov_base, 14518c2ecf20Sopenharmony_ci (to += v.iov_len) - v.iov_len, 14528c2ecf20Sopenharmony_ci v.iov_len); 14538c2ecf20Sopenharmony_ci if (next) { 14548c2ecf20Sopenharmony_ci sum = csum_block_add(sum, next, off); 14558c2ecf20Sopenharmony_ci off += v.iov_len; 14568c2ecf20Sopenharmony_ci } 14578c2ecf20Sopenharmony_ci next ? 0 : v.iov_len; 14588c2ecf20Sopenharmony_ci }), ({ 14598c2ecf20Sopenharmony_ci char *p = kmap_atomic(v.bv_page); 14608c2ecf20Sopenharmony_ci sum = csum_and_memcpy((to += v.bv_len) - v.bv_len, 14618c2ecf20Sopenharmony_ci p + v.bv_offset, v.bv_len, 14628c2ecf20Sopenharmony_ci sum, off); 14638c2ecf20Sopenharmony_ci kunmap_atomic(p); 14648c2ecf20Sopenharmony_ci off += v.bv_len; 14658c2ecf20Sopenharmony_ci }),({ 14668c2ecf20Sopenharmony_ci sum = csum_and_memcpy((to += v.iov_len) - v.iov_len, 14678c2ecf20Sopenharmony_ci v.iov_base, v.iov_len, 14688c2ecf20Sopenharmony_ci sum, off); 14698c2ecf20Sopenharmony_ci off += v.iov_len; 14708c2ecf20Sopenharmony_ci }) 14718c2ecf20Sopenharmony_ci ) 14728c2ecf20Sopenharmony_ci *csum = sum; 14738c2ecf20Sopenharmony_ci return bytes; 14748c2ecf20Sopenharmony_ci} 14758c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_and_copy_from_iter); 14768c2ecf20Sopenharmony_ci 14778c2ecf20Sopenharmony_cibool csum_and_copy_from_iter_full(void *addr, size_t bytes, __wsum *csum, 14788c2ecf20Sopenharmony_ci struct iov_iter *i) 14798c2ecf20Sopenharmony_ci{ 14808c2ecf20Sopenharmony_ci char *to = addr; 14818c2ecf20Sopenharmony_ci __wsum sum, next; 14828c2ecf20Sopenharmony_ci size_t off = 0; 14838c2ecf20Sopenharmony_ci sum = *csum; 14848c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i) || iov_iter_is_discard(i))) { 14858c2ecf20Sopenharmony_ci WARN_ON(1); 14868c2ecf20Sopenharmony_ci return false; 14878c2ecf20Sopenharmony_ci } 14888c2ecf20Sopenharmony_ci if (unlikely(i->count < bytes)) 14898c2ecf20Sopenharmony_ci return false; 14908c2ecf20Sopenharmony_ci iterate_all_kinds(i, bytes, v, ({ 14918c2ecf20Sopenharmony_ci next = csum_and_copy_from_user(v.iov_base, 14928c2ecf20Sopenharmony_ci (to += v.iov_len) - v.iov_len, 14938c2ecf20Sopenharmony_ci v.iov_len); 14948c2ecf20Sopenharmony_ci if (!next) 14958c2ecf20Sopenharmony_ci return false; 14968c2ecf20Sopenharmony_ci sum = csum_block_add(sum, next, off); 14978c2ecf20Sopenharmony_ci off += v.iov_len; 14988c2ecf20Sopenharmony_ci 0; 14998c2ecf20Sopenharmony_ci }), ({ 15008c2ecf20Sopenharmony_ci char *p = kmap_atomic(v.bv_page); 15018c2ecf20Sopenharmony_ci sum = csum_and_memcpy((to += v.bv_len) - v.bv_len, 15028c2ecf20Sopenharmony_ci p + v.bv_offset, v.bv_len, 15038c2ecf20Sopenharmony_ci sum, off); 15048c2ecf20Sopenharmony_ci kunmap_atomic(p); 15058c2ecf20Sopenharmony_ci off += v.bv_len; 15068c2ecf20Sopenharmony_ci }),({ 15078c2ecf20Sopenharmony_ci sum = csum_and_memcpy((to += v.iov_len) - v.iov_len, 15088c2ecf20Sopenharmony_ci v.iov_base, v.iov_len, 15098c2ecf20Sopenharmony_ci sum, off); 15108c2ecf20Sopenharmony_ci off += v.iov_len; 15118c2ecf20Sopenharmony_ci }) 15128c2ecf20Sopenharmony_ci ) 15138c2ecf20Sopenharmony_ci *csum = sum; 15148c2ecf20Sopenharmony_ci iov_iter_advance(i, bytes); 15158c2ecf20Sopenharmony_ci return true; 15168c2ecf20Sopenharmony_ci} 15178c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_and_copy_from_iter_full); 15188c2ecf20Sopenharmony_ci 15198c2ecf20Sopenharmony_cisize_t csum_and_copy_to_iter(const void *addr, size_t bytes, void *_csstate, 15208c2ecf20Sopenharmony_ci struct iov_iter *i) 15218c2ecf20Sopenharmony_ci{ 15228c2ecf20Sopenharmony_ci struct csum_state *csstate = _csstate; 15238c2ecf20Sopenharmony_ci const char *from = addr; 15248c2ecf20Sopenharmony_ci __wsum sum, next; 15258c2ecf20Sopenharmony_ci size_t off; 15268c2ecf20Sopenharmony_ci 15278c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) 15288c2ecf20Sopenharmony_ci return csum_and_copy_to_pipe_iter(addr, bytes, _csstate, i); 15298c2ecf20Sopenharmony_ci 15308c2ecf20Sopenharmony_ci sum = csstate->csum; 15318c2ecf20Sopenharmony_ci off = csstate->off; 15328c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) { 15338c2ecf20Sopenharmony_ci WARN_ON(1); /* for now */ 15348c2ecf20Sopenharmony_ci return 0; 15358c2ecf20Sopenharmony_ci } 15368c2ecf20Sopenharmony_ci iterate_and_advance(i, bytes, v, ({ 15378c2ecf20Sopenharmony_ci next = csum_and_copy_to_user((from += v.iov_len) - v.iov_len, 15388c2ecf20Sopenharmony_ci v.iov_base, 15398c2ecf20Sopenharmony_ci v.iov_len); 15408c2ecf20Sopenharmony_ci if (next) { 15418c2ecf20Sopenharmony_ci sum = csum_block_add(sum, next, off); 15428c2ecf20Sopenharmony_ci off += v.iov_len; 15438c2ecf20Sopenharmony_ci } 15448c2ecf20Sopenharmony_ci next ? 0 : v.iov_len; 15458c2ecf20Sopenharmony_ci }), ({ 15468c2ecf20Sopenharmony_ci char *p = kmap_atomic(v.bv_page); 15478c2ecf20Sopenharmony_ci sum = csum_and_memcpy(p + v.bv_offset, 15488c2ecf20Sopenharmony_ci (from += v.bv_len) - v.bv_len, 15498c2ecf20Sopenharmony_ci v.bv_len, sum, off); 15508c2ecf20Sopenharmony_ci kunmap_atomic(p); 15518c2ecf20Sopenharmony_ci off += v.bv_len; 15528c2ecf20Sopenharmony_ci }),({ 15538c2ecf20Sopenharmony_ci sum = csum_and_memcpy(v.iov_base, 15548c2ecf20Sopenharmony_ci (from += v.iov_len) - v.iov_len, 15558c2ecf20Sopenharmony_ci v.iov_len, sum, off); 15568c2ecf20Sopenharmony_ci off += v.iov_len; 15578c2ecf20Sopenharmony_ci }) 15588c2ecf20Sopenharmony_ci ) 15598c2ecf20Sopenharmony_ci csstate->csum = sum; 15608c2ecf20Sopenharmony_ci csstate->off = off; 15618c2ecf20Sopenharmony_ci return bytes; 15628c2ecf20Sopenharmony_ci} 15638c2ecf20Sopenharmony_ciEXPORT_SYMBOL(csum_and_copy_to_iter); 15648c2ecf20Sopenharmony_ci 15658c2ecf20Sopenharmony_cisize_t hash_and_copy_to_iter(const void *addr, size_t bytes, void *hashp, 15668c2ecf20Sopenharmony_ci struct iov_iter *i) 15678c2ecf20Sopenharmony_ci{ 15688c2ecf20Sopenharmony_ci#ifdef CONFIG_CRYPTO_HASH 15698c2ecf20Sopenharmony_ci struct ahash_request *hash = hashp; 15708c2ecf20Sopenharmony_ci struct scatterlist sg; 15718c2ecf20Sopenharmony_ci size_t copied; 15728c2ecf20Sopenharmony_ci 15738c2ecf20Sopenharmony_ci copied = copy_to_iter(addr, bytes, i); 15748c2ecf20Sopenharmony_ci sg_init_one(&sg, addr, copied); 15758c2ecf20Sopenharmony_ci ahash_request_set_crypt(hash, &sg, NULL, copied); 15768c2ecf20Sopenharmony_ci crypto_ahash_update(hash); 15778c2ecf20Sopenharmony_ci return copied; 15788c2ecf20Sopenharmony_ci#else 15798c2ecf20Sopenharmony_ci return 0; 15808c2ecf20Sopenharmony_ci#endif 15818c2ecf20Sopenharmony_ci} 15828c2ecf20Sopenharmony_ciEXPORT_SYMBOL(hash_and_copy_to_iter); 15838c2ecf20Sopenharmony_ci 15848c2ecf20Sopenharmony_ciint iov_iter_npages(const struct iov_iter *i, int maxpages) 15858c2ecf20Sopenharmony_ci{ 15868c2ecf20Sopenharmony_ci size_t size = i->count; 15878c2ecf20Sopenharmony_ci int npages = 0; 15888c2ecf20Sopenharmony_ci 15898c2ecf20Sopenharmony_ci if (!size) 15908c2ecf20Sopenharmony_ci return 0; 15918c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(i))) 15928c2ecf20Sopenharmony_ci return 0; 15938c2ecf20Sopenharmony_ci 15948c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(i))) { 15958c2ecf20Sopenharmony_ci struct pipe_inode_info *pipe = i->pipe; 15968c2ecf20Sopenharmony_ci unsigned int iter_head; 15978c2ecf20Sopenharmony_ci size_t off; 15988c2ecf20Sopenharmony_ci 15998c2ecf20Sopenharmony_ci if (!sanity(i)) 16008c2ecf20Sopenharmony_ci return 0; 16018c2ecf20Sopenharmony_ci 16028c2ecf20Sopenharmony_ci data_start(i, &iter_head, &off); 16038c2ecf20Sopenharmony_ci /* some of this one + all after this one */ 16048c2ecf20Sopenharmony_ci npages = pipe_space_for_user(iter_head, pipe->tail, pipe); 16058c2ecf20Sopenharmony_ci if (npages >= maxpages) 16068c2ecf20Sopenharmony_ci return maxpages; 16078c2ecf20Sopenharmony_ci } else iterate_all_kinds(i, size, v, ({ 16088c2ecf20Sopenharmony_ci unsigned long p = (unsigned long)v.iov_base; 16098c2ecf20Sopenharmony_ci npages += DIV_ROUND_UP(p + v.iov_len, PAGE_SIZE) 16108c2ecf20Sopenharmony_ci - p / PAGE_SIZE; 16118c2ecf20Sopenharmony_ci if (npages >= maxpages) 16128c2ecf20Sopenharmony_ci return maxpages; 16138c2ecf20Sopenharmony_ci 0;}),({ 16148c2ecf20Sopenharmony_ci npages++; 16158c2ecf20Sopenharmony_ci if (npages >= maxpages) 16168c2ecf20Sopenharmony_ci return maxpages; 16178c2ecf20Sopenharmony_ci }),({ 16188c2ecf20Sopenharmony_ci unsigned long p = (unsigned long)v.iov_base; 16198c2ecf20Sopenharmony_ci npages += DIV_ROUND_UP(p + v.iov_len, PAGE_SIZE) 16208c2ecf20Sopenharmony_ci - p / PAGE_SIZE; 16218c2ecf20Sopenharmony_ci if (npages >= maxpages) 16228c2ecf20Sopenharmony_ci return maxpages; 16238c2ecf20Sopenharmony_ci }) 16248c2ecf20Sopenharmony_ci ) 16258c2ecf20Sopenharmony_ci return npages; 16268c2ecf20Sopenharmony_ci} 16278c2ecf20Sopenharmony_ciEXPORT_SYMBOL(iov_iter_npages); 16288c2ecf20Sopenharmony_ci 16298c2ecf20Sopenharmony_ciconst void *dup_iter(struct iov_iter *new, struct iov_iter *old, gfp_t flags) 16308c2ecf20Sopenharmony_ci{ 16318c2ecf20Sopenharmony_ci *new = *old; 16328c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_pipe(new))) { 16338c2ecf20Sopenharmony_ci WARN_ON(1); 16348c2ecf20Sopenharmony_ci return NULL; 16358c2ecf20Sopenharmony_ci } 16368c2ecf20Sopenharmony_ci if (unlikely(iov_iter_is_discard(new))) 16378c2ecf20Sopenharmony_ci return NULL; 16388c2ecf20Sopenharmony_ci if (iov_iter_is_bvec(new)) 16398c2ecf20Sopenharmony_ci return new->bvec = kmemdup(new->bvec, 16408c2ecf20Sopenharmony_ci new->nr_segs * sizeof(struct bio_vec), 16418c2ecf20Sopenharmony_ci flags); 16428c2ecf20Sopenharmony_ci else 16438c2ecf20Sopenharmony_ci /* iovec and kvec have identical layout */ 16448c2ecf20Sopenharmony_ci return new->iov = kmemdup(new->iov, 16458c2ecf20Sopenharmony_ci new->nr_segs * sizeof(struct iovec), 16468c2ecf20Sopenharmony_ci flags); 16478c2ecf20Sopenharmony_ci} 16488c2ecf20Sopenharmony_ciEXPORT_SYMBOL(dup_iter); 16498c2ecf20Sopenharmony_ci 16508c2ecf20Sopenharmony_cistatic int copy_compat_iovec_from_user(struct iovec *iov, 16518c2ecf20Sopenharmony_ci const struct iovec __user *uvec, unsigned long nr_segs) 16528c2ecf20Sopenharmony_ci{ 16538c2ecf20Sopenharmony_ci const struct compat_iovec __user *uiov = 16548c2ecf20Sopenharmony_ci (const struct compat_iovec __user *)uvec; 16558c2ecf20Sopenharmony_ci int ret = -EFAULT, i; 16568c2ecf20Sopenharmony_ci 16578c2ecf20Sopenharmony_ci if (!user_access_begin(uiov, nr_segs * sizeof(*uiov))) 16588c2ecf20Sopenharmony_ci return -EFAULT; 16598c2ecf20Sopenharmony_ci 16608c2ecf20Sopenharmony_ci for (i = 0; i < nr_segs; i++) { 16618c2ecf20Sopenharmony_ci compat_uptr_t buf; 16628c2ecf20Sopenharmony_ci compat_ssize_t len; 16638c2ecf20Sopenharmony_ci 16648c2ecf20Sopenharmony_ci unsafe_get_user(len, &uiov[i].iov_len, uaccess_end); 16658c2ecf20Sopenharmony_ci unsafe_get_user(buf, &uiov[i].iov_base, uaccess_end); 16668c2ecf20Sopenharmony_ci 16678c2ecf20Sopenharmony_ci /* check for compat_size_t not fitting in compat_ssize_t .. */ 16688c2ecf20Sopenharmony_ci if (len < 0) { 16698c2ecf20Sopenharmony_ci ret = -EINVAL; 16708c2ecf20Sopenharmony_ci goto uaccess_end; 16718c2ecf20Sopenharmony_ci } 16728c2ecf20Sopenharmony_ci iov[i].iov_base = compat_ptr(buf); 16738c2ecf20Sopenharmony_ci iov[i].iov_len = len; 16748c2ecf20Sopenharmony_ci } 16758c2ecf20Sopenharmony_ci 16768c2ecf20Sopenharmony_ci ret = 0; 16778c2ecf20Sopenharmony_ciuaccess_end: 16788c2ecf20Sopenharmony_ci user_access_end(); 16798c2ecf20Sopenharmony_ci return ret; 16808c2ecf20Sopenharmony_ci} 16818c2ecf20Sopenharmony_ci 16828c2ecf20Sopenharmony_cistatic int copy_iovec_from_user(struct iovec *iov, 16838c2ecf20Sopenharmony_ci const struct iovec __user *uvec, unsigned long nr_segs) 16848c2ecf20Sopenharmony_ci{ 16858c2ecf20Sopenharmony_ci unsigned long seg; 16868c2ecf20Sopenharmony_ci 16878c2ecf20Sopenharmony_ci if (copy_from_user(iov, uvec, nr_segs * sizeof(*uvec))) 16888c2ecf20Sopenharmony_ci return -EFAULT; 16898c2ecf20Sopenharmony_ci for (seg = 0; seg < nr_segs; seg++) { 16908c2ecf20Sopenharmony_ci if ((ssize_t)iov[seg].iov_len < 0) 16918c2ecf20Sopenharmony_ci return -EINVAL; 16928c2ecf20Sopenharmony_ci } 16938c2ecf20Sopenharmony_ci 16948c2ecf20Sopenharmony_ci return 0; 16958c2ecf20Sopenharmony_ci} 16968c2ecf20Sopenharmony_ci 16978c2ecf20Sopenharmony_cistruct iovec *iovec_from_user(const struct iovec __user *uvec, 16988c2ecf20Sopenharmony_ci unsigned long nr_segs, unsigned long fast_segs, 16998c2ecf20Sopenharmony_ci struct iovec *fast_iov, bool compat) 17008c2ecf20Sopenharmony_ci{ 17018c2ecf20Sopenharmony_ci struct iovec *iov = fast_iov; 17028c2ecf20Sopenharmony_ci int ret; 17038c2ecf20Sopenharmony_ci 17048c2ecf20Sopenharmony_ci /* 17058c2ecf20Sopenharmony_ci * SuS says "The readv() function *may* fail if the iovcnt argument was 17068c2ecf20Sopenharmony_ci * less than or equal to 0, or greater than {IOV_MAX}. Linux has 17078c2ecf20Sopenharmony_ci * traditionally returned zero for zero segments, so... 17088c2ecf20Sopenharmony_ci */ 17098c2ecf20Sopenharmony_ci if (nr_segs == 0) 17108c2ecf20Sopenharmony_ci return iov; 17118c2ecf20Sopenharmony_ci if (nr_segs > UIO_MAXIOV) 17128c2ecf20Sopenharmony_ci return ERR_PTR(-EINVAL); 17138c2ecf20Sopenharmony_ci if (nr_segs > fast_segs) { 17148c2ecf20Sopenharmony_ci iov = kmalloc_array(nr_segs, sizeof(struct iovec), GFP_KERNEL); 17158c2ecf20Sopenharmony_ci if (!iov) 17168c2ecf20Sopenharmony_ci return ERR_PTR(-ENOMEM); 17178c2ecf20Sopenharmony_ci } 17188c2ecf20Sopenharmony_ci 17198c2ecf20Sopenharmony_ci if (compat) 17208c2ecf20Sopenharmony_ci ret = copy_compat_iovec_from_user(iov, uvec, nr_segs); 17218c2ecf20Sopenharmony_ci else 17228c2ecf20Sopenharmony_ci ret = copy_iovec_from_user(iov, uvec, nr_segs); 17238c2ecf20Sopenharmony_ci if (ret) { 17248c2ecf20Sopenharmony_ci if (iov != fast_iov) 17258c2ecf20Sopenharmony_ci kfree(iov); 17268c2ecf20Sopenharmony_ci return ERR_PTR(ret); 17278c2ecf20Sopenharmony_ci } 17288c2ecf20Sopenharmony_ci 17298c2ecf20Sopenharmony_ci return iov; 17308c2ecf20Sopenharmony_ci} 17318c2ecf20Sopenharmony_ci 17328c2ecf20Sopenharmony_cissize_t __import_iovec(int type, const struct iovec __user *uvec, 17338c2ecf20Sopenharmony_ci unsigned nr_segs, unsigned fast_segs, struct iovec **iovp, 17348c2ecf20Sopenharmony_ci struct iov_iter *i, bool compat) 17358c2ecf20Sopenharmony_ci{ 17368c2ecf20Sopenharmony_ci ssize_t total_len = 0; 17378c2ecf20Sopenharmony_ci unsigned long seg; 17388c2ecf20Sopenharmony_ci struct iovec *iov; 17398c2ecf20Sopenharmony_ci 17408c2ecf20Sopenharmony_ci iov = iovec_from_user(uvec, nr_segs, fast_segs, *iovp, compat); 17418c2ecf20Sopenharmony_ci if (IS_ERR(iov)) { 17428c2ecf20Sopenharmony_ci *iovp = NULL; 17438c2ecf20Sopenharmony_ci return PTR_ERR(iov); 17448c2ecf20Sopenharmony_ci } 17458c2ecf20Sopenharmony_ci 17468c2ecf20Sopenharmony_ci /* 17478c2ecf20Sopenharmony_ci * According to the Single Unix Specification we should return EINVAL if 17488c2ecf20Sopenharmony_ci * an element length is < 0 when cast to ssize_t or if the total length 17498c2ecf20Sopenharmony_ci * would overflow the ssize_t return value of the system call. 17508c2ecf20Sopenharmony_ci * 17518c2ecf20Sopenharmony_ci * Linux caps all read/write calls to MAX_RW_COUNT, and avoids the 17528c2ecf20Sopenharmony_ci * overflow case. 17538c2ecf20Sopenharmony_ci */ 17548c2ecf20Sopenharmony_ci for (seg = 0; seg < nr_segs; seg++) { 17558c2ecf20Sopenharmony_ci ssize_t len = (ssize_t)iov[seg].iov_len; 17568c2ecf20Sopenharmony_ci 17578c2ecf20Sopenharmony_ci if (!access_ok(iov[seg].iov_base, len)) { 17588c2ecf20Sopenharmony_ci if (iov != *iovp) 17598c2ecf20Sopenharmony_ci kfree(iov); 17608c2ecf20Sopenharmony_ci *iovp = NULL; 17618c2ecf20Sopenharmony_ci return -EFAULT; 17628c2ecf20Sopenharmony_ci } 17638c2ecf20Sopenharmony_ci 17648c2ecf20Sopenharmony_ci if (len > MAX_RW_COUNT - total_len) { 17658c2ecf20Sopenharmony_ci len = MAX_RW_COUNT - total_len; 17668c2ecf20Sopenharmony_ci iov[seg].iov_len = len; 17678c2ecf20Sopenharmony_ci } 17688c2ecf20Sopenharmony_ci total_len += len; 17698c2ecf20Sopenharmony_ci } 17708c2ecf20Sopenharmony_ci 17718c2ecf20Sopenharmony_ci iov_iter_init(i, type, iov, nr_segs, total_len); 17728c2ecf20Sopenharmony_ci if (iov == *iovp) 17738c2ecf20Sopenharmony_ci *iovp = NULL; 17748c2ecf20Sopenharmony_ci else 17758c2ecf20Sopenharmony_ci *iovp = iov; 17768c2ecf20Sopenharmony_ci return total_len; 17778c2ecf20Sopenharmony_ci} 17788c2ecf20Sopenharmony_ci 17798c2ecf20Sopenharmony_ci/** 17808c2ecf20Sopenharmony_ci * import_iovec() - Copy an array of &struct iovec from userspace 17818c2ecf20Sopenharmony_ci * into the kernel, check that it is valid, and initialize a new 17828c2ecf20Sopenharmony_ci * &struct iov_iter iterator to access it. 17838c2ecf20Sopenharmony_ci * 17848c2ecf20Sopenharmony_ci * @type: One of %READ or %WRITE. 17858c2ecf20Sopenharmony_ci * @uvec: Pointer to the userspace array. 17868c2ecf20Sopenharmony_ci * @nr_segs: Number of elements in userspace array. 17878c2ecf20Sopenharmony_ci * @fast_segs: Number of elements in @iov. 17888c2ecf20Sopenharmony_ci * @iovp: (input and output parameter) Pointer to pointer to (usually small 17898c2ecf20Sopenharmony_ci * on-stack) kernel array. 17908c2ecf20Sopenharmony_ci * @i: Pointer to iterator that will be initialized on success. 17918c2ecf20Sopenharmony_ci * 17928c2ecf20Sopenharmony_ci * If the array pointed to by *@iov is large enough to hold all @nr_segs, 17938c2ecf20Sopenharmony_ci * then this function places %NULL in *@iov on return. Otherwise, a new 17948c2ecf20Sopenharmony_ci * array will be allocated and the result placed in *@iov. This means that 17958c2ecf20Sopenharmony_ci * the caller may call kfree() on *@iov regardless of whether the small 17968c2ecf20Sopenharmony_ci * on-stack array was used or not (and regardless of whether this function 17978c2ecf20Sopenharmony_ci * returns an error or not). 17988c2ecf20Sopenharmony_ci * 17998c2ecf20Sopenharmony_ci * Return: Negative error code on error, bytes imported on success 18008c2ecf20Sopenharmony_ci */ 18018c2ecf20Sopenharmony_cissize_t import_iovec(int type, const struct iovec __user *uvec, 18028c2ecf20Sopenharmony_ci unsigned nr_segs, unsigned fast_segs, 18038c2ecf20Sopenharmony_ci struct iovec **iovp, struct iov_iter *i) 18048c2ecf20Sopenharmony_ci{ 18058c2ecf20Sopenharmony_ci return __import_iovec(type, uvec, nr_segs, fast_segs, iovp, i, 18068c2ecf20Sopenharmony_ci in_compat_syscall()); 18078c2ecf20Sopenharmony_ci} 18088c2ecf20Sopenharmony_ciEXPORT_SYMBOL(import_iovec); 18098c2ecf20Sopenharmony_ci 18108c2ecf20Sopenharmony_ciint import_single_range(int rw, void __user *buf, size_t len, 18118c2ecf20Sopenharmony_ci struct iovec *iov, struct iov_iter *i) 18128c2ecf20Sopenharmony_ci{ 18138c2ecf20Sopenharmony_ci if (len > MAX_RW_COUNT) 18148c2ecf20Sopenharmony_ci len = MAX_RW_COUNT; 18158c2ecf20Sopenharmony_ci if (unlikely(!access_ok(buf, len))) 18168c2ecf20Sopenharmony_ci return -EFAULT; 18178c2ecf20Sopenharmony_ci 18188c2ecf20Sopenharmony_ci iov->iov_base = buf; 18198c2ecf20Sopenharmony_ci iov->iov_len = len; 18208c2ecf20Sopenharmony_ci iov_iter_init(i, rw, iov, 1, len); 18218c2ecf20Sopenharmony_ci return 0; 18228c2ecf20Sopenharmony_ci} 18238c2ecf20Sopenharmony_ciEXPORT_SYMBOL(import_single_range); 18248c2ecf20Sopenharmony_ci 18258c2ecf20Sopenharmony_ci/** 18268c2ecf20Sopenharmony_ci * iov_iter_restore() - Restore a &struct iov_iter to the same state as when 18278c2ecf20Sopenharmony_ci * iov_iter_save_state() was called. 18288c2ecf20Sopenharmony_ci * 18298c2ecf20Sopenharmony_ci * @i: &struct iov_iter to restore 18308c2ecf20Sopenharmony_ci * @state: state to restore from 18318c2ecf20Sopenharmony_ci * 18328c2ecf20Sopenharmony_ci * Used after iov_iter_save_state() to bring restore @i, if operations may 18338c2ecf20Sopenharmony_ci * have advanced it. 18348c2ecf20Sopenharmony_ci * 18358c2ecf20Sopenharmony_ci * Note: only works on ITER_IOVEC, ITER_BVEC, and ITER_KVEC 18368c2ecf20Sopenharmony_ci */ 18378c2ecf20Sopenharmony_civoid iov_iter_restore(struct iov_iter *i, struct iov_iter_state *state) 18388c2ecf20Sopenharmony_ci{ 18398c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!iov_iter_is_bvec(i) && !iter_is_iovec(i)) && 18408c2ecf20Sopenharmony_ci !iov_iter_is_kvec(i)) 18418c2ecf20Sopenharmony_ci return; 18428c2ecf20Sopenharmony_ci i->iov_offset = state->iov_offset; 18438c2ecf20Sopenharmony_ci i->count = state->count; 18448c2ecf20Sopenharmony_ci /* 18458c2ecf20Sopenharmony_ci * For the *vec iters, nr_segs + iov is constant - if we increment 18468c2ecf20Sopenharmony_ci * the vec, then we also decrement the nr_segs count. Hence we don't 18478c2ecf20Sopenharmony_ci * need to track both of these, just one is enough and we can deduct 18488c2ecf20Sopenharmony_ci * the other from that. ITER_KVEC and ITER_IOVEC are the same struct 18498c2ecf20Sopenharmony_ci * size, so we can just increment the iov pointer as they are unionzed. 18508c2ecf20Sopenharmony_ci * ITER_BVEC _may_ be the same size on some archs, but on others it is 18518c2ecf20Sopenharmony_ci * not. Be safe and handle it separately. 18528c2ecf20Sopenharmony_ci */ 18538c2ecf20Sopenharmony_ci BUILD_BUG_ON(sizeof(struct iovec) != sizeof(struct kvec)); 18548c2ecf20Sopenharmony_ci if (iov_iter_is_bvec(i)) 18558c2ecf20Sopenharmony_ci i->bvec -= state->nr_segs - i->nr_segs; 18568c2ecf20Sopenharmony_ci else 18578c2ecf20Sopenharmony_ci i->iov -= state->nr_segs - i->nr_segs; 18588c2ecf20Sopenharmony_ci i->nr_segs = state->nr_segs; 18598c2ecf20Sopenharmony_ci} 1860