18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * (c) 2017 Stefano Stabellini <stefano@aporeto.com> 48c2ecf20Sopenharmony_ci */ 58c2ecf20Sopenharmony_ci 68c2ecf20Sopenharmony_ci#include <linux/module.h> 78c2ecf20Sopenharmony_ci#include <linux/net.h> 88c2ecf20Sopenharmony_ci#include <linux/socket.h> 98c2ecf20Sopenharmony_ci 108c2ecf20Sopenharmony_ci#include <net/sock.h> 118c2ecf20Sopenharmony_ci 128c2ecf20Sopenharmony_ci#include <xen/events.h> 138c2ecf20Sopenharmony_ci#include <xen/grant_table.h> 148c2ecf20Sopenharmony_ci#include <xen/xen.h> 158c2ecf20Sopenharmony_ci#include <xen/xenbus.h> 168c2ecf20Sopenharmony_ci#include <xen/interface/io/pvcalls.h> 178c2ecf20Sopenharmony_ci 188c2ecf20Sopenharmony_ci#include "pvcalls-front.h" 198c2ecf20Sopenharmony_ci 208c2ecf20Sopenharmony_ci#define PVCALLS_INVALID_ID UINT_MAX 218c2ecf20Sopenharmony_ci#define PVCALLS_RING_ORDER XENBUS_MAX_RING_GRANT_ORDER 228c2ecf20Sopenharmony_ci#define PVCALLS_NR_RSP_PER_RING __CONST_RING_SIZE(xen_pvcalls, XEN_PAGE_SIZE) 238c2ecf20Sopenharmony_ci#define PVCALLS_FRONT_MAX_SPIN 5000 248c2ecf20Sopenharmony_ci 258c2ecf20Sopenharmony_cistatic struct proto pvcalls_proto = { 268c2ecf20Sopenharmony_ci .name = "PVCalls", 278c2ecf20Sopenharmony_ci .owner = THIS_MODULE, 288c2ecf20Sopenharmony_ci .obj_size = sizeof(struct sock), 298c2ecf20Sopenharmony_ci}; 308c2ecf20Sopenharmony_ci 318c2ecf20Sopenharmony_cistruct pvcalls_bedata { 328c2ecf20Sopenharmony_ci struct xen_pvcalls_front_ring ring; 338c2ecf20Sopenharmony_ci grant_ref_t ref; 348c2ecf20Sopenharmony_ci int irq; 358c2ecf20Sopenharmony_ci 368c2ecf20Sopenharmony_ci struct list_head socket_mappings; 378c2ecf20Sopenharmony_ci spinlock_t socket_lock; 388c2ecf20Sopenharmony_ci 398c2ecf20Sopenharmony_ci wait_queue_head_t inflight_req; 408c2ecf20Sopenharmony_ci struct xen_pvcalls_response rsp[PVCALLS_NR_RSP_PER_RING]; 418c2ecf20Sopenharmony_ci}; 428c2ecf20Sopenharmony_ci/* Only one front/back connection supported. */ 438c2ecf20Sopenharmony_cistatic struct xenbus_device *pvcalls_front_dev; 448c2ecf20Sopenharmony_cistatic atomic_t pvcalls_refcount; 458c2ecf20Sopenharmony_ci 468c2ecf20Sopenharmony_ci/* first increment refcount, then proceed */ 478c2ecf20Sopenharmony_ci#define pvcalls_enter() { \ 488c2ecf20Sopenharmony_ci atomic_inc(&pvcalls_refcount); \ 498c2ecf20Sopenharmony_ci} 508c2ecf20Sopenharmony_ci 518c2ecf20Sopenharmony_ci/* first complete other operations, then decrement refcount */ 528c2ecf20Sopenharmony_ci#define pvcalls_exit() { \ 538c2ecf20Sopenharmony_ci atomic_dec(&pvcalls_refcount); \ 548c2ecf20Sopenharmony_ci} 558c2ecf20Sopenharmony_ci 568c2ecf20Sopenharmony_cistruct sock_mapping { 578c2ecf20Sopenharmony_ci bool active_socket; 588c2ecf20Sopenharmony_ci struct list_head list; 598c2ecf20Sopenharmony_ci struct socket *sock; 608c2ecf20Sopenharmony_ci atomic_t refcount; 618c2ecf20Sopenharmony_ci union { 628c2ecf20Sopenharmony_ci struct { 638c2ecf20Sopenharmony_ci int irq; 648c2ecf20Sopenharmony_ci grant_ref_t ref; 658c2ecf20Sopenharmony_ci struct pvcalls_data_intf *ring; 668c2ecf20Sopenharmony_ci struct pvcalls_data data; 678c2ecf20Sopenharmony_ci struct mutex in_mutex; 688c2ecf20Sopenharmony_ci struct mutex out_mutex; 698c2ecf20Sopenharmony_ci 708c2ecf20Sopenharmony_ci wait_queue_head_t inflight_conn_req; 718c2ecf20Sopenharmony_ci } active; 728c2ecf20Sopenharmony_ci struct { 738c2ecf20Sopenharmony_ci /* 748c2ecf20Sopenharmony_ci * Socket status, needs to be 64-bit aligned due to the 758c2ecf20Sopenharmony_ci * test_and_* functions which have this requirement on arm64. 768c2ecf20Sopenharmony_ci */ 778c2ecf20Sopenharmony_ci#define PVCALLS_STATUS_UNINITALIZED 0 788c2ecf20Sopenharmony_ci#define PVCALLS_STATUS_BIND 1 798c2ecf20Sopenharmony_ci#define PVCALLS_STATUS_LISTEN 2 808c2ecf20Sopenharmony_ci uint8_t status __attribute__((aligned(8))); 818c2ecf20Sopenharmony_ci /* 828c2ecf20Sopenharmony_ci * Internal state-machine flags. 838c2ecf20Sopenharmony_ci * Only one accept operation can be inflight for a socket. 848c2ecf20Sopenharmony_ci * Only one poll operation can be inflight for a given socket. 858c2ecf20Sopenharmony_ci * flags needs to be 64-bit aligned due to the test_and_* 868c2ecf20Sopenharmony_ci * functions which have this requirement on arm64. 878c2ecf20Sopenharmony_ci */ 888c2ecf20Sopenharmony_ci#define PVCALLS_FLAG_ACCEPT_INFLIGHT 0 898c2ecf20Sopenharmony_ci#define PVCALLS_FLAG_POLL_INFLIGHT 1 908c2ecf20Sopenharmony_ci#define PVCALLS_FLAG_POLL_RET 2 918c2ecf20Sopenharmony_ci uint8_t flags __attribute__((aligned(8))); 928c2ecf20Sopenharmony_ci uint32_t inflight_req_id; 938c2ecf20Sopenharmony_ci struct sock_mapping *accept_map; 948c2ecf20Sopenharmony_ci wait_queue_head_t inflight_accept_req; 958c2ecf20Sopenharmony_ci } passive; 968c2ecf20Sopenharmony_ci }; 978c2ecf20Sopenharmony_ci}; 988c2ecf20Sopenharmony_ci 998c2ecf20Sopenharmony_cistatic inline struct sock_mapping *pvcalls_enter_sock(struct socket *sock) 1008c2ecf20Sopenharmony_ci{ 1018c2ecf20Sopenharmony_ci struct sock_mapping *map; 1028c2ecf20Sopenharmony_ci 1038c2ecf20Sopenharmony_ci if (!pvcalls_front_dev || 1048c2ecf20Sopenharmony_ci dev_get_drvdata(&pvcalls_front_dev->dev) == NULL) 1058c2ecf20Sopenharmony_ci return ERR_PTR(-ENOTCONN); 1068c2ecf20Sopenharmony_ci 1078c2ecf20Sopenharmony_ci map = (struct sock_mapping *)sock->sk->sk_send_head; 1088c2ecf20Sopenharmony_ci if (map == NULL) 1098c2ecf20Sopenharmony_ci return ERR_PTR(-ENOTSOCK); 1108c2ecf20Sopenharmony_ci 1118c2ecf20Sopenharmony_ci pvcalls_enter(); 1128c2ecf20Sopenharmony_ci atomic_inc(&map->refcount); 1138c2ecf20Sopenharmony_ci return map; 1148c2ecf20Sopenharmony_ci} 1158c2ecf20Sopenharmony_ci 1168c2ecf20Sopenharmony_cistatic inline void pvcalls_exit_sock(struct socket *sock) 1178c2ecf20Sopenharmony_ci{ 1188c2ecf20Sopenharmony_ci struct sock_mapping *map; 1198c2ecf20Sopenharmony_ci 1208c2ecf20Sopenharmony_ci map = (struct sock_mapping *)sock->sk->sk_send_head; 1218c2ecf20Sopenharmony_ci atomic_dec(&map->refcount); 1228c2ecf20Sopenharmony_ci pvcalls_exit(); 1238c2ecf20Sopenharmony_ci} 1248c2ecf20Sopenharmony_ci 1258c2ecf20Sopenharmony_cistatic inline int get_request(struct pvcalls_bedata *bedata, int *req_id) 1268c2ecf20Sopenharmony_ci{ 1278c2ecf20Sopenharmony_ci *req_id = bedata->ring.req_prod_pvt & (RING_SIZE(&bedata->ring) - 1); 1288c2ecf20Sopenharmony_ci if (RING_FULL(&bedata->ring) || 1298c2ecf20Sopenharmony_ci bedata->rsp[*req_id].req_id != PVCALLS_INVALID_ID) 1308c2ecf20Sopenharmony_ci return -EAGAIN; 1318c2ecf20Sopenharmony_ci return 0; 1328c2ecf20Sopenharmony_ci} 1338c2ecf20Sopenharmony_ci 1348c2ecf20Sopenharmony_cistatic bool pvcalls_front_write_todo(struct sock_mapping *map) 1358c2ecf20Sopenharmony_ci{ 1368c2ecf20Sopenharmony_ci struct pvcalls_data_intf *intf = map->active.ring; 1378c2ecf20Sopenharmony_ci RING_IDX cons, prod, size = XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER); 1388c2ecf20Sopenharmony_ci int32_t error; 1398c2ecf20Sopenharmony_ci 1408c2ecf20Sopenharmony_ci error = intf->out_error; 1418c2ecf20Sopenharmony_ci if (error == -ENOTCONN) 1428c2ecf20Sopenharmony_ci return false; 1438c2ecf20Sopenharmony_ci if (error != 0) 1448c2ecf20Sopenharmony_ci return true; 1458c2ecf20Sopenharmony_ci 1468c2ecf20Sopenharmony_ci cons = intf->out_cons; 1478c2ecf20Sopenharmony_ci prod = intf->out_prod; 1488c2ecf20Sopenharmony_ci return !!(size - pvcalls_queued(prod, cons, size)); 1498c2ecf20Sopenharmony_ci} 1508c2ecf20Sopenharmony_ci 1518c2ecf20Sopenharmony_cistatic bool pvcalls_front_read_todo(struct sock_mapping *map) 1528c2ecf20Sopenharmony_ci{ 1538c2ecf20Sopenharmony_ci struct pvcalls_data_intf *intf = map->active.ring; 1548c2ecf20Sopenharmony_ci RING_IDX cons, prod; 1558c2ecf20Sopenharmony_ci int32_t error; 1568c2ecf20Sopenharmony_ci 1578c2ecf20Sopenharmony_ci cons = intf->in_cons; 1588c2ecf20Sopenharmony_ci prod = intf->in_prod; 1598c2ecf20Sopenharmony_ci error = intf->in_error; 1608c2ecf20Sopenharmony_ci return (error != 0 || 1618c2ecf20Sopenharmony_ci pvcalls_queued(prod, cons, 1628c2ecf20Sopenharmony_ci XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER)) != 0); 1638c2ecf20Sopenharmony_ci} 1648c2ecf20Sopenharmony_ci 1658c2ecf20Sopenharmony_cistatic irqreturn_t pvcalls_front_event_handler(int irq, void *dev_id) 1668c2ecf20Sopenharmony_ci{ 1678c2ecf20Sopenharmony_ci struct xenbus_device *dev = dev_id; 1688c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 1698c2ecf20Sopenharmony_ci struct xen_pvcalls_response *rsp; 1708c2ecf20Sopenharmony_ci uint8_t *src, *dst; 1718c2ecf20Sopenharmony_ci int req_id = 0, more = 0, done = 0; 1728c2ecf20Sopenharmony_ci 1738c2ecf20Sopenharmony_ci if (dev == NULL) 1748c2ecf20Sopenharmony_ci return IRQ_HANDLED; 1758c2ecf20Sopenharmony_ci 1768c2ecf20Sopenharmony_ci pvcalls_enter(); 1778c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&dev->dev); 1788c2ecf20Sopenharmony_ci if (bedata == NULL) { 1798c2ecf20Sopenharmony_ci pvcalls_exit(); 1808c2ecf20Sopenharmony_ci return IRQ_HANDLED; 1818c2ecf20Sopenharmony_ci } 1828c2ecf20Sopenharmony_ci 1838c2ecf20Sopenharmony_ciagain: 1848c2ecf20Sopenharmony_ci while (RING_HAS_UNCONSUMED_RESPONSES(&bedata->ring)) { 1858c2ecf20Sopenharmony_ci rsp = RING_GET_RESPONSE(&bedata->ring, bedata->ring.rsp_cons); 1868c2ecf20Sopenharmony_ci 1878c2ecf20Sopenharmony_ci req_id = rsp->req_id; 1888c2ecf20Sopenharmony_ci if (rsp->cmd == PVCALLS_POLL) { 1898c2ecf20Sopenharmony_ci struct sock_mapping *map = (struct sock_mapping *)(uintptr_t) 1908c2ecf20Sopenharmony_ci rsp->u.poll.id; 1918c2ecf20Sopenharmony_ci 1928c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_POLL_INFLIGHT, 1938c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 1948c2ecf20Sopenharmony_ci /* 1958c2ecf20Sopenharmony_ci * clear INFLIGHT, then set RET. It pairs with 1968c2ecf20Sopenharmony_ci * the checks at the beginning of 1978c2ecf20Sopenharmony_ci * pvcalls_front_poll_passive. 1988c2ecf20Sopenharmony_ci */ 1998c2ecf20Sopenharmony_ci smp_wmb(); 2008c2ecf20Sopenharmony_ci set_bit(PVCALLS_FLAG_POLL_RET, 2018c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 2028c2ecf20Sopenharmony_ci } else { 2038c2ecf20Sopenharmony_ci dst = (uint8_t *)&bedata->rsp[req_id] + 2048c2ecf20Sopenharmony_ci sizeof(rsp->req_id); 2058c2ecf20Sopenharmony_ci src = (uint8_t *)rsp + sizeof(rsp->req_id); 2068c2ecf20Sopenharmony_ci memcpy(dst, src, sizeof(*rsp) - sizeof(rsp->req_id)); 2078c2ecf20Sopenharmony_ci /* 2088c2ecf20Sopenharmony_ci * First copy the rest of the data, then req_id. It is 2098c2ecf20Sopenharmony_ci * paired with the barrier when accessing bedata->rsp. 2108c2ecf20Sopenharmony_ci */ 2118c2ecf20Sopenharmony_ci smp_wmb(); 2128c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = req_id; 2138c2ecf20Sopenharmony_ci } 2148c2ecf20Sopenharmony_ci 2158c2ecf20Sopenharmony_ci done = 1; 2168c2ecf20Sopenharmony_ci bedata->ring.rsp_cons++; 2178c2ecf20Sopenharmony_ci } 2188c2ecf20Sopenharmony_ci 2198c2ecf20Sopenharmony_ci RING_FINAL_CHECK_FOR_RESPONSES(&bedata->ring, more); 2208c2ecf20Sopenharmony_ci if (more) 2218c2ecf20Sopenharmony_ci goto again; 2228c2ecf20Sopenharmony_ci if (done) 2238c2ecf20Sopenharmony_ci wake_up(&bedata->inflight_req); 2248c2ecf20Sopenharmony_ci pvcalls_exit(); 2258c2ecf20Sopenharmony_ci return IRQ_HANDLED; 2268c2ecf20Sopenharmony_ci} 2278c2ecf20Sopenharmony_ci 2288c2ecf20Sopenharmony_cistatic void pvcalls_front_free_map(struct pvcalls_bedata *bedata, 2298c2ecf20Sopenharmony_ci struct sock_mapping *map) 2308c2ecf20Sopenharmony_ci{ 2318c2ecf20Sopenharmony_ci int i; 2328c2ecf20Sopenharmony_ci 2338c2ecf20Sopenharmony_ci unbind_from_irqhandler(map->active.irq, map); 2348c2ecf20Sopenharmony_ci 2358c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 2368c2ecf20Sopenharmony_ci if (!list_empty(&map->list)) 2378c2ecf20Sopenharmony_ci list_del_init(&map->list); 2388c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 2398c2ecf20Sopenharmony_ci 2408c2ecf20Sopenharmony_ci for (i = 0; i < (1 << PVCALLS_RING_ORDER); i++) 2418c2ecf20Sopenharmony_ci gnttab_end_foreign_access(map->active.ring->ref[i], 0, 0); 2428c2ecf20Sopenharmony_ci gnttab_end_foreign_access(map->active.ref, 0, 0); 2438c2ecf20Sopenharmony_ci free_page((unsigned long)map->active.ring); 2448c2ecf20Sopenharmony_ci 2458c2ecf20Sopenharmony_ci kfree(map); 2468c2ecf20Sopenharmony_ci} 2478c2ecf20Sopenharmony_ci 2488c2ecf20Sopenharmony_cistatic irqreturn_t pvcalls_front_conn_handler(int irq, void *sock_map) 2498c2ecf20Sopenharmony_ci{ 2508c2ecf20Sopenharmony_ci struct sock_mapping *map = sock_map; 2518c2ecf20Sopenharmony_ci 2528c2ecf20Sopenharmony_ci if (map == NULL) 2538c2ecf20Sopenharmony_ci return IRQ_HANDLED; 2548c2ecf20Sopenharmony_ci 2558c2ecf20Sopenharmony_ci wake_up_interruptible(&map->active.inflight_conn_req); 2568c2ecf20Sopenharmony_ci 2578c2ecf20Sopenharmony_ci return IRQ_HANDLED; 2588c2ecf20Sopenharmony_ci} 2598c2ecf20Sopenharmony_ci 2608c2ecf20Sopenharmony_ciint pvcalls_front_socket(struct socket *sock) 2618c2ecf20Sopenharmony_ci{ 2628c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 2638c2ecf20Sopenharmony_ci struct sock_mapping *map = NULL; 2648c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 2658c2ecf20Sopenharmony_ci int notify, req_id, ret; 2668c2ecf20Sopenharmony_ci 2678c2ecf20Sopenharmony_ci /* 2688c2ecf20Sopenharmony_ci * PVCalls only supports domain AF_INET, 2698c2ecf20Sopenharmony_ci * type SOCK_STREAM and protocol 0 sockets for now. 2708c2ecf20Sopenharmony_ci * 2718c2ecf20Sopenharmony_ci * Check socket type here, AF_INET and protocol checks are done 2728c2ecf20Sopenharmony_ci * by the caller. 2738c2ecf20Sopenharmony_ci */ 2748c2ecf20Sopenharmony_ci if (sock->type != SOCK_STREAM) 2758c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 2768c2ecf20Sopenharmony_ci 2778c2ecf20Sopenharmony_ci pvcalls_enter(); 2788c2ecf20Sopenharmony_ci if (!pvcalls_front_dev) { 2798c2ecf20Sopenharmony_ci pvcalls_exit(); 2808c2ecf20Sopenharmony_ci return -EACCES; 2818c2ecf20Sopenharmony_ci } 2828c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_ci map = kzalloc(sizeof(*map), GFP_KERNEL); 2858c2ecf20Sopenharmony_ci if (map == NULL) { 2868c2ecf20Sopenharmony_ci pvcalls_exit(); 2878c2ecf20Sopenharmony_ci return -ENOMEM; 2888c2ecf20Sopenharmony_ci } 2898c2ecf20Sopenharmony_ci 2908c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 2918c2ecf20Sopenharmony_ci 2928c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 2938c2ecf20Sopenharmony_ci if (ret < 0) { 2948c2ecf20Sopenharmony_ci kfree(map); 2958c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 2968c2ecf20Sopenharmony_ci pvcalls_exit(); 2978c2ecf20Sopenharmony_ci return ret; 2988c2ecf20Sopenharmony_ci } 2998c2ecf20Sopenharmony_ci 3008c2ecf20Sopenharmony_ci /* 3018c2ecf20Sopenharmony_ci * sock->sk->sk_send_head is not used for ip sockets: reuse the 3028c2ecf20Sopenharmony_ci * field to store a pointer to the struct sock_mapping 3038c2ecf20Sopenharmony_ci * corresponding to the socket. This way, we can easily get the 3048c2ecf20Sopenharmony_ci * struct sock_mapping from the struct socket. 3058c2ecf20Sopenharmony_ci */ 3068c2ecf20Sopenharmony_ci sock->sk->sk_send_head = (void *)map; 3078c2ecf20Sopenharmony_ci list_add_tail(&map->list, &bedata->socket_mappings); 3088c2ecf20Sopenharmony_ci 3098c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 3108c2ecf20Sopenharmony_ci req->req_id = req_id; 3118c2ecf20Sopenharmony_ci req->cmd = PVCALLS_SOCKET; 3128c2ecf20Sopenharmony_ci req->u.socket.id = (uintptr_t) map; 3138c2ecf20Sopenharmony_ci req->u.socket.domain = AF_INET; 3148c2ecf20Sopenharmony_ci req->u.socket.type = SOCK_STREAM; 3158c2ecf20Sopenharmony_ci req->u.socket.protocol = IPPROTO_IP; 3168c2ecf20Sopenharmony_ci 3178c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 3188c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 3198c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 3208c2ecf20Sopenharmony_ci if (notify) 3218c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 3228c2ecf20Sopenharmony_ci 3238c2ecf20Sopenharmony_ci wait_event(bedata->inflight_req, 3248c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id); 3258c2ecf20Sopenharmony_ci 3268c2ecf20Sopenharmony_ci /* read req_id, then the content */ 3278c2ecf20Sopenharmony_ci smp_rmb(); 3288c2ecf20Sopenharmony_ci ret = bedata->rsp[req_id].ret; 3298c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 3308c2ecf20Sopenharmony_ci 3318c2ecf20Sopenharmony_ci pvcalls_exit(); 3328c2ecf20Sopenharmony_ci return ret; 3338c2ecf20Sopenharmony_ci} 3348c2ecf20Sopenharmony_ci 3358c2ecf20Sopenharmony_cistatic void free_active_ring(struct sock_mapping *map) 3368c2ecf20Sopenharmony_ci{ 3378c2ecf20Sopenharmony_ci if (!map->active.ring) 3388c2ecf20Sopenharmony_ci return; 3398c2ecf20Sopenharmony_ci 3408c2ecf20Sopenharmony_ci free_pages_exact(map->active.data.in, 3418c2ecf20Sopenharmony_ci PAGE_SIZE << map->active.ring->ring_order); 3428c2ecf20Sopenharmony_ci free_page((unsigned long)map->active.ring); 3438c2ecf20Sopenharmony_ci} 3448c2ecf20Sopenharmony_ci 3458c2ecf20Sopenharmony_cistatic int alloc_active_ring(struct sock_mapping *map) 3468c2ecf20Sopenharmony_ci{ 3478c2ecf20Sopenharmony_ci void *bytes; 3488c2ecf20Sopenharmony_ci 3498c2ecf20Sopenharmony_ci map->active.ring = (struct pvcalls_data_intf *) 3508c2ecf20Sopenharmony_ci get_zeroed_page(GFP_KERNEL); 3518c2ecf20Sopenharmony_ci if (!map->active.ring) 3528c2ecf20Sopenharmony_ci goto out; 3538c2ecf20Sopenharmony_ci 3548c2ecf20Sopenharmony_ci map->active.ring->ring_order = PVCALLS_RING_ORDER; 3558c2ecf20Sopenharmony_ci bytes = alloc_pages_exact(PAGE_SIZE << PVCALLS_RING_ORDER, 3568c2ecf20Sopenharmony_ci GFP_KERNEL | __GFP_ZERO); 3578c2ecf20Sopenharmony_ci if (!bytes) 3588c2ecf20Sopenharmony_ci goto out; 3598c2ecf20Sopenharmony_ci 3608c2ecf20Sopenharmony_ci map->active.data.in = bytes; 3618c2ecf20Sopenharmony_ci map->active.data.out = bytes + 3628c2ecf20Sopenharmony_ci XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER); 3638c2ecf20Sopenharmony_ci 3648c2ecf20Sopenharmony_ci return 0; 3658c2ecf20Sopenharmony_ci 3668c2ecf20Sopenharmony_ciout: 3678c2ecf20Sopenharmony_ci free_active_ring(map); 3688c2ecf20Sopenharmony_ci return -ENOMEM; 3698c2ecf20Sopenharmony_ci} 3708c2ecf20Sopenharmony_ci 3718c2ecf20Sopenharmony_cistatic int create_active(struct sock_mapping *map, evtchn_port_t *evtchn) 3728c2ecf20Sopenharmony_ci{ 3738c2ecf20Sopenharmony_ci void *bytes; 3748c2ecf20Sopenharmony_ci int ret, irq = -1, i; 3758c2ecf20Sopenharmony_ci 3768c2ecf20Sopenharmony_ci *evtchn = 0; 3778c2ecf20Sopenharmony_ci init_waitqueue_head(&map->active.inflight_conn_req); 3788c2ecf20Sopenharmony_ci 3798c2ecf20Sopenharmony_ci bytes = map->active.data.in; 3808c2ecf20Sopenharmony_ci for (i = 0; i < (1 << PVCALLS_RING_ORDER); i++) 3818c2ecf20Sopenharmony_ci map->active.ring->ref[i] = gnttab_grant_foreign_access( 3828c2ecf20Sopenharmony_ci pvcalls_front_dev->otherend_id, 3838c2ecf20Sopenharmony_ci pfn_to_gfn(virt_to_pfn(bytes) + i), 0); 3848c2ecf20Sopenharmony_ci 3858c2ecf20Sopenharmony_ci map->active.ref = gnttab_grant_foreign_access( 3868c2ecf20Sopenharmony_ci pvcalls_front_dev->otherend_id, 3878c2ecf20Sopenharmony_ci pfn_to_gfn(virt_to_pfn((void *)map->active.ring)), 0); 3888c2ecf20Sopenharmony_ci 3898c2ecf20Sopenharmony_ci ret = xenbus_alloc_evtchn(pvcalls_front_dev, evtchn); 3908c2ecf20Sopenharmony_ci if (ret) 3918c2ecf20Sopenharmony_ci goto out_error; 3928c2ecf20Sopenharmony_ci irq = bind_evtchn_to_irqhandler(*evtchn, pvcalls_front_conn_handler, 3938c2ecf20Sopenharmony_ci 0, "pvcalls-frontend", map); 3948c2ecf20Sopenharmony_ci if (irq < 0) { 3958c2ecf20Sopenharmony_ci ret = irq; 3968c2ecf20Sopenharmony_ci goto out_error; 3978c2ecf20Sopenharmony_ci } 3988c2ecf20Sopenharmony_ci 3998c2ecf20Sopenharmony_ci map->active.irq = irq; 4008c2ecf20Sopenharmony_ci map->active_socket = true; 4018c2ecf20Sopenharmony_ci mutex_init(&map->active.in_mutex); 4028c2ecf20Sopenharmony_ci mutex_init(&map->active.out_mutex); 4038c2ecf20Sopenharmony_ci 4048c2ecf20Sopenharmony_ci return 0; 4058c2ecf20Sopenharmony_ci 4068c2ecf20Sopenharmony_ciout_error: 4078c2ecf20Sopenharmony_ci if (*evtchn > 0) 4088c2ecf20Sopenharmony_ci xenbus_free_evtchn(pvcalls_front_dev, *evtchn); 4098c2ecf20Sopenharmony_ci return ret; 4108c2ecf20Sopenharmony_ci} 4118c2ecf20Sopenharmony_ci 4128c2ecf20Sopenharmony_ciint pvcalls_front_connect(struct socket *sock, struct sockaddr *addr, 4138c2ecf20Sopenharmony_ci int addr_len, int flags) 4148c2ecf20Sopenharmony_ci{ 4158c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 4168c2ecf20Sopenharmony_ci struct sock_mapping *map = NULL; 4178c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 4188c2ecf20Sopenharmony_ci int notify, req_id, ret; 4198c2ecf20Sopenharmony_ci evtchn_port_t evtchn; 4208c2ecf20Sopenharmony_ci 4218c2ecf20Sopenharmony_ci if (addr->sa_family != AF_INET || sock->type != SOCK_STREAM) 4228c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 4238c2ecf20Sopenharmony_ci 4248c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 4258c2ecf20Sopenharmony_ci if (IS_ERR(map)) 4268c2ecf20Sopenharmony_ci return PTR_ERR(map); 4278c2ecf20Sopenharmony_ci 4288c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 4298c2ecf20Sopenharmony_ci ret = alloc_active_ring(map); 4308c2ecf20Sopenharmony_ci if (ret < 0) { 4318c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 4328c2ecf20Sopenharmony_ci return ret; 4338c2ecf20Sopenharmony_ci } 4348c2ecf20Sopenharmony_ci 4358c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 4368c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 4378c2ecf20Sopenharmony_ci if (ret < 0) { 4388c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 4398c2ecf20Sopenharmony_ci free_active_ring(map); 4408c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 4418c2ecf20Sopenharmony_ci return ret; 4428c2ecf20Sopenharmony_ci } 4438c2ecf20Sopenharmony_ci ret = create_active(map, &evtchn); 4448c2ecf20Sopenharmony_ci if (ret < 0) { 4458c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 4468c2ecf20Sopenharmony_ci free_active_ring(map); 4478c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 4488c2ecf20Sopenharmony_ci return ret; 4498c2ecf20Sopenharmony_ci } 4508c2ecf20Sopenharmony_ci 4518c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 4528c2ecf20Sopenharmony_ci req->req_id = req_id; 4538c2ecf20Sopenharmony_ci req->cmd = PVCALLS_CONNECT; 4548c2ecf20Sopenharmony_ci req->u.connect.id = (uintptr_t)map; 4558c2ecf20Sopenharmony_ci req->u.connect.len = addr_len; 4568c2ecf20Sopenharmony_ci req->u.connect.flags = flags; 4578c2ecf20Sopenharmony_ci req->u.connect.ref = map->active.ref; 4588c2ecf20Sopenharmony_ci req->u.connect.evtchn = evtchn; 4598c2ecf20Sopenharmony_ci memcpy(req->u.connect.addr, addr, sizeof(*addr)); 4608c2ecf20Sopenharmony_ci 4618c2ecf20Sopenharmony_ci map->sock = sock; 4628c2ecf20Sopenharmony_ci 4638c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 4648c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 4658c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 4668c2ecf20Sopenharmony_ci 4678c2ecf20Sopenharmony_ci if (notify) 4688c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 4698c2ecf20Sopenharmony_ci 4708c2ecf20Sopenharmony_ci wait_event(bedata->inflight_req, 4718c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id); 4728c2ecf20Sopenharmony_ci 4738c2ecf20Sopenharmony_ci /* read req_id, then the content */ 4748c2ecf20Sopenharmony_ci smp_rmb(); 4758c2ecf20Sopenharmony_ci ret = bedata->rsp[req_id].ret; 4768c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 4778c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 4788c2ecf20Sopenharmony_ci return ret; 4798c2ecf20Sopenharmony_ci} 4808c2ecf20Sopenharmony_ci 4818c2ecf20Sopenharmony_cistatic int __write_ring(struct pvcalls_data_intf *intf, 4828c2ecf20Sopenharmony_ci struct pvcalls_data *data, 4838c2ecf20Sopenharmony_ci struct iov_iter *msg_iter, 4848c2ecf20Sopenharmony_ci int len) 4858c2ecf20Sopenharmony_ci{ 4868c2ecf20Sopenharmony_ci RING_IDX cons, prod, size, masked_prod, masked_cons; 4878c2ecf20Sopenharmony_ci RING_IDX array_size = XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER); 4888c2ecf20Sopenharmony_ci int32_t error; 4898c2ecf20Sopenharmony_ci 4908c2ecf20Sopenharmony_ci error = intf->out_error; 4918c2ecf20Sopenharmony_ci if (error < 0) 4928c2ecf20Sopenharmony_ci return error; 4938c2ecf20Sopenharmony_ci cons = intf->out_cons; 4948c2ecf20Sopenharmony_ci prod = intf->out_prod; 4958c2ecf20Sopenharmony_ci /* read indexes before continuing */ 4968c2ecf20Sopenharmony_ci virt_mb(); 4978c2ecf20Sopenharmony_ci 4988c2ecf20Sopenharmony_ci size = pvcalls_queued(prod, cons, array_size); 4998c2ecf20Sopenharmony_ci if (size > array_size) 5008c2ecf20Sopenharmony_ci return -EINVAL; 5018c2ecf20Sopenharmony_ci if (size == array_size) 5028c2ecf20Sopenharmony_ci return 0; 5038c2ecf20Sopenharmony_ci if (len > array_size - size) 5048c2ecf20Sopenharmony_ci len = array_size - size; 5058c2ecf20Sopenharmony_ci 5068c2ecf20Sopenharmony_ci masked_prod = pvcalls_mask(prod, array_size); 5078c2ecf20Sopenharmony_ci masked_cons = pvcalls_mask(cons, array_size); 5088c2ecf20Sopenharmony_ci 5098c2ecf20Sopenharmony_ci if (masked_prod < masked_cons) { 5108c2ecf20Sopenharmony_ci len = copy_from_iter(data->out + masked_prod, len, msg_iter); 5118c2ecf20Sopenharmony_ci } else { 5128c2ecf20Sopenharmony_ci if (len > array_size - masked_prod) { 5138c2ecf20Sopenharmony_ci int ret = copy_from_iter(data->out + masked_prod, 5148c2ecf20Sopenharmony_ci array_size - masked_prod, msg_iter); 5158c2ecf20Sopenharmony_ci if (ret != array_size - masked_prod) { 5168c2ecf20Sopenharmony_ci len = ret; 5178c2ecf20Sopenharmony_ci goto out; 5188c2ecf20Sopenharmony_ci } 5198c2ecf20Sopenharmony_ci len = ret + copy_from_iter(data->out, len - ret, msg_iter); 5208c2ecf20Sopenharmony_ci } else { 5218c2ecf20Sopenharmony_ci len = copy_from_iter(data->out + masked_prod, len, msg_iter); 5228c2ecf20Sopenharmony_ci } 5238c2ecf20Sopenharmony_ci } 5248c2ecf20Sopenharmony_ciout: 5258c2ecf20Sopenharmony_ci /* write to ring before updating pointer */ 5268c2ecf20Sopenharmony_ci virt_wmb(); 5278c2ecf20Sopenharmony_ci intf->out_prod += len; 5288c2ecf20Sopenharmony_ci 5298c2ecf20Sopenharmony_ci return len; 5308c2ecf20Sopenharmony_ci} 5318c2ecf20Sopenharmony_ci 5328c2ecf20Sopenharmony_ciint pvcalls_front_sendmsg(struct socket *sock, struct msghdr *msg, 5338c2ecf20Sopenharmony_ci size_t len) 5348c2ecf20Sopenharmony_ci{ 5358c2ecf20Sopenharmony_ci struct sock_mapping *map; 5368c2ecf20Sopenharmony_ci int sent, tot_sent = 0; 5378c2ecf20Sopenharmony_ci int count = 0, flags; 5388c2ecf20Sopenharmony_ci 5398c2ecf20Sopenharmony_ci flags = msg->msg_flags; 5408c2ecf20Sopenharmony_ci if (flags & (MSG_CONFIRM|MSG_DONTROUTE|MSG_EOR|MSG_OOB)) 5418c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 5428c2ecf20Sopenharmony_ci 5438c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 5448c2ecf20Sopenharmony_ci if (IS_ERR(map)) 5458c2ecf20Sopenharmony_ci return PTR_ERR(map); 5468c2ecf20Sopenharmony_ci 5478c2ecf20Sopenharmony_ci mutex_lock(&map->active.out_mutex); 5488c2ecf20Sopenharmony_ci if ((flags & MSG_DONTWAIT) && !pvcalls_front_write_todo(map)) { 5498c2ecf20Sopenharmony_ci mutex_unlock(&map->active.out_mutex); 5508c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 5518c2ecf20Sopenharmony_ci return -EAGAIN; 5528c2ecf20Sopenharmony_ci } 5538c2ecf20Sopenharmony_ci if (len > INT_MAX) 5548c2ecf20Sopenharmony_ci len = INT_MAX; 5558c2ecf20Sopenharmony_ci 5568c2ecf20Sopenharmony_ciagain: 5578c2ecf20Sopenharmony_ci count++; 5588c2ecf20Sopenharmony_ci sent = __write_ring(map->active.ring, 5598c2ecf20Sopenharmony_ci &map->active.data, &msg->msg_iter, 5608c2ecf20Sopenharmony_ci len); 5618c2ecf20Sopenharmony_ci if (sent > 0) { 5628c2ecf20Sopenharmony_ci len -= sent; 5638c2ecf20Sopenharmony_ci tot_sent += sent; 5648c2ecf20Sopenharmony_ci notify_remote_via_irq(map->active.irq); 5658c2ecf20Sopenharmony_ci } 5668c2ecf20Sopenharmony_ci if (sent >= 0 && len > 0 && count < PVCALLS_FRONT_MAX_SPIN) 5678c2ecf20Sopenharmony_ci goto again; 5688c2ecf20Sopenharmony_ci if (sent < 0) 5698c2ecf20Sopenharmony_ci tot_sent = sent; 5708c2ecf20Sopenharmony_ci 5718c2ecf20Sopenharmony_ci mutex_unlock(&map->active.out_mutex); 5728c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 5738c2ecf20Sopenharmony_ci return tot_sent; 5748c2ecf20Sopenharmony_ci} 5758c2ecf20Sopenharmony_ci 5768c2ecf20Sopenharmony_cistatic int __read_ring(struct pvcalls_data_intf *intf, 5778c2ecf20Sopenharmony_ci struct pvcalls_data *data, 5788c2ecf20Sopenharmony_ci struct iov_iter *msg_iter, 5798c2ecf20Sopenharmony_ci size_t len, int flags) 5808c2ecf20Sopenharmony_ci{ 5818c2ecf20Sopenharmony_ci RING_IDX cons, prod, size, masked_prod, masked_cons; 5828c2ecf20Sopenharmony_ci RING_IDX array_size = XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER); 5838c2ecf20Sopenharmony_ci int32_t error; 5848c2ecf20Sopenharmony_ci 5858c2ecf20Sopenharmony_ci cons = intf->in_cons; 5868c2ecf20Sopenharmony_ci prod = intf->in_prod; 5878c2ecf20Sopenharmony_ci error = intf->in_error; 5888c2ecf20Sopenharmony_ci /* get pointers before reading from the ring */ 5898c2ecf20Sopenharmony_ci virt_rmb(); 5908c2ecf20Sopenharmony_ci 5918c2ecf20Sopenharmony_ci size = pvcalls_queued(prod, cons, array_size); 5928c2ecf20Sopenharmony_ci masked_prod = pvcalls_mask(prod, array_size); 5938c2ecf20Sopenharmony_ci masked_cons = pvcalls_mask(cons, array_size); 5948c2ecf20Sopenharmony_ci 5958c2ecf20Sopenharmony_ci if (size == 0) 5968c2ecf20Sopenharmony_ci return error ?: size; 5978c2ecf20Sopenharmony_ci 5988c2ecf20Sopenharmony_ci if (len > size) 5998c2ecf20Sopenharmony_ci len = size; 6008c2ecf20Sopenharmony_ci 6018c2ecf20Sopenharmony_ci if (masked_prod > masked_cons) { 6028c2ecf20Sopenharmony_ci len = copy_to_iter(data->in + masked_cons, len, msg_iter); 6038c2ecf20Sopenharmony_ci } else { 6048c2ecf20Sopenharmony_ci if (len > (array_size - masked_cons)) { 6058c2ecf20Sopenharmony_ci int ret = copy_to_iter(data->in + masked_cons, 6068c2ecf20Sopenharmony_ci array_size - masked_cons, msg_iter); 6078c2ecf20Sopenharmony_ci if (ret != array_size - masked_cons) { 6088c2ecf20Sopenharmony_ci len = ret; 6098c2ecf20Sopenharmony_ci goto out; 6108c2ecf20Sopenharmony_ci } 6118c2ecf20Sopenharmony_ci len = ret + copy_to_iter(data->in, len - ret, msg_iter); 6128c2ecf20Sopenharmony_ci } else { 6138c2ecf20Sopenharmony_ci len = copy_to_iter(data->in + masked_cons, len, msg_iter); 6148c2ecf20Sopenharmony_ci } 6158c2ecf20Sopenharmony_ci } 6168c2ecf20Sopenharmony_ciout: 6178c2ecf20Sopenharmony_ci /* read data from the ring before increasing the index */ 6188c2ecf20Sopenharmony_ci virt_mb(); 6198c2ecf20Sopenharmony_ci if (!(flags & MSG_PEEK)) 6208c2ecf20Sopenharmony_ci intf->in_cons += len; 6218c2ecf20Sopenharmony_ci 6228c2ecf20Sopenharmony_ci return len; 6238c2ecf20Sopenharmony_ci} 6248c2ecf20Sopenharmony_ci 6258c2ecf20Sopenharmony_ciint pvcalls_front_recvmsg(struct socket *sock, struct msghdr *msg, size_t len, 6268c2ecf20Sopenharmony_ci int flags) 6278c2ecf20Sopenharmony_ci{ 6288c2ecf20Sopenharmony_ci int ret; 6298c2ecf20Sopenharmony_ci struct sock_mapping *map; 6308c2ecf20Sopenharmony_ci 6318c2ecf20Sopenharmony_ci if (flags & (MSG_CMSG_CLOEXEC|MSG_ERRQUEUE|MSG_OOB|MSG_TRUNC)) 6328c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 6338c2ecf20Sopenharmony_ci 6348c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 6358c2ecf20Sopenharmony_ci if (IS_ERR(map)) 6368c2ecf20Sopenharmony_ci return PTR_ERR(map); 6378c2ecf20Sopenharmony_ci 6388c2ecf20Sopenharmony_ci mutex_lock(&map->active.in_mutex); 6398c2ecf20Sopenharmony_ci if (len > XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER)) 6408c2ecf20Sopenharmony_ci len = XEN_FLEX_RING_SIZE(PVCALLS_RING_ORDER); 6418c2ecf20Sopenharmony_ci 6428c2ecf20Sopenharmony_ci while (!(flags & MSG_DONTWAIT) && !pvcalls_front_read_todo(map)) { 6438c2ecf20Sopenharmony_ci wait_event_interruptible(map->active.inflight_conn_req, 6448c2ecf20Sopenharmony_ci pvcalls_front_read_todo(map)); 6458c2ecf20Sopenharmony_ci } 6468c2ecf20Sopenharmony_ci ret = __read_ring(map->active.ring, &map->active.data, 6478c2ecf20Sopenharmony_ci &msg->msg_iter, len, flags); 6488c2ecf20Sopenharmony_ci 6498c2ecf20Sopenharmony_ci if (ret > 0) 6508c2ecf20Sopenharmony_ci notify_remote_via_irq(map->active.irq); 6518c2ecf20Sopenharmony_ci if (ret == 0) 6528c2ecf20Sopenharmony_ci ret = (flags & MSG_DONTWAIT) ? -EAGAIN : 0; 6538c2ecf20Sopenharmony_ci if (ret == -ENOTCONN) 6548c2ecf20Sopenharmony_ci ret = 0; 6558c2ecf20Sopenharmony_ci 6568c2ecf20Sopenharmony_ci mutex_unlock(&map->active.in_mutex); 6578c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 6588c2ecf20Sopenharmony_ci return ret; 6598c2ecf20Sopenharmony_ci} 6608c2ecf20Sopenharmony_ci 6618c2ecf20Sopenharmony_ciint pvcalls_front_bind(struct socket *sock, struct sockaddr *addr, int addr_len) 6628c2ecf20Sopenharmony_ci{ 6638c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 6648c2ecf20Sopenharmony_ci struct sock_mapping *map = NULL; 6658c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 6668c2ecf20Sopenharmony_ci int notify, req_id, ret; 6678c2ecf20Sopenharmony_ci 6688c2ecf20Sopenharmony_ci if (addr->sa_family != AF_INET || sock->type != SOCK_STREAM) 6698c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 6708c2ecf20Sopenharmony_ci 6718c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 6728c2ecf20Sopenharmony_ci if (IS_ERR(map)) 6738c2ecf20Sopenharmony_ci return PTR_ERR(map); 6748c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 6758c2ecf20Sopenharmony_ci 6768c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 6778c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 6788c2ecf20Sopenharmony_ci if (ret < 0) { 6798c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 6808c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 6818c2ecf20Sopenharmony_ci return ret; 6828c2ecf20Sopenharmony_ci } 6838c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 6848c2ecf20Sopenharmony_ci req->req_id = req_id; 6858c2ecf20Sopenharmony_ci map->sock = sock; 6868c2ecf20Sopenharmony_ci req->cmd = PVCALLS_BIND; 6878c2ecf20Sopenharmony_ci req->u.bind.id = (uintptr_t)map; 6888c2ecf20Sopenharmony_ci memcpy(req->u.bind.addr, addr, sizeof(*addr)); 6898c2ecf20Sopenharmony_ci req->u.bind.len = addr_len; 6908c2ecf20Sopenharmony_ci 6918c2ecf20Sopenharmony_ci init_waitqueue_head(&map->passive.inflight_accept_req); 6928c2ecf20Sopenharmony_ci 6938c2ecf20Sopenharmony_ci map->active_socket = false; 6948c2ecf20Sopenharmony_ci 6958c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 6968c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 6978c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 6988c2ecf20Sopenharmony_ci if (notify) 6998c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 7008c2ecf20Sopenharmony_ci 7018c2ecf20Sopenharmony_ci wait_event(bedata->inflight_req, 7028c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id); 7038c2ecf20Sopenharmony_ci 7048c2ecf20Sopenharmony_ci /* read req_id, then the content */ 7058c2ecf20Sopenharmony_ci smp_rmb(); 7068c2ecf20Sopenharmony_ci ret = bedata->rsp[req_id].ret; 7078c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 7088c2ecf20Sopenharmony_ci 7098c2ecf20Sopenharmony_ci map->passive.status = PVCALLS_STATUS_BIND; 7108c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7118c2ecf20Sopenharmony_ci return 0; 7128c2ecf20Sopenharmony_ci} 7138c2ecf20Sopenharmony_ci 7148c2ecf20Sopenharmony_ciint pvcalls_front_listen(struct socket *sock, int backlog) 7158c2ecf20Sopenharmony_ci{ 7168c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 7178c2ecf20Sopenharmony_ci struct sock_mapping *map; 7188c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 7198c2ecf20Sopenharmony_ci int notify, req_id, ret; 7208c2ecf20Sopenharmony_ci 7218c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 7228c2ecf20Sopenharmony_ci if (IS_ERR(map)) 7238c2ecf20Sopenharmony_ci return PTR_ERR(map); 7248c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 7258c2ecf20Sopenharmony_ci 7268c2ecf20Sopenharmony_ci if (map->passive.status != PVCALLS_STATUS_BIND) { 7278c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7288c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 7298c2ecf20Sopenharmony_ci } 7308c2ecf20Sopenharmony_ci 7318c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 7328c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 7338c2ecf20Sopenharmony_ci if (ret < 0) { 7348c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 7358c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7368c2ecf20Sopenharmony_ci return ret; 7378c2ecf20Sopenharmony_ci } 7388c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 7398c2ecf20Sopenharmony_ci req->req_id = req_id; 7408c2ecf20Sopenharmony_ci req->cmd = PVCALLS_LISTEN; 7418c2ecf20Sopenharmony_ci req->u.listen.id = (uintptr_t) map; 7428c2ecf20Sopenharmony_ci req->u.listen.backlog = backlog; 7438c2ecf20Sopenharmony_ci 7448c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 7458c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 7468c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 7478c2ecf20Sopenharmony_ci if (notify) 7488c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 7498c2ecf20Sopenharmony_ci 7508c2ecf20Sopenharmony_ci wait_event(bedata->inflight_req, 7518c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id); 7528c2ecf20Sopenharmony_ci 7538c2ecf20Sopenharmony_ci /* read req_id, then the content */ 7548c2ecf20Sopenharmony_ci smp_rmb(); 7558c2ecf20Sopenharmony_ci ret = bedata->rsp[req_id].ret; 7568c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 7578c2ecf20Sopenharmony_ci 7588c2ecf20Sopenharmony_ci map->passive.status = PVCALLS_STATUS_LISTEN; 7598c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7608c2ecf20Sopenharmony_ci return ret; 7618c2ecf20Sopenharmony_ci} 7628c2ecf20Sopenharmony_ci 7638c2ecf20Sopenharmony_ciint pvcalls_front_accept(struct socket *sock, struct socket *newsock, int flags) 7648c2ecf20Sopenharmony_ci{ 7658c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 7668c2ecf20Sopenharmony_ci struct sock_mapping *map; 7678c2ecf20Sopenharmony_ci struct sock_mapping *map2 = NULL; 7688c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 7698c2ecf20Sopenharmony_ci int notify, req_id, ret, nonblock; 7708c2ecf20Sopenharmony_ci evtchn_port_t evtchn; 7718c2ecf20Sopenharmony_ci 7728c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 7738c2ecf20Sopenharmony_ci if (IS_ERR(map)) 7748c2ecf20Sopenharmony_ci return PTR_ERR(map); 7758c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 7768c2ecf20Sopenharmony_ci 7778c2ecf20Sopenharmony_ci if (map->passive.status != PVCALLS_STATUS_LISTEN) { 7788c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7798c2ecf20Sopenharmony_ci return -EINVAL; 7808c2ecf20Sopenharmony_ci } 7818c2ecf20Sopenharmony_ci 7828c2ecf20Sopenharmony_ci nonblock = flags & SOCK_NONBLOCK; 7838c2ecf20Sopenharmony_ci /* 7848c2ecf20Sopenharmony_ci * Backend only supports 1 inflight accept request, will return 7858c2ecf20Sopenharmony_ci * errors for the others 7868c2ecf20Sopenharmony_ci */ 7878c2ecf20Sopenharmony_ci if (test_and_set_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 7888c2ecf20Sopenharmony_ci (void *)&map->passive.flags)) { 7898c2ecf20Sopenharmony_ci req_id = READ_ONCE(map->passive.inflight_req_id); 7908c2ecf20Sopenharmony_ci if (req_id != PVCALLS_INVALID_ID && 7918c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id) { 7928c2ecf20Sopenharmony_ci map2 = map->passive.accept_map; 7938c2ecf20Sopenharmony_ci goto received; 7948c2ecf20Sopenharmony_ci } 7958c2ecf20Sopenharmony_ci if (nonblock) { 7968c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 7978c2ecf20Sopenharmony_ci return -EAGAIN; 7988c2ecf20Sopenharmony_ci } 7998c2ecf20Sopenharmony_ci if (wait_event_interruptible(map->passive.inflight_accept_req, 8008c2ecf20Sopenharmony_ci !test_and_set_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8018c2ecf20Sopenharmony_ci (void *)&map->passive.flags))) { 8028c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8038c2ecf20Sopenharmony_ci return -EINTR; 8048c2ecf20Sopenharmony_ci } 8058c2ecf20Sopenharmony_ci } 8068c2ecf20Sopenharmony_ci 8078c2ecf20Sopenharmony_ci map2 = kzalloc(sizeof(*map2), GFP_KERNEL); 8088c2ecf20Sopenharmony_ci if (map2 == NULL) { 8098c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8108c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 8118c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8128c2ecf20Sopenharmony_ci return -ENOMEM; 8138c2ecf20Sopenharmony_ci } 8148c2ecf20Sopenharmony_ci ret = alloc_active_ring(map2); 8158c2ecf20Sopenharmony_ci if (ret < 0) { 8168c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8178c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 8188c2ecf20Sopenharmony_ci kfree(map2); 8198c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8208c2ecf20Sopenharmony_ci return ret; 8218c2ecf20Sopenharmony_ci } 8228c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 8238c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 8248c2ecf20Sopenharmony_ci if (ret < 0) { 8258c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8268c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 8278c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 8288c2ecf20Sopenharmony_ci free_active_ring(map2); 8298c2ecf20Sopenharmony_ci kfree(map2); 8308c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8318c2ecf20Sopenharmony_ci return ret; 8328c2ecf20Sopenharmony_ci } 8338c2ecf20Sopenharmony_ci 8348c2ecf20Sopenharmony_ci ret = create_active(map2, &evtchn); 8358c2ecf20Sopenharmony_ci if (ret < 0) { 8368c2ecf20Sopenharmony_ci free_active_ring(map2); 8378c2ecf20Sopenharmony_ci kfree(map2); 8388c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8398c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 8408c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 8418c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8428c2ecf20Sopenharmony_ci return ret; 8438c2ecf20Sopenharmony_ci } 8448c2ecf20Sopenharmony_ci list_add_tail(&map2->list, &bedata->socket_mappings); 8458c2ecf20Sopenharmony_ci 8468c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 8478c2ecf20Sopenharmony_ci req->req_id = req_id; 8488c2ecf20Sopenharmony_ci req->cmd = PVCALLS_ACCEPT; 8498c2ecf20Sopenharmony_ci req->u.accept.id = (uintptr_t) map; 8508c2ecf20Sopenharmony_ci req->u.accept.ref = map2->active.ref; 8518c2ecf20Sopenharmony_ci req->u.accept.id_new = (uintptr_t) map2; 8528c2ecf20Sopenharmony_ci req->u.accept.evtchn = evtchn; 8538c2ecf20Sopenharmony_ci map->passive.accept_map = map2; 8548c2ecf20Sopenharmony_ci 8558c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 8568c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 8578c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 8588c2ecf20Sopenharmony_ci if (notify) 8598c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 8608c2ecf20Sopenharmony_ci /* We could check if we have received a response before returning. */ 8618c2ecf20Sopenharmony_ci if (nonblock) { 8628c2ecf20Sopenharmony_ci WRITE_ONCE(map->passive.inflight_req_id, req_id); 8638c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8648c2ecf20Sopenharmony_ci return -EAGAIN; 8658c2ecf20Sopenharmony_ci } 8668c2ecf20Sopenharmony_ci 8678c2ecf20Sopenharmony_ci if (wait_event_interruptible(bedata->inflight_req, 8688c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id)) { 8698c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8708c2ecf20Sopenharmony_ci return -EINTR; 8718c2ecf20Sopenharmony_ci } 8728c2ecf20Sopenharmony_ci /* read req_id, then the content */ 8738c2ecf20Sopenharmony_ci smp_rmb(); 8748c2ecf20Sopenharmony_ci 8758c2ecf20Sopenharmony_cireceived: 8768c2ecf20Sopenharmony_ci map2->sock = newsock; 8778c2ecf20Sopenharmony_ci newsock->sk = sk_alloc(sock_net(sock->sk), PF_INET, GFP_KERNEL, &pvcalls_proto, false); 8788c2ecf20Sopenharmony_ci if (!newsock->sk) { 8798c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 8808c2ecf20Sopenharmony_ci map->passive.inflight_req_id = PVCALLS_INVALID_ID; 8818c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 8828c2ecf20Sopenharmony_ci (void *)&map->passive.flags); 8838c2ecf20Sopenharmony_ci pvcalls_front_free_map(bedata, map2); 8848c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8858c2ecf20Sopenharmony_ci return -ENOMEM; 8868c2ecf20Sopenharmony_ci } 8878c2ecf20Sopenharmony_ci newsock->sk->sk_send_head = (void *)map2; 8888c2ecf20Sopenharmony_ci 8898c2ecf20Sopenharmony_ci ret = bedata->rsp[req_id].ret; 8908c2ecf20Sopenharmony_ci bedata->rsp[req_id].req_id = PVCALLS_INVALID_ID; 8918c2ecf20Sopenharmony_ci map->passive.inflight_req_id = PVCALLS_INVALID_ID; 8928c2ecf20Sopenharmony_ci 8938c2ecf20Sopenharmony_ci clear_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, (void *)&map->passive.flags); 8948c2ecf20Sopenharmony_ci wake_up(&map->passive.inflight_accept_req); 8958c2ecf20Sopenharmony_ci 8968c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 8978c2ecf20Sopenharmony_ci return ret; 8988c2ecf20Sopenharmony_ci} 8998c2ecf20Sopenharmony_ci 9008c2ecf20Sopenharmony_cistatic __poll_t pvcalls_front_poll_passive(struct file *file, 9018c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata, 9028c2ecf20Sopenharmony_ci struct sock_mapping *map, 9038c2ecf20Sopenharmony_ci poll_table *wait) 9048c2ecf20Sopenharmony_ci{ 9058c2ecf20Sopenharmony_ci int notify, req_id, ret; 9068c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci if (test_bit(PVCALLS_FLAG_ACCEPT_INFLIGHT, 9098c2ecf20Sopenharmony_ci (void *)&map->passive.flags)) { 9108c2ecf20Sopenharmony_ci uint32_t req_id = READ_ONCE(map->passive.inflight_req_id); 9118c2ecf20Sopenharmony_ci 9128c2ecf20Sopenharmony_ci if (req_id != PVCALLS_INVALID_ID && 9138c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id) 9148c2ecf20Sopenharmony_ci return EPOLLIN | EPOLLRDNORM; 9158c2ecf20Sopenharmony_ci 9168c2ecf20Sopenharmony_ci poll_wait(file, &map->passive.inflight_accept_req, wait); 9178c2ecf20Sopenharmony_ci return 0; 9188c2ecf20Sopenharmony_ci } 9198c2ecf20Sopenharmony_ci 9208c2ecf20Sopenharmony_ci if (test_and_clear_bit(PVCALLS_FLAG_POLL_RET, 9218c2ecf20Sopenharmony_ci (void *)&map->passive.flags)) 9228c2ecf20Sopenharmony_ci return EPOLLIN | EPOLLRDNORM; 9238c2ecf20Sopenharmony_ci 9248c2ecf20Sopenharmony_ci /* 9258c2ecf20Sopenharmony_ci * First check RET, then INFLIGHT. No barriers necessary to 9268c2ecf20Sopenharmony_ci * ensure execution ordering because of the conditional 9278c2ecf20Sopenharmony_ci * instructions creating control dependencies. 9288c2ecf20Sopenharmony_ci */ 9298c2ecf20Sopenharmony_ci 9308c2ecf20Sopenharmony_ci if (test_and_set_bit(PVCALLS_FLAG_POLL_INFLIGHT, 9318c2ecf20Sopenharmony_ci (void *)&map->passive.flags)) { 9328c2ecf20Sopenharmony_ci poll_wait(file, &bedata->inflight_req, wait); 9338c2ecf20Sopenharmony_ci return 0; 9348c2ecf20Sopenharmony_ci } 9358c2ecf20Sopenharmony_ci 9368c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 9378c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 9388c2ecf20Sopenharmony_ci if (ret < 0) { 9398c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 9408c2ecf20Sopenharmony_ci return ret; 9418c2ecf20Sopenharmony_ci } 9428c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 9438c2ecf20Sopenharmony_ci req->req_id = req_id; 9448c2ecf20Sopenharmony_ci req->cmd = PVCALLS_POLL; 9458c2ecf20Sopenharmony_ci req->u.poll.id = (uintptr_t) map; 9468c2ecf20Sopenharmony_ci 9478c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 9488c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 9498c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 9508c2ecf20Sopenharmony_ci if (notify) 9518c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 9528c2ecf20Sopenharmony_ci 9538c2ecf20Sopenharmony_ci poll_wait(file, &bedata->inflight_req, wait); 9548c2ecf20Sopenharmony_ci return 0; 9558c2ecf20Sopenharmony_ci} 9568c2ecf20Sopenharmony_ci 9578c2ecf20Sopenharmony_cistatic __poll_t pvcalls_front_poll_active(struct file *file, 9588c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata, 9598c2ecf20Sopenharmony_ci struct sock_mapping *map, 9608c2ecf20Sopenharmony_ci poll_table *wait) 9618c2ecf20Sopenharmony_ci{ 9628c2ecf20Sopenharmony_ci __poll_t mask = 0; 9638c2ecf20Sopenharmony_ci int32_t in_error, out_error; 9648c2ecf20Sopenharmony_ci struct pvcalls_data_intf *intf = map->active.ring; 9658c2ecf20Sopenharmony_ci 9668c2ecf20Sopenharmony_ci out_error = intf->out_error; 9678c2ecf20Sopenharmony_ci in_error = intf->in_error; 9688c2ecf20Sopenharmony_ci 9698c2ecf20Sopenharmony_ci poll_wait(file, &map->active.inflight_conn_req, wait); 9708c2ecf20Sopenharmony_ci if (pvcalls_front_write_todo(map)) 9718c2ecf20Sopenharmony_ci mask |= EPOLLOUT | EPOLLWRNORM; 9728c2ecf20Sopenharmony_ci if (pvcalls_front_read_todo(map)) 9738c2ecf20Sopenharmony_ci mask |= EPOLLIN | EPOLLRDNORM; 9748c2ecf20Sopenharmony_ci if (in_error != 0 || out_error != 0) 9758c2ecf20Sopenharmony_ci mask |= EPOLLERR; 9768c2ecf20Sopenharmony_ci 9778c2ecf20Sopenharmony_ci return mask; 9788c2ecf20Sopenharmony_ci} 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_ci__poll_t pvcalls_front_poll(struct file *file, struct socket *sock, 9818c2ecf20Sopenharmony_ci poll_table *wait) 9828c2ecf20Sopenharmony_ci{ 9838c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 9848c2ecf20Sopenharmony_ci struct sock_mapping *map; 9858c2ecf20Sopenharmony_ci __poll_t ret; 9868c2ecf20Sopenharmony_ci 9878c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 9888c2ecf20Sopenharmony_ci if (IS_ERR(map)) 9898c2ecf20Sopenharmony_ci return EPOLLNVAL; 9908c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 9918c2ecf20Sopenharmony_ci 9928c2ecf20Sopenharmony_ci if (map->active_socket) 9938c2ecf20Sopenharmony_ci ret = pvcalls_front_poll_active(file, bedata, map, wait); 9948c2ecf20Sopenharmony_ci else 9958c2ecf20Sopenharmony_ci ret = pvcalls_front_poll_passive(file, bedata, map, wait); 9968c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 9978c2ecf20Sopenharmony_ci return ret; 9988c2ecf20Sopenharmony_ci} 9998c2ecf20Sopenharmony_ci 10008c2ecf20Sopenharmony_ciint pvcalls_front_release(struct socket *sock) 10018c2ecf20Sopenharmony_ci{ 10028c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 10038c2ecf20Sopenharmony_ci struct sock_mapping *map; 10048c2ecf20Sopenharmony_ci int req_id, notify, ret; 10058c2ecf20Sopenharmony_ci struct xen_pvcalls_request *req; 10068c2ecf20Sopenharmony_ci 10078c2ecf20Sopenharmony_ci if (sock->sk == NULL) 10088c2ecf20Sopenharmony_ci return 0; 10098c2ecf20Sopenharmony_ci 10108c2ecf20Sopenharmony_ci map = pvcalls_enter_sock(sock); 10118c2ecf20Sopenharmony_ci if (IS_ERR(map)) { 10128c2ecf20Sopenharmony_ci if (PTR_ERR(map) == -ENOTCONN) 10138c2ecf20Sopenharmony_ci return -EIO; 10148c2ecf20Sopenharmony_ci else 10158c2ecf20Sopenharmony_ci return 0; 10168c2ecf20Sopenharmony_ci } 10178c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 10188c2ecf20Sopenharmony_ci 10198c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 10208c2ecf20Sopenharmony_ci ret = get_request(bedata, &req_id); 10218c2ecf20Sopenharmony_ci if (ret < 0) { 10228c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 10238c2ecf20Sopenharmony_ci pvcalls_exit_sock(sock); 10248c2ecf20Sopenharmony_ci return ret; 10258c2ecf20Sopenharmony_ci } 10268c2ecf20Sopenharmony_ci sock->sk->sk_send_head = NULL; 10278c2ecf20Sopenharmony_ci 10288c2ecf20Sopenharmony_ci req = RING_GET_REQUEST(&bedata->ring, req_id); 10298c2ecf20Sopenharmony_ci req->req_id = req_id; 10308c2ecf20Sopenharmony_ci req->cmd = PVCALLS_RELEASE; 10318c2ecf20Sopenharmony_ci req->u.release.id = (uintptr_t)map; 10328c2ecf20Sopenharmony_ci 10338c2ecf20Sopenharmony_ci bedata->ring.req_prod_pvt++; 10348c2ecf20Sopenharmony_ci RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&bedata->ring, notify); 10358c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 10368c2ecf20Sopenharmony_ci if (notify) 10378c2ecf20Sopenharmony_ci notify_remote_via_irq(bedata->irq); 10388c2ecf20Sopenharmony_ci 10398c2ecf20Sopenharmony_ci wait_event(bedata->inflight_req, 10408c2ecf20Sopenharmony_ci READ_ONCE(bedata->rsp[req_id].req_id) == req_id); 10418c2ecf20Sopenharmony_ci 10428c2ecf20Sopenharmony_ci if (map->active_socket) { 10438c2ecf20Sopenharmony_ci /* 10448c2ecf20Sopenharmony_ci * Set in_error and wake up inflight_conn_req to force 10458c2ecf20Sopenharmony_ci * recvmsg waiters to exit. 10468c2ecf20Sopenharmony_ci */ 10478c2ecf20Sopenharmony_ci map->active.ring->in_error = -EBADF; 10488c2ecf20Sopenharmony_ci wake_up_interruptible(&map->active.inflight_conn_req); 10498c2ecf20Sopenharmony_ci 10508c2ecf20Sopenharmony_ci /* 10518c2ecf20Sopenharmony_ci * We need to make sure that sendmsg/recvmsg on this socket have 10528c2ecf20Sopenharmony_ci * not started before we've cleared sk_send_head here. The 10538c2ecf20Sopenharmony_ci * easiest way to guarantee this is to see that no pvcalls 10548c2ecf20Sopenharmony_ci * (other than us) is in progress on this socket. 10558c2ecf20Sopenharmony_ci */ 10568c2ecf20Sopenharmony_ci while (atomic_read(&map->refcount) > 1) 10578c2ecf20Sopenharmony_ci cpu_relax(); 10588c2ecf20Sopenharmony_ci 10598c2ecf20Sopenharmony_ci pvcalls_front_free_map(bedata, map); 10608c2ecf20Sopenharmony_ci } else { 10618c2ecf20Sopenharmony_ci wake_up(&bedata->inflight_req); 10628c2ecf20Sopenharmony_ci wake_up(&map->passive.inflight_accept_req); 10638c2ecf20Sopenharmony_ci 10648c2ecf20Sopenharmony_ci while (atomic_read(&map->refcount) > 1) 10658c2ecf20Sopenharmony_ci cpu_relax(); 10668c2ecf20Sopenharmony_ci 10678c2ecf20Sopenharmony_ci spin_lock(&bedata->socket_lock); 10688c2ecf20Sopenharmony_ci list_del(&map->list); 10698c2ecf20Sopenharmony_ci spin_unlock(&bedata->socket_lock); 10708c2ecf20Sopenharmony_ci if (READ_ONCE(map->passive.inflight_req_id) != PVCALLS_INVALID_ID && 10718c2ecf20Sopenharmony_ci READ_ONCE(map->passive.inflight_req_id) != 0) { 10728c2ecf20Sopenharmony_ci pvcalls_front_free_map(bedata, 10738c2ecf20Sopenharmony_ci map->passive.accept_map); 10748c2ecf20Sopenharmony_ci } 10758c2ecf20Sopenharmony_ci kfree(map); 10768c2ecf20Sopenharmony_ci } 10778c2ecf20Sopenharmony_ci WRITE_ONCE(bedata->rsp[req_id].req_id, PVCALLS_INVALID_ID); 10788c2ecf20Sopenharmony_ci 10798c2ecf20Sopenharmony_ci pvcalls_exit(); 10808c2ecf20Sopenharmony_ci return 0; 10818c2ecf20Sopenharmony_ci} 10828c2ecf20Sopenharmony_ci 10838c2ecf20Sopenharmony_cistatic const struct xenbus_device_id pvcalls_front_ids[] = { 10848c2ecf20Sopenharmony_ci { "pvcalls" }, 10858c2ecf20Sopenharmony_ci { "" } 10868c2ecf20Sopenharmony_ci}; 10878c2ecf20Sopenharmony_ci 10888c2ecf20Sopenharmony_cistatic int pvcalls_front_remove(struct xenbus_device *dev) 10898c2ecf20Sopenharmony_ci{ 10908c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata; 10918c2ecf20Sopenharmony_ci struct sock_mapping *map = NULL, *n; 10928c2ecf20Sopenharmony_ci 10938c2ecf20Sopenharmony_ci bedata = dev_get_drvdata(&pvcalls_front_dev->dev); 10948c2ecf20Sopenharmony_ci dev_set_drvdata(&dev->dev, NULL); 10958c2ecf20Sopenharmony_ci pvcalls_front_dev = NULL; 10968c2ecf20Sopenharmony_ci if (bedata->irq >= 0) 10978c2ecf20Sopenharmony_ci unbind_from_irqhandler(bedata->irq, dev); 10988c2ecf20Sopenharmony_ci 10998c2ecf20Sopenharmony_ci list_for_each_entry_safe(map, n, &bedata->socket_mappings, list) { 11008c2ecf20Sopenharmony_ci map->sock->sk->sk_send_head = NULL; 11018c2ecf20Sopenharmony_ci if (map->active_socket) { 11028c2ecf20Sopenharmony_ci map->active.ring->in_error = -EBADF; 11038c2ecf20Sopenharmony_ci wake_up_interruptible(&map->active.inflight_conn_req); 11048c2ecf20Sopenharmony_ci } 11058c2ecf20Sopenharmony_ci } 11068c2ecf20Sopenharmony_ci 11078c2ecf20Sopenharmony_ci smp_mb(); 11088c2ecf20Sopenharmony_ci while (atomic_read(&pvcalls_refcount) > 0) 11098c2ecf20Sopenharmony_ci cpu_relax(); 11108c2ecf20Sopenharmony_ci list_for_each_entry_safe(map, n, &bedata->socket_mappings, list) { 11118c2ecf20Sopenharmony_ci if (map->active_socket) { 11128c2ecf20Sopenharmony_ci /* No need to lock, refcount is 0 */ 11138c2ecf20Sopenharmony_ci pvcalls_front_free_map(bedata, map); 11148c2ecf20Sopenharmony_ci } else { 11158c2ecf20Sopenharmony_ci list_del(&map->list); 11168c2ecf20Sopenharmony_ci kfree(map); 11178c2ecf20Sopenharmony_ci } 11188c2ecf20Sopenharmony_ci } 11198c2ecf20Sopenharmony_ci if (bedata->ref != -1) 11208c2ecf20Sopenharmony_ci gnttab_end_foreign_access(bedata->ref, 0, 0); 11218c2ecf20Sopenharmony_ci kfree(bedata->ring.sring); 11228c2ecf20Sopenharmony_ci kfree(bedata); 11238c2ecf20Sopenharmony_ci xenbus_switch_state(dev, XenbusStateClosed); 11248c2ecf20Sopenharmony_ci return 0; 11258c2ecf20Sopenharmony_ci} 11268c2ecf20Sopenharmony_ci 11278c2ecf20Sopenharmony_cistatic int pvcalls_front_probe(struct xenbus_device *dev, 11288c2ecf20Sopenharmony_ci const struct xenbus_device_id *id) 11298c2ecf20Sopenharmony_ci{ 11308c2ecf20Sopenharmony_ci int ret = -ENOMEM, i; 11318c2ecf20Sopenharmony_ci evtchn_port_t evtchn; 11328c2ecf20Sopenharmony_ci unsigned int max_page_order, function_calls, len; 11338c2ecf20Sopenharmony_ci char *versions; 11348c2ecf20Sopenharmony_ci grant_ref_t gref_head = 0; 11358c2ecf20Sopenharmony_ci struct xenbus_transaction xbt; 11368c2ecf20Sopenharmony_ci struct pvcalls_bedata *bedata = NULL; 11378c2ecf20Sopenharmony_ci struct xen_pvcalls_sring *sring; 11388c2ecf20Sopenharmony_ci 11398c2ecf20Sopenharmony_ci if (pvcalls_front_dev != NULL) { 11408c2ecf20Sopenharmony_ci dev_err(&dev->dev, "only one PV Calls connection supported\n"); 11418c2ecf20Sopenharmony_ci return -EINVAL; 11428c2ecf20Sopenharmony_ci } 11438c2ecf20Sopenharmony_ci 11448c2ecf20Sopenharmony_ci versions = xenbus_read(XBT_NIL, dev->otherend, "versions", &len); 11458c2ecf20Sopenharmony_ci if (IS_ERR(versions)) 11468c2ecf20Sopenharmony_ci return PTR_ERR(versions); 11478c2ecf20Sopenharmony_ci if (!len) 11488c2ecf20Sopenharmony_ci return -EINVAL; 11498c2ecf20Sopenharmony_ci if (strcmp(versions, "1")) { 11508c2ecf20Sopenharmony_ci kfree(versions); 11518c2ecf20Sopenharmony_ci return -EINVAL; 11528c2ecf20Sopenharmony_ci } 11538c2ecf20Sopenharmony_ci kfree(versions); 11548c2ecf20Sopenharmony_ci max_page_order = xenbus_read_unsigned(dev->otherend, 11558c2ecf20Sopenharmony_ci "max-page-order", 0); 11568c2ecf20Sopenharmony_ci if (max_page_order < PVCALLS_RING_ORDER) 11578c2ecf20Sopenharmony_ci return -ENODEV; 11588c2ecf20Sopenharmony_ci function_calls = xenbus_read_unsigned(dev->otherend, 11598c2ecf20Sopenharmony_ci "function-calls", 0); 11608c2ecf20Sopenharmony_ci /* See XENBUS_FUNCTIONS_CALLS in pvcalls.h */ 11618c2ecf20Sopenharmony_ci if (function_calls != 1) 11628c2ecf20Sopenharmony_ci return -ENODEV; 11638c2ecf20Sopenharmony_ci pr_info("%s max-page-order is %u\n", __func__, max_page_order); 11648c2ecf20Sopenharmony_ci 11658c2ecf20Sopenharmony_ci bedata = kzalloc(sizeof(struct pvcalls_bedata), GFP_KERNEL); 11668c2ecf20Sopenharmony_ci if (!bedata) 11678c2ecf20Sopenharmony_ci return -ENOMEM; 11688c2ecf20Sopenharmony_ci 11698c2ecf20Sopenharmony_ci dev_set_drvdata(&dev->dev, bedata); 11708c2ecf20Sopenharmony_ci pvcalls_front_dev = dev; 11718c2ecf20Sopenharmony_ci init_waitqueue_head(&bedata->inflight_req); 11728c2ecf20Sopenharmony_ci INIT_LIST_HEAD(&bedata->socket_mappings); 11738c2ecf20Sopenharmony_ci spin_lock_init(&bedata->socket_lock); 11748c2ecf20Sopenharmony_ci bedata->irq = -1; 11758c2ecf20Sopenharmony_ci bedata->ref = -1; 11768c2ecf20Sopenharmony_ci 11778c2ecf20Sopenharmony_ci for (i = 0; i < PVCALLS_NR_RSP_PER_RING; i++) 11788c2ecf20Sopenharmony_ci bedata->rsp[i].req_id = PVCALLS_INVALID_ID; 11798c2ecf20Sopenharmony_ci 11808c2ecf20Sopenharmony_ci sring = (struct xen_pvcalls_sring *) __get_free_page(GFP_KERNEL | 11818c2ecf20Sopenharmony_ci __GFP_ZERO); 11828c2ecf20Sopenharmony_ci if (!sring) 11838c2ecf20Sopenharmony_ci goto error; 11848c2ecf20Sopenharmony_ci SHARED_RING_INIT(sring); 11858c2ecf20Sopenharmony_ci FRONT_RING_INIT(&bedata->ring, sring, XEN_PAGE_SIZE); 11868c2ecf20Sopenharmony_ci 11878c2ecf20Sopenharmony_ci ret = xenbus_alloc_evtchn(dev, &evtchn); 11888c2ecf20Sopenharmony_ci if (ret) 11898c2ecf20Sopenharmony_ci goto error; 11908c2ecf20Sopenharmony_ci 11918c2ecf20Sopenharmony_ci bedata->irq = bind_evtchn_to_irqhandler(evtchn, 11928c2ecf20Sopenharmony_ci pvcalls_front_event_handler, 11938c2ecf20Sopenharmony_ci 0, "pvcalls-frontend", dev); 11948c2ecf20Sopenharmony_ci if (bedata->irq < 0) { 11958c2ecf20Sopenharmony_ci ret = bedata->irq; 11968c2ecf20Sopenharmony_ci goto error; 11978c2ecf20Sopenharmony_ci } 11988c2ecf20Sopenharmony_ci 11998c2ecf20Sopenharmony_ci ret = gnttab_alloc_grant_references(1, &gref_head); 12008c2ecf20Sopenharmony_ci if (ret < 0) 12018c2ecf20Sopenharmony_ci goto error; 12028c2ecf20Sopenharmony_ci ret = gnttab_claim_grant_reference(&gref_head); 12038c2ecf20Sopenharmony_ci if (ret < 0) 12048c2ecf20Sopenharmony_ci goto error; 12058c2ecf20Sopenharmony_ci bedata->ref = ret; 12068c2ecf20Sopenharmony_ci gnttab_grant_foreign_access_ref(bedata->ref, dev->otherend_id, 12078c2ecf20Sopenharmony_ci virt_to_gfn((void *)sring), 0); 12088c2ecf20Sopenharmony_ci 12098c2ecf20Sopenharmony_ci again: 12108c2ecf20Sopenharmony_ci ret = xenbus_transaction_start(&xbt); 12118c2ecf20Sopenharmony_ci if (ret) { 12128c2ecf20Sopenharmony_ci xenbus_dev_fatal(dev, ret, "starting transaction"); 12138c2ecf20Sopenharmony_ci goto error; 12148c2ecf20Sopenharmony_ci } 12158c2ecf20Sopenharmony_ci ret = xenbus_printf(xbt, dev->nodename, "version", "%u", 1); 12168c2ecf20Sopenharmony_ci if (ret) 12178c2ecf20Sopenharmony_ci goto error_xenbus; 12188c2ecf20Sopenharmony_ci ret = xenbus_printf(xbt, dev->nodename, "ring-ref", "%d", bedata->ref); 12198c2ecf20Sopenharmony_ci if (ret) 12208c2ecf20Sopenharmony_ci goto error_xenbus; 12218c2ecf20Sopenharmony_ci ret = xenbus_printf(xbt, dev->nodename, "port", "%u", 12228c2ecf20Sopenharmony_ci evtchn); 12238c2ecf20Sopenharmony_ci if (ret) 12248c2ecf20Sopenharmony_ci goto error_xenbus; 12258c2ecf20Sopenharmony_ci ret = xenbus_transaction_end(xbt, 0); 12268c2ecf20Sopenharmony_ci if (ret) { 12278c2ecf20Sopenharmony_ci if (ret == -EAGAIN) 12288c2ecf20Sopenharmony_ci goto again; 12298c2ecf20Sopenharmony_ci xenbus_dev_fatal(dev, ret, "completing transaction"); 12308c2ecf20Sopenharmony_ci goto error; 12318c2ecf20Sopenharmony_ci } 12328c2ecf20Sopenharmony_ci xenbus_switch_state(dev, XenbusStateInitialised); 12338c2ecf20Sopenharmony_ci 12348c2ecf20Sopenharmony_ci return 0; 12358c2ecf20Sopenharmony_ci 12368c2ecf20Sopenharmony_ci error_xenbus: 12378c2ecf20Sopenharmony_ci xenbus_transaction_end(xbt, 1); 12388c2ecf20Sopenharmony_ci xenbus_dev_fatal(dev, ret, "writing xenstore"); 12398c2ecf20Sopenharmony_ci error: 12408c2ecf20Sopenharmony_ci pvcalls_front_remove(dev); 12418c2ecf20Sopenharmony_ci return ret; 12428c2ecf20Sopenharmony_ci} 12438c2ecf20Sopenharmony_ci 12448c2ecf20Sopenharmony_cistatic void pvcalls_front_changed(struct xenbus_device *dev, 12458c2ecf20Sopenharmony_ci enum xenbus_state backend_state) 12468c2ecf20Sopenharmony_ci{ 12478c2ecf20Sopenharmony_ci switch (backend_state) { 12488c2ecf20Sopenharmony_ci case XenbusStateReconfiguring: 12498c2ecf20Sopenharmony_ci case XenbusStateReconfigured: 12508c2ecf20Sopenharmony_ci case XenbusStateInitialising: 12518c2ecf20Sopenharmony_ci case XenbusStateInitialised: 12528c2ecf20Sopenharmony_ci case XenbusStateUnknown: 12538c2ecf20Sopenharmony_ci break; 12548c2ecf20Sopenharmony_ci 12558c2ecf20Sopenharmony_ci case XenbusStateInitWait: 12568c2ecf20Sopenharmony_ci break; 12578c2ecf20Sopenharmony_ci 12588c2ecf20Sopenharmony_ci case XenbusStateConnected: 12598c2ecf20Sopenharmony_ci xenbus_switch_state(dev, XenbusStateConnected); 12608c2ecf20Sopenharmony_ci break; 12618c2ecf20Sopenharmony_ci 12628c2ecf20Sopenharmony_ci case XenbusStateClosed: 12638c2ecf20Sopenharmony_ci if (dev->state == XenbusStateClosed) 12648c2ecf20Sopenharmony_ci break; 12658c2ecf20Sopenharmony_ci /* Missed the backend's CLOSING state */ 12668c2ecf20Sopenharmony_ci fallthrough; 12678c2ecf20Sopenharmony_ci case XenbusStateClosing: 12688c2ecf20Sopenharmony_ci xenbus_frontend_closed(dev); 12698c2ecf20Sopenharmony_ci break; 12708c2ecf20Sopenharmony_ci } 12718c2ecf20Sopenharmony_ci} 12728c2ecf20Sopenharmony_ci 12738c2ecf20Sopenharmony_cistatic struct xenbus_driver pvcalls_front_driver = { 12748c2ecf20Sopenharmony_ci .ids = pvcalls_front_ids, 12758c2ecf20Sopenharmony_ci .probe = pvcalls_front_probe, 12768c2ecf20Sopenharmony_ci .remove = pvcalls_front_remove, 12778c2ecf20Sopenharmony_ci .otherend_changed = pvcalls_front_changed, 12788c2ecf20Sopenharmony_ci}; 12798c2ecf20Sopenharmony_ci 12808c2ecf20Sopenharmony_cistatic int __init pvcalls_frontend_init(void) 12818c2ecf20Sopenharmony_ci{ 12828c2ecf20Sopenharmony_ci if (!xen_domain()) 12838c2ecf20Sopenharmony_ci return -ENODEV; 12848c2ecf20Sopenharmony_ci 12858c2ecf20Sopenharmony_ci pr_info("Initialising Xen pvcalls frontend driver\n"); 12868c2ecf20Sopenharmony_ci 12878c2ecf20Sopenharmony_ci return xenbus_register_frontend(&pvcalls_front_driver); 12888c2ecf20Sopenharmony_ci} 12898c2ecf20Sopenharmony_ci 12908c2ecf20Sopenharmony_cimodule_init(pvcalls_frontend_init); 12918c2ecf20Sopenharmony_ci 12928c2ecf20Sopenharmony_ciMODULE_DESCRIPTION("Xen PV Calls frontend driver"); 12938c2ecf20Sopenharmony_ciMODULE_AUTHOR("Stefano Stabellini <sstabellini@kernel.org>"); 12948c2ecf20Sopenharmony_ciMODULE_LICENSE("GPL"); 1295