/*
 * Copyright (c) 2005 Voltaire Inc.  All rights reserved.
 * Copyright (c) 2002-2005, Network Appliance, Inc. All rights reserved.
 * Copyright (c) 1999-2005, Mellanox Technologies, Inc. All rights reserved.
 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
3562306a36Sopenharmony_ci
3662306a36Sopenharmony_ci#include <linux/mutex.h>
3762306a36Sopenharmony_ci#include <linux/inetdevice.h>
3862306a36Sopenharmony_ci#include <linux/slab.h>
3962306a36Sopenharmony_ci#include <linux/workqueue.h>
4062306a36Sopenharmony_ci#include <net/arp.h>
4162306a36Sopenharmony_ci#include <net/neighbour.h>
4262306a36Sopenharmony_ci#include <net/route.h>
4362306a36Sopenharmony_ci#include <net/netevent.h>
4462306a36Sopenharmony_ci#include <net/ipv6_stubs.h>
4562306a36Sopenharmony_ci#include <net/ip6_route.h>
4662306a36Sopenharmony_ci#include <rdma/ib_addr.h>
4762306a36Sopenharmony_ci#include <rdma/ib_cache.h>
4862306a36Sopenharmony_ci#include <rdma/ib_sa.h>
4962306a36Sopenharmony_ci#include <rdma/ib.h>
5062306a36Sopenharmony_ci#include <rdma/rdma_netlink.h>
5162306a36Sopenharmony_ci#include <net/netlink.h>
5262306a36Sopenharmony_ci
5362306a36Sopenharmony_ci#include "core_priv.h"
5462306a36Sopenharmony_ci
5562306a36Sopenharmony_cistruct addr_req {
5662306a36Sopenharmony_ci	struct list_head list;
5762306a36Sopenharmony_ci	struct sockaddr_storage src_addr;
5862306a36Sopenharmony_ci	struct sockaddr_storage dst_addr;
5962306a36Sopenharmony_ci	struct rdma_dev_addr *addr;
6062306a36Sopenharmony_ci	void *context;
6162306a36Sopenharmony_ci	void (*callback)(int status, struct sockaddr *src_addr,
6262306a36Sopenharmony_ci			 struct rdma_dev_addr *addr, void *context);
6362306a36Sopenharmony_ci	unsigned long timeout;
6462306a36Sopenharmony_ci	struct delayed_work work;
6562306a36Sopenharmony_ci	bool resolve_by_gid_attr;	/* Consider gid attr in resolve phase */
6662306a36Sopenharmony_ci	int status;
6762306a36Sopenharmony_ci	u32 seq;
6862306a36Sopenharmony_ci};
6962306a36Sopenharmony_ci
7062306a36Sopenharmony_cistatic atomic_t ib_nl_addr_request_seq = ATOMIC_INIT(0);
7162306a36Sopenharmony_ci
7262306a36Sopenharmony_cistatic DEFINE_SPINLOCK(lock);
7362306a36Sopenharmony_cistatic LIST_HEAD(req_list);
7462306a36Sopenharmony_cistatic struct workqueue_struct *addr_wq;
7562306a36Sopenharmony_ci
7662306a36Sopenharmony_cistatic const struct nla_policy ib_nl_addr_policy[LS_NLA_TYPE_MAX] = {
7762306a36Sopenharmony_ci	[LS_NLA_TYPE_DGID] = {.type = NLA_BINARY,
7862306a36Sopenharmony_ci		.len = sizeof(struct rdma_nla_ls_gid),
7962306a36Sopenharmony_ci		.validation_type = NLA_VALIDATE_MIN,
8062306a36Sopenharmony_ci		.min = sizeof(struct rdma_nla_ls_gid)},
8162306a36Sopenharmony_ci};
8262306a36Sopenharmony_ci
8362306a36Sopenharmony_cistatic inline bool ib_nl_is_good_ip_resp(const struct nlmsghdr *nlh)
8462306a36Sopenharmony_ci{
8562306a36Sopenharmony_ci	struct nlattr *tb[LS_NLA_TYPE_MAX] = {};
8662306a36Sopenharmony_ci	int ret;
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	if (nlh->nlmsg_flags & RDMA_NL_LS_F_ERR)
8962306a36Sopenharmony_ci		return false;
9062306a36Sopenharmony_ci
9162306a36Sopenharmony_ci	ret = nla_parse_deprecated(tb, LS_NLA_TYPE_MAX - 1, nlmsg_data(nlh),
9262306a36Sopenharmony_ci				   nlmsg_len(nlh), ib_nl_addr_policy, NULL);
9362306a36Sopenharmony_ci	if (ret)
9462306a36Sopenharmony_ci		return false;
9562306a36Sopenharmony_ci
9662306a36Sopenharmony_ci	return true;
9762306a36Sopenharmony_ci}
9862306a36Sopenharmony_ci
9962306a36Sopenharmony_cistatic void ib_nl_process_good_ip_rsep(const struct nlmsghdr *nlh)
10062306a36Sopenharmony_ci{
10162306a36Sopenharmony_ci	const struct nlattr *head, *curr;
10262306a36Sopenharmony_ci	union ib_gid gid;
10362306a36Sopenharmony_ci	struct addr_req *req;
10462306a36Sopenharmony_ci	int len, rem;
10562306a36Sopenharmony_ci	int found = 0;
10662306a36Sopenharmony_ci
10762306a36Sopenharmony_ci	head = (const struct nlattr *)nlmsg_data(nlh);
10862306a36Sopenharmony_ci	len = nlmsg_len(nlh);
10962306a36Sopenharmony_ci
11062306a36Sopenharmony_ci	nla_for_each_attr(curr, head, len, rem) {
11162306a36Sopenharmony_ci		if (curr->nla_type == LS_NLA_TYPE_DGID)
11262306a36Sopenharmony_ci			memcpy(&gid, nla_data(curr), nla_len(curr));
11362306a36Sopenharmony_ci	}
11462306a36Sopenharmony_ci
11562306a36Sopenharmony_ci	spin_lock_bh(&lock);
11662306a36Sopenharmony_ci	list_for_each_entry(req, &req_list, list) {
11762306a36Sopenharmony_ci		if (nlh->nlmsg_seq != req->seq)
11862306a36Sopenharmony_ci			continue;
11962306a36Sopenharmony_ci		/* We set the DGID part, the rest was set earlier */
12062306a36Sopenharmony_ci		rdma_addr_set_dgid(req->addr, &gid);
12162306a36Sopenharmony_ci		req->status = 0;
12262306a36Sopenharmony_ci		found = 1;
12362306a36Sopenharmony_ci		break;
12462306a36Sopenharmony_ci	}
12562306a36Sopenharmony_ci	spin_unlock_bh(&lock);
12662306a36Sopenharmony_ci
12762306a36Sopenharmony_ci	if (!found)
12862306a36Sopenharmony_ci		pr_info("Couldn't find request waiting for DGID: %pI6\n",
12962306a36Sopenharmony_ci			&gid);
13062306a36Sopenharmony_ci}
13162306a36Sopenharmony_ci
13262306a36Sopenharmony_ciint ib_nl_handle_ip_res_resp(struct sk_buff *skb,
13362306a36Sopenharmony_ci			     struct nlmsghdr *nlh,
13462306a36Sopenharmony_ci			     struct netlink_ext_ack *extack)
13562306a36Sopenharmony_ci{
13662306a36Sopenharmony_ci	if ((nlh->nlmsg_flags & NLM_F_REQUEST) ||
13762306a36Sopenharmony_ci	    !(NETLINK_CB(skb).sk))
13862306a36Sopenharmony_ci		return -EPERM;
13962306a36Sopenharmony_ci
14062306a36Sopenharmony_ci	if (ib_nl_is_good_ip_resp(nlh))
14162306a36Sopenharmony_ci		ib_nl_process_good_ip_rsep(nlh);
14262306a36Sopenharmony_ci
14362306a36Sopenharmony_ci	return 0;
14462306a36Sopenharmony_ci}
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_cistatic int ib_nl_ip_send_msg(struct rdma_dev_addr *dev_addr,
14762306a36Sopenharmony_ci			     const void *daddr,
14862306a36Sopenharmony_ci			     u32 seq, u16 family)
14962306a36Sopenharmony_ci{
15062306a36Sopenharmony_ci	struct sk_buff *skb = NULL;
15162306a36Sopenharmony_ci	struct nlmsghdr *nlh;
15262306a36Sopenharmony_ci	struct rdma_ls_ip_resolve_header *header;
15362306a36Sopenharmony_ci	void *data;
15462306a36Sopenharmony_ci	size_t size;
15562306a36Sopenharmony_ci	int attrtype;
15662306a36Sopenharmony_ci	int len;
15762306a36Sopenharmony_ci
15862306a36Sopenharmony_ci	if (family == AF_INET) {
15962306a36Sopenharmony_ci		size = sizeof(struct in_addr);
16062306a36Sopenharmony_ci		attrtype = RDMA_NLA_F_MANDATORY | LS_NLA_TYPE_IPV4;
16162306a36Sopenharmony_ci	} else {
16262306a36Sopenharmony_ci		size = sizeof(struct in6_addr);
16362306a36Sopenharmony_ci		attrtype = RDMA_NLA_F_MANDATORY | LS_NLA_TYPE_IPV6;
16462306a36Sopenharmony_ci	}
16562306a36Sopenharmony_ci
16662306a36Sopenharmony_ci	len = nla_total_size(sizeof(size));
16762306a36Sopenharmony_ci	len += NLMSG_ALIGN(sizeof(*header));
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_ci	skb = nlmsg_new(len, GFP_KERNEL);
17062306a36Sopenharmony_ci	if (!skb)
17162306a36Sopenharmony_ci		return -ENOMEM;
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_ci	data = ibnl_put_msg(skb, &nlh, seq, 0, RDMA_NL_LS,
17462306a36Sopenharmony_ci			    RDMA_NL_LS_OP_IP_RESOLVE, NLM_F_REQUEST);
17562306a36Sopenharmony_ci	if (!data) {
17662306a36Sopenharmony_ci		nlmsg_free(skb);
17762306a36Sopenharmony_ci		return -ENODATA;
17862306a36Sopenharmony_ci	}
17962306a36Sopenharmony_ci
18062306a36Sopenharmony_ci	/* Construct the family header first */
18162306a36Sopenharmony_ci	header = skb_put(skb, NLMSG_ALIGN(sizeof(*header)));
18262306a36Sopenharmony_ci	header->ifindex = dev_addr->bound_dev_if;
18362306a36Sopenharmony_ci	nla_put(skb, attrtype, size, daddr);
18462306a36Sopenharmony_ci
18562306a36Sopenharmony_ci	/* Repair the nlmsg header length */
18662306a36Sopenharmony_ci	nlmsg_end(skb, nlh);
18762306a36Sopenharmony_ci	rdma_nl_multicast(&init_net, skb, RDMA_NL_GROUP_LS, GFP_KERNEL);
18862306a36Sopenharmony_ci
18962306a36Sopenharmony_ci	/* Make the request retry, so when we get the response from userspace
19062306a36Sopenharmony_ci	 * we will have something.
19162306a36Sopenharmony_ci	 */
19262306a36Sopenharmony_ci	return -ENODATA;
19362306a36Sopenharmony_ci}
19462306a36Sopenharmony_ci
19562306a36Sopenharmony_ciint rdma_addr_size(const struct sockaddr *addr)
19662306a36Sopenharmony_ci{
19762306a36Sopenharmony_ci	switch (addr->sa_family) {
19862306a36Sopenharmony_ci	case AF_INET:
19962306a36Sopenharmony_ci		return sizeof(struct sockaddr_in);
20062306a36Sopenharmony_ci	case AF_INET6:
20162306a36Sopenharmony_ci		return sizeof(struct sockaddr_in6);
20262306a36Sopenharmony_ci	case AF_IB:
20362306a36Sopenharmony_ci		return sizeof(struct sockaddr_ib);
20462306a36Sopenharmony_ci	default:
20562306a36Sopenharmony_ci		return 0;
20662306a36Sopenharmony_ci	}
20762306a36Sopenharmony_ci}
20862306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_addr_size);
20962306a36Sopenharmony_ci
21062306a36Sopenharmony_ciint rdma_addr_size_in6(struct sockaddr_in6 *addr)
21162306a36Sopenharmony_ci{
21262306a36Sopenharmony_ci	int ret = rdma_addr_size((struct sockaddr *) addr);
21362306a36Sopenharmony_ci
21462306a36Sopenharmony_ci	return ret <= sizeof(*addr) ? ret : 0;
21562306a36Sopenharmony_ci}
21662306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_addr_size_in6);
21762306a36Sopenharmony_ci
21862306a36Sopenharmony_ciint rdma_addr_size_kss(struct __kernel_sockaddr_storage *addr)
21962306a36Sopenharmony_ci{
22062306a36Sopenharmony_ci	int ret = rdma_addr_size((struct sockaddr *) addr);
22162306a36Sopenharmony_ci
22262306a36Sopenharmony_ci	return ret <= sizeof(*addr) ? ret : 0;
22362306a36Sopenharmony_ci}
22462306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_addr_size_kss);
22562306a36Sopenharmony_ci
22662306a36Sopenharmony_ci/**
22762306a36Sopenharmony_ci * rdma_copy_src_l2_addr - Copy netdevice source addresses
22862306a36Sopenharmony_ci * @dev_addr:	Destination address pointer where to copy the addresses
22962306a36Sopenharmony_ci * @dev:	Netdevice whose source addresses to copy
23062306a36Sopenharmony_ci *
23162306a36Sopenharmony_ci * rdma_copy_src_l2_addr() copies source addresses from the specified netdevice.
23262306a36Sopenharmony_ci * This includes unicast address, broadcast address, device type and
23362306a36Sopenharmony_ci * interface index.
23462306a36Sopenharmony_ci */
23562306a36Sopenharmony_civoid rdma_copy_src_l2_addr(struct rdma_dev_addr *dev_addr,
23662306a36Sopenharmony_ci			   const struct net_device *dev)
23762306a36Sopenharmony_ci{
23862306a36Sopenharmony_ci	dev_addr->dev_type = dev->type;
23962306a36Sopenharmony_ci	memcpy(dev_addr->src_dev_addr, dev->dev_addr, MAX_ADDR_LEN);
24062306a36Sopenharmony_ci	memcpy(dev_addr->broadcast, dev->broadcast, MAX_ADDR_LEN);
24162306a36Sopenharmony_ci	dev_addr->bound_dev_if = dev->ifindex;
24262306a36Sopenharmony_ci}
24362306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_copy_src_l2_addr);
24462306a36Sopenharmony_ci
24562306a36Sopenharmony_cistatic struct net_device *
24662306a36Sopenharmony_cirdma_find_ndev_for_src_ip_rcu(struct net *net, const struct sockaddr *src_in)
24762306a36Sopenharmony_ci{
24862306a36Sopenharmony_ci	struct net_device *dev = NULL;
24962306a36Sopenharmony_ci	int ret = -EADDRNOTAVAIL;
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	switch (src_in->sa_family) {
25262306a36Sopenharmony_ci	case AF_INET:
25362306a36Sopenharmony_ci		dev = __ip_dev_find(net,
25462306a36Sopenharmony_ci				    ((const struct sockaddr_in *)src_in)->sin_addr.s_addr,
25562306a36Sopenharmony_ci				    false);
25662306a36Sopenharmony_ci		if (dev)
25762306a36Sopenharmony_ci			ret = 0;
25862306a36Sopenharmony_ci		break;
25962306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_IPV6)
26062306a36Sopenharmony_ci	case AF_INET6:
26162306a36Sopenharmony_ci		for_each_netdev_rcu(net, dev) {
26262306a36Sopenharmony_ci			if (ipv6_chk_addr(net,
26362306a36Sopenharmony_ci					  &((const struct sockaddr_in6 *)src_in)->sin6_addr,
26462306a36Sopenharmony_ci					  dev, 1)) {
26562306a36Sopenharmony_ci				ret = 0;
26662306a36Sopenharmony_ci				break;
26762306a36Sopenharmony_ci			}
26862306a36Sopenharmony_ci		}
26962306a36Sopenharmony_ci		break;
27062306a36Sopenharmony_ci#endif
27162306a36Sopenharmony_ci	}
27262306a36Sopenharmony_ci	return ret ? ERR_PTR(ret) : dev;
27362306a36Sopenharmony_ci}
27462306a36Sopenharmony_ci
27562306a36Sopenharmony_ciint rdma_translate_ip(const struct sockaddr *addr,
27662306a36Sopenharmony_ci		      struct rdma_dev_addr *dev_addr)
27762306a36Sopenharmony_ci{
27862306a36Sopenharmony_ci	struct net_device *dev;
27962306a36Sopenharmony_ci
28062306a36Sopenharmony_ci	if (dev_addr->bound_dev_if) {
28162306a36Sopenharmony_ci		dev = dev_get_by_index(dev_addr->net, dev_addr->bound_dev_if);
28262306a36Sopenharmony_ci		if (!dev)
28362306a36Sopenharmony_ci			return -ENODEV;
28462306a36Sopenharmony_ci		rdma_copy_src_l2_addr(dev_addr, dev);
28562306a36Sopenharmony_ci		dev_put(dev);
28662306a36Sopenharmony_ci		return 0;
28762306a36Sopenharmony_ci	}
28862306a36Sopenharmony_ci
28962306a36Sopenharmony_ci	rcu_read_lock();
29062306a36Sopenharmony_ci	dev = rdma_find_ndev_for_src_ip_rcu(dev_addr->net, addr);
29162306a36Sopenharmony_ci	if (!IS_ERR(dev))
29262306a36Sopenharmony_ci		rdma_copy_src_l2_addr(dev_addr, dev);
29362306a36Sopenharmony_ci	rcu_read_unlock();
29462306a36Sopenharmony_ci	return PTR_ERR_OR_ZERO(dev);
29562306a36Sopenharmony_ci}
29662306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_translate_ip);
29762306a36Sopenharmony_ci
29862306a36Sopenharmony_cistatic void set_timeout(struct addr_req *req, unsigned long time)
29962306a36Sopenharmony_ci{
30062306a36Sopenharmony_ci	unsigned long delay;
30162306a36Sopenharmony_ci
30262306a36Sopenharmony_ci	delay = time - jiffies;
30362306a36Sopenharmony_ci	if ((long)delay < 0)
30462306a36Sopenharmony_ci		delay = 0;
30562306a36Sopenharmony_ci
30662306a36Sopenharmony_ci	mod_delayed_work(addr_wq, &req->work, delay);
30762306a36Sopenharmony_ci}
30862306a36Sopenharmony_ci
30962306a36Sopenharmony_cistatic void queue_req(struct addr_req *req)
31062306a36Sopenharmony_ci{
31162306a36Sopenharmony_ci	spin_lock_bh(&lock);
31262306a36Sopenharmony_ci	list_add_tail(&req->list, &req_list);
31362306a36Sopenharmony_ci	set_timeout(req, req->timeout);
31462306a36Sopenharmony_ci	spin_unlock_bh(&lock);
31562306a36Sopenharmony_ci}
31662306a36Sopenharmony_ci
31762306a36Sopenharmony_cistatic int ib_nl_fetch_ha(struct rdma_dev_addr *dev_addr,
31862306a36Sopenharmony_ci			  const void *daddr, u32 seq, u16 family)
31962306a36Sopenharmony_ci{
32062306a36Sopenharmony_ci	if (!rdma_nl_chk_listeners(RDMA_NL_GROUP_LS))
32162306a36Sopenharmony_ci		return -EADDRNOTAVAIL;
32262306a36Sopenharmony_ci
32362306a36Sopenharmony_ci	return ib_nl_ip_send_msg(dev_addr, daddr, seq, family);
32462306a36Sopenharmony_ci}
32562306a36Sopenharmony_ci
32662306a36Sopenharmony_cistatic int dst_fetch_ha(const struct dst_entry *dst,
32762306a36Sopenharmony_ci			struct rdma_dev_addr *dev_addr,
32862306a36Sopenharmony_ci			const void *daddr)
32962306a36Sopenharmony_ci{
33062306a36Sopenharmony_ci	struct neighbour *n;
33162306a36Sopenharmony_ci	int ret = 0;
33262306a36Sopenharmony_ci
33362306a36Sopenharmony_ci	n = dst_neigh_lookup(dst, daddr);
33462306a36Sopenharmony_ci	if (!n)
33562306a36Sopenharmony_ci		return -ENODATA;
33662306a36Sopenharmony_ci
33762306a36Sopenharmony_ci	if (!(n->nud_state & NUD_VALID)) {
33862306a36Sopenharmony_ci		neigh_event_send(n, NULL);
33962306a36Sopenharmony_ci		ret = -ENODATA;
34062306a36Sopenharmony_ci	} else {
34162306a36Sopenharmony_ci		neigh_ha_snapshot(dev_addr->dst_dev_addr, n, dst->dev);
34262306a36Sopenharmony_ci	}
34362306a36Sopenharmony_ci
34462306a36Sopenharmony_ci	neigh_release(n);
34562306a36Sopenharmony_ci
34662306a36Sopenharmony_ci	return ret;
34762306a36Sopenharmony_ci}
34862306a36Sopenharmony_ci
34962306a36Sopenharmony_cistatic bool has_gateway(const struct dst_entry *dst, sa_family_t family)
35062306a36Sopenharmony_ci{
35162306a36Sopenharmony_ci	struct rtable *rt;
35262306a36Sopenharmony_ci	struct rt6_info *rt6;
35362306a36Sopenharmony_ci
35462306a36Sopenharmony_ci	if (family == AF_INET) {
35562306a36Sopenharmony_ci		rt = container_of(dst, struct rtable, dst);
35662306a36Sopenharmony_ci		return rt->rt_uses_gateway;
35762306a36Sopenharmony_ci	}
35862306a36Sopenharmony_ci
35962306a36Sopenharmony_ci	rt6 = container_of(dst, struct rt6_info, dst);
36062306a36Sopenharmony_ci	return rt6->rt6i_flags & RTF_GATEWAY;
36162306a36Sopenharmony_ci}
36262306a36Sopenharmony_ci
36362306a36Sopenharmony_cistatic int fetch_ha(const struct dst_entry *dst, struct rdma_dev_addr *dev_addr,
36462306a36Sopenharmony_ci		    const struct sockaddr *dst_in, u32 seq)
36562306a36Sopenharmony_ci{
36662306a36Sopenharmony_ci	const struct sockaddr_in *dst_in4 =
36762306a36Sopenharmony_ci		(const struct sockaddr_in *)dst_in;
36862306a36Sopenharmony_ci	const struct sockaddr_in6 *dst_in6 =
36962306a36Sopenharmony_ci		(const struct sockaddr_in6 *)dst_in;
37062306a36Sopenharmony_ci	const void *daddr = (dst_in->sa_family == AF_INET) ?
37162306a36Sopenharmony_ci		(const void *)&dst_in4->sin_addr.s_addr :
37262306a36Sopenharmony_ci		(const void *)&dst_in6->sin6_addr;
37362306a36Sopenharmony_ci	sa_family_t family = dst_in->sa_family;
37462306a36Sopenharmony_ci
37562306a36Sopenharmony_ci	might_sleep();
37662306a36Sopenharmony_ci
37762306a36Sopenharmony_ci	/* If we have a gateway in IB mode then it must be an IB network */
37862306a36Sopenharmony_ci	if (has_gateway(dst, family) && dev_addr->network == RDMA_NETWORK_IB)
37962306a36Sopenharmony_ci		return ib_nl_fetch_ha(dev_addr, daddr, seq, family);
38062306a36Sopenharmony_ci	else
38162306a36Sopenharmony_ci		return dst_fetch_ha(dst, dev_addr, daddr);
38262306a36Sopenharmony_ci}
38362306a36Sopenharmony_ci
38462306a36Sopenharmony_cistatic int addr4_resolve(struct sockaddr *src_sock,
38562306a36Sopenharmony_ci			 const struct sockaddr *dst_sock,
38662306a36Sopenharmony_ci			 struct rdma_dev_addr *addr,
38762306a36Sopenharmony_ci			 struct rtable **prt)
38862306a36Sopenharmony_ci{
38962306a36Sopenharmony_ci	struct sockaddr_in *src_in = (struct sockaddr_in *)src_sock;
39062306a36Sopenharmony_ci	const struct sockaddr_in *dst_in =
39162306a36Sopenharmony_ci			(const struct sockaddr_in *)dst_sock;
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_ci	__be32 src_ip = src_in->sin_addr.s_addr;
39462306a36Sopenharmony_ci	__be32 dst_ip = dst_in->sin_addr.s_addr;
39562306a36Sopenharmony_ci	struct rtable *rt;
39662306a36Sopenharmony_ci	struct flowi4 fl4;
39762306a36Sopenharmony_ci	int ret;
39862306a36Sopenharmony_ci
39962306a36Sopenharmony_ci	memset(&fl4, 0, sizeof(fl4));
40062306a36Sopenharmony_ci	fl4.daddr = dst_ip;
40162306a36Sopenharmony_ci	fl4.saddr = src_ip;
40262306a36Sopenharmony_ci	fl4.flowi4_oif = addr->bound_dev_if;
40362306a36Sopenharmony_ci	rt = ip_route_output_key(addr->net, &fl4);
40462306a36Sopenharmony_ci	ret = PTR_ERR_OR_ZERO(rt);
40562306a36Sopenharmony_ci	if (ret)
40662306a36Sopenharmony_ci		return ret;
40762306a36Sopenharmony_ci
40862306a36Sopenharmony_ci	src_in->sin_addr.s_addr = fl4.saddr;
40962306a36Sopenharmony_ci
41062306a36Sopenharmony_ci	addr->hoplimit = ip4_dst_hoplimit(&rt->dst);
41162306a36Sopenharmony_ci
41262306a36Sopenharmony_ci	*prt = rt;
41362306a36Sopenharmony_ci	return 0;
41462306a36Sopenharmony_ci}
41562306a36Sopenharmony_ci
41662306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_IPV6)
41762306a36Sopenharmony_cistatic int addr6_resolve(struct sockaddr *src_sock,
41862306a36Sopenharmony_ci			 const struct sockaddr *dst_sock,
41962306a36Sopenharmony_ci			 struct rdma_dev_addr *addr,
42062306a36Sopenharmony_ci			 struct dst_entry **pdst)
42162306a36Sopenharmony_ci{
42262306a36Sopenharmony_ci	struct sockaddr_in6 *src_in = (struct sockaddr_in6 *)src_sock;
42362306a36Sopenharmony_ci	const struct sockaddr_in6 *dst_in =
42462306a36Sopenharmony_ci				(const struct sockaddr_in6 *)dst_sock;
42562306a36Sopenharmony_ci	struct flowi6 fl6;
42662306a36Sopenharmony_ci	struct dst_entry *dst;
42762306a36Sopenharmony_ci
42862306a36Sopenharmony_ci	memset(&fl6, 0, sizeof fl6);
42962306a36Sopenharmony_ci	fl6.daddr = dst_in->sin6_addr;
43062306a36Sopenharmony_ci	fl6.saddr = src_in->sin6_addr;
43162306a36Sopenharmony_ci	fl6.flowi6_oif = addr->bound_dev_if;
43262306a36Sopenharmony_ci
43362306a36Sopenharmony_ci	dst = ipv6_stub->ipv6_dst_lookup_flow(addr->net, NULL, &fl6, NULL);
43462306a36Sopenharmony_ci	if (IS_ERR(dst))
43562306a36Sopenharmony_ci		return PTR_ERR(dst);
43662306a36Sopenharmony_ci
43762306a36Sopenharmony_ci	if (ipv6_addr_any(&src_in->sin6_addr))
43862306a36Sopenharmony_ci		src_in->sin6_addr = fl6.saddr;
43962306a36Sopenharmony_ci
44062306a36Sopenharmony_ci	addr->hoplimit = ip6_dst_hoplimit(dst);
44162306a36Sopenharmony_ci
44262306a36Sopenharmony_ci	*pdst = dst;
44362306a36Sopenharmony_ci	return 0;
44462306a36Sopenharmony_ci}
44562306a36Sopenharmony_ci#else
44662306a36Sopenharmony_cistatic int addr6_resolve(struct sockaddr *src_sock,
44762306a36Sopenharmony_ci			 const struct sockaddr *dst_sock,
44862306a36Sopenharmony_ci			 struct rdma_dev_addr *addr,
44962306a36Sopenharmony_ci			 struct dst_entry **pdst)
45062306a36Sopenharmony_ci{
45162306a36Sopenharmony_ci	return -EADDRNOTAVAIL;
45262306a36Sopenharmony_ci}
45362306a36Sopenharmony_ci#endif
45462306a36Sopenharmony_ci
45562306a36Sopenharmony_cistatic int addr_resolve_neigh(const struct dst_entry *dst,
45662306a36Sopenharmony_ci			      const struct sockaddr *dst_in,
45762306a36Sopenharmony_ci			      struct rdma_dev_addr *addr,
45862306a36Sopenharmony_ci			      unsigned int ndev_flags,
45962306a36Sopenharmony_ci			      u32 seq)
46062306a36Sopenharmony_ci{
46162306a36Sopenharmony_ci	int ret = 0;
46262306a36Sopenharmony_ci
46362306a36Sopenharmony_ci	if (ndev_flags & IFF_LOOPBACK) {
46462306a36Sopenharmony_ci		memcpy(addr->dst_dev_addr, addr->src_dev_addr, MAX_ADDR_LEN);
46562306a36Sopenharmony_ci	} else {
46662306a36Sopenharmony_ci		if (!(ndev_flags & IFF_NOARP)) {
46762306a36Sopenharmony_ci			/* If the device doesn't do ARP internally */
46862306a36Sopenharmony_ci			ret = fetch_ha(dst, addr, dst_in, seq);
46962306a36Sopenharmony_ci		}
47062306a36Sopenharmony_ci	}
47162306a36Sopenharmony_ci	return ret;
47262306a36Sopenharmony_ci}
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_cistatic int copy_src_l2_addr(struct rdma_dev_addr *dev_addr,
47562306a36Sopenharmony_ci			    const struct sockaddr *dst_in,
47662306a36Sopenharmony_ci			    const struct dst_entry *dst,
47762306a36Sopenharmony_ci			    const struct net_device *ndev)
47862306a36Sopenharmony_ci{
47962306a36Sopenharmony_ci	int ret = 0;
48062306a36Sopenharmony_ci
48162306a36Sopenharmony_ci	if (dst->dev->flags & IFF_LOOPBACK)
48262306a36Sopenharmony_ci		ret = rdma_translate_ip(dst_in, dev_addr);
48362306a36Sopenharmony_ci	else
48462306a36Sopenharmony_ci		rdma_copy_src_l2_addr(dev_addr, dst->dev);
48562306a36Sopenharmony_ci
48662306a36Sopenharmony_ci	/*
48762306a36Sopenharmony_ci	 * If there's a gateway and type of device not ARPHRD_INFINIBAND,
48862306a36Sopenharmony_ci	 * we're definitely in RoCE v2 (as RoCE v1 isn't routable) set the
48962306a36Sopenharmony_ci	 * network type accordingly.
49062306a36Sopenharmony_ci	 */
49162306a36Sopenharmony_ci	if (has_gateway(dst, dst_in->sa_family) &&
49262306a36Sopenharmony_ci	    ndev->type != ARPHRD_INFINIBAND)
49362306a36Sopenharmony_ci		dev_addr->network = dst_in->sa_family == AF_INET ?
49462306a36Sopenharmony_ci						RDMA_NETWORK_IPV4 :
49562306a36Sopenharmony_ci						RDMA_NETWORK_IPV6;
49662306a36Sopenharmony_ci	else
49762306a36Sopenharmony_ci		dev_addr->network = RDMA_NETWORK_IB;
49862306a36Sopenharmony_ci
49962306a36Sopenharmony_ci	return ret;
50062306a36Sopenharmony_ci}
50162306a36Sopenharmony_ci
50262306a36Sopenharmony_cistatic int rdma_set_src_addr_rcu(struct rdma_dev_addr *dev_addr,
50362306a36Sopenharmony_ci				 unsigned int *ndev_flags,
50462306a36Sopenharmony_ci				 const struct sockaddr *dst_in,
50562306a36Sopenharmony_ci				 const struct dst_entry *dst)
50662306a36Sopenharmony_ci{
50762306a36Sopenharmony_ci	struct net_device *ndev = READ_ONCE(dst->dev);
50862306a36Sopenharmony_ci
50962306a36Sopenharmony_ci	*ndev_flags = ndev->flags;
51062306a36Sopenharmony_ci	/* A physical device must be the RDMA device to use */
51162306a36Sopenharmony_ci	if (ndev->flags & IFF_LOOPBACK) {
51262306a36Sopenharmony_ci		/*
51362306a36Sopenharmony_ci		 * RDMA (IB/RoCE, iWarp) doesn't run on lo interface or
51462306a36Sopenharmony_ci		 * loopback IP address. So if route is resolved to loopback
51562306a36Sopenharmony_ci		 * interface, translate that to a real ndev based on non
51662306a36Sopenharmony_ci		 * loopback IP address.
51762306a36Sopenharmony_ci		 */
51862306a36Sopenharmony_ci		ndev = rdma_find_ndev_for_src_ip_rcu(dev_net(ndev), dst_in);
51962306a36Sopenharmony_ci		if (IS_ERR(ndev))
52062306a36Sopenharmony_ci			return -ENODEV;
52162306a36Sopenharmony_ci	}
52262306a36Sopenharmony_ci
52362306a36Sopenharmony_ci	return copy_src_l2_addr(dev_addr, dst_in, dst, ndev);
52462306a36Sopenharmony_ci}
52562306a36Sopenharmony_ci
52662306a36Sopenharmony_cistatic int set_addr_netns_by_gid_rcu(struct rdma_dev_addr *addr)
52762306a36Sopenharmony_ci{
52862306a36Sopenharmony_ci	struct net_device *ndev;
52962306a36Sopenharmony_ci
53062306a36Sopenharmony_ci	ndev = rdma_read_gid_attr_ndev_rcu(addr->sgid_attr);
53162306a36Sopenharmony_ci	if (IS_ERR(ndev))
53262306a36Sopenharmony_ci		return PTR_ERR(ndev);
53362306a36Sopenharmony_ci
53462306a36Sopenharmony_ci	/*
53562306a36Sopenharmony_ci	 * Since we are holding the rcu, reading net and ifindex
53662306a36Sopenharmony_ci	 * are safe without any additional reference; because
53762306a36Sopenharmony_ci	 * change_net_namespace() in net/core/dev.c does rcu sync
53862306a36Sopenharmony_ci	 * after it changes the state to IFF_DOWN and before
53962306a36Sopenharmony_ci	 * updating netdev fields {net, ifindex}.
54062306a36Sopenharmony_ci	 */
54162306a36Sopenharmony_ci	addr->net = dev_net(ndev);
54262306a36Sopenharmony_ci	addr->bound_dev_if = ndev->ifindex;
54362306a36Sopenharmony_ci	return 0;
54462306a36Sopenharmony_ci}
54562306a36Sopenharmony_ci
54662306a36Sopenharmony_cistatic void rdma_addr_set_net_defaults(struct rdma_dev_addr *addr)
54762306a36Sopenharmony_ci{
54862306a36Sopenharmony_ci	addr->net = &init_net;
54962306a36Sopenharmony_ci	addr->bound_dev_if = 0;
55062306a36Sopenharmony_ci}
55162306a36Sopenharmony_ci
55262306a36Sopenharmony_cistatic int addr_resolve(struct sockaddr *src_in,
55362306a36Sopenharmony_ci			const struct sockaddr *dst_in,
55462306a36Sopenharmony_ci			struct rdma_dev_addr *addr,
55562306a36Sopenharmony_ci			bool resolve_neigh,
55662306a36Sopenharmony_ci			bool resolve_by_gid_attr,
55762306a36Sopenharmony_ci			u32 seq)
55862306a36Sopenharmony_ci{
55962306a36Sopenharmony_ci	struct dst_entry *dst = NULL;
56062306a36Sopenharmony_ci	unsigned int ndev_flags = 0;
56162306a36Sopenharmony_ci	struct rtable *rt = NULL;
56262306a36Sopenharmony_ci	int ret;
56362306a36Sopenharmony_ci
56462306a36Sopenharmony_ci	if (!addr->net) {
56562306a36Sopenharmony_ci		pr_warn_ratelimited("%s: missing namespace\n", __func__);
56662306a36Sopenharmony_ci		return -EINVAL;
56762306a36Sopenharmony_ci	}
56862306a36Sopenharmony_ci
56962306a36Sopenharmony_ci	rcu_read_lock();
57062306a36Sopenharmony_ci	if (resolve_by_gid_attr) {
57162306a36Sopenharmony_ci		if (!addr->sgid_attr) {
57262306a36Sopenharmony_ci			rcu_read_unlock();
57362306a36Sopenharmony_ci			pr_warn_ratelimited("%s: missing gid_attr\n", __func__);
57462306a36Sopenharmony_ci			return -EINVAL;
57562306a36Sopenharmony_ci		}
57662306a36Sopenharmony_ci		/*
57762306a36Sopenharmony_ci		 * If the request is for a specific gid attribute of the
57862306a36Sopenharmony_ci		 * rdma_dev_addr, derive net from the netdevice of the
57962306a36Sopenharmony_ci		 * GID attribute.
58062306a36Sopenharmony_ci		 */
58162306a36Sopenharmony_ci		ret = set_addr_netns_by_gid_rcu(addr);
58262306a36Sopenharmony_ci		if (ret) {
58362306a36Sopenharmony_ci			rcu_read_unlock();
58462306a36Sopenharmony_ci			return ret;
58562306a36Sopenharmony_ci		}
58662306a36Sopenharmony_ci	}
58762306a36Sopenharmony_ci	if (src_in->sa_family == AF_INET) {
58862306a36Sopenharmony_ci		ret = addr4_resolve(src_in, dst_in, addr, &rt);
58962306a36Sopenharmony_ci		dst = &rt->dst;
59062306a36Sopenharmony_ci	} else {
59162306a36Sopenharmony_ci		ret = addr6_resolve(src_in, dst_in, addr, &dst);
59262306a36Sopenharmony_ci	}
59362306a36Sopenharmony_ci	if (ret) {
59462306a36Sopenharmony_ci		rcu_read_unlock();
59562306a36Sopenharmony_ci		goto done;
59662306a36Sopenharmony_ci	}
59762306a36Sopenharmony_ci	ret = rdma_set_src_addr_rcu(addr, &ndev_flags, dst_in, dst);
59862306a36Sopenharmony_ci	rcu_read_unlock();
59962306a36Sopenharmony_ci
60062306a36Sopenharmony_ci	/*
60162306a36Sopenharmony_ci	 * Resolve neighbor destination address if requested and
60262306a36Sopenharmony_ci	 * only if src addr translation didn't fail.
60362306a36Sopenharmony_ci	 */
60462306a36Sopenharmony_ci	if (!ret && resolve_neigh)
60562306a36Sopenharmony_ci		ret = addr_resolve_neigh(dst, dst_in, addr, ndev_flags, seq);
60662306a36Sopenharmony_ci
60762306a36Sopenharmony_ci	if (src_in->sa_family == AF_INET)
60862306a36Sopenharmony_ci		ip_rt_put(rt);
60962306a36Sopenharmony_ci	else
61062306a36Sopenharmony_ci		dst_release(dst);
61162306a36Sopenharmony_cidone:
61262306a36Sopenharmony_ci	/*
61362306a36Sopenharmony_ci	 * Clear the addr net to go back to its original state, only if it was
61462306a36Sopenharmony_ci	 * derived from GID attribute in this context.
61562306a36Sopenharmony_ci	 */
61662306a36Sopenharmony_ci	if (resolve_by_gid_attr)
61762306a36Sopenharmony_ci		rdma_addr_set_net_defaults(addr);
61862306a36Sopenharmony_ci	return ret;
61962306a36Sopenharmony_ci}
62062306a36Sopenharmony_ci
62162306a36Sopenharmony_cistatic void process_one_req(struct work_struct *_work)
62262306a36Sopenharmony_ci{
62362306a36Sopenharmony_ci	struct addr_req *req;
62462306a36Sopenharmony_ci	struct sockaddr *src_in, *dst_in;
62562306a36Sopenharmony_ci
62662306a36Sopenharmony_ci	req = container_of(_work, struct addr_req, work.work);
62762306a36Sopenharmony_ci
62862306a36Sopenharmony_ci	if (req->status == -ENODATA) {
62962306a36Sopenharmony_ci		src_in = (struct sockaddr *)&req->src_addr;
63062306a36Sopenharmony_ci		dst_in = (struct sockaddr *)&req->dst_addr;
63162306a36Sopenharmony_ci		req->status = addr_resolve(src_in, dst_in, req->addr,
63262306a36Sopenharmony_ci					   true, req->resolve_by_gid_attr,
63362306a36Sopenharmony_ci					   req->seq);
63462306a36Sopenharmony_ci		if (req->status && time_after_eq(jiffies, req->timeout)) {
63562306a36Sopenharmony_ci			req->status = -ETIMEDOUT;
63662306a36Sopenharmony_ci		} else if (req->status == -ENODATA) {
63762306a36Sopenharmony_ci			/* requeue the work for retrying again */
63862306a36Sopenharmony_ci			spin_lock_bh(&lock);
63962306a36Sopenharmony_ci			if (!list_empty(&req->list))
64062306a36Sopenharmony_ci				set_timeout(req, req->timeout);
64162306a36Sopenharmony_ci			spin_unlock_bh(&lock);
64262306a36Sopenharmony_ci			return;
64362306a36Sopenharmony_ci		}
64462306a36Sopenharmony_ci	}
64562306a36Sopenharmony_ci
64662306a36Sopenharmony_ci	req->callback(req->status, (struct sockaddr *)&req->src_addr,
64762306a36Sopenharmony_ci		req->addr, req->context);
64862306a36Sopenharmony_ci	req->callback = NULL;
64962306a36Sopenharmony_ci
65062306a36Sopenharmony_ci	spin_lock_bh(&lock);
65162306a36Sopenharmony_ci	/*
65262306a36Sopenharmony_ci	 * Although the work will normally have been canceled by the workqueue,
65362306a36Sopenharmony_ci	 * it can still be requeued as long as it is on the req_list.
65462306a36Sopenharmony_ci	 */
65562306a36Sopenharmony_ci	cancel_delayed_work(&req->work);
65662306a36Sopenharmony_ci	if (!list_empty(&req->list)) {
65762306a36Sopenharmony_ci		list_del_init(&req->list);
65862306a36Sopenharmony_ci		kfree(req);
65962306a36Sopenharmony_ci	}
66062306a36Sopenharmony_ci	spin_unlock_bh(&lock);
66162306a36Sopenharmony_ci}
66262306a36Sopenharmony_ci
66362306a36Sopenharmony_ciint rdma_resolve_ip(struct sockaddr *src_addr, const struct sockaddr *dst_addr,
66462306a36Sopenharmony_ci		    struct rdma_dev_addr *addr, unsigned long timeout_ms,
66562306a36Sopenharmony_ci		    void (*callback)(int status, struct sockaddr *src_addr,
66662306a36Sopenharmony_ci				     struct rdma_dev_addr *addr, void *context),
66762306a36Sopenharmony_ci		    bool resolve_by_gid_attr, void *context)
66862306a36Sopenharmony_ci{
66962306a36Sopenharmony_ci	struct sockaddr *src_in, *dst_in;
67062306a36Sopenharmony_ci	struct addr_req *req;
67162306a36Sopenharmony_ci	int ret = 0;
67262306a36Sopenharmony_ci
67362306a36Sopenharmony_ci	req = kzalloc(sizeof *req, GFP_KERNEL);
67462306a36Sopenharmony_ci	if (!req)
67562306a36Sopenharmony_ci		return -ENOMEM;
67662306a36Sopenharmony_ci
67762306a36Sopenharmony_ci	src_in = (struct sockaddr *) &req->src_addr;
67862306a36Sopenharmony_ci	dst_in = (struct sockaddr *) &req->dst_addr;
67962306a36Sopenharmony_ci
68062306a36Sopenharmony_ci	if (src_addr) {
68162306a36Sopenharmony_ci		if (src_addr->sa_family != dst_addr->sa_family) {
68262306a36Sopenharmony_ci			ret = -EINVAL;
68362306a36Sopenharmony_ci			goto err;
68462306a36Sopenharmony_ci		}
68562306a36Sopenharmony_ci
68662306a36Sopenharmony_ci		memcpy(src_in, src_addr, rdma_addr_size(src_addr));
68762306a36Sopenharmony_ci	} else {
68862306a36Sopenharmony_ci		src_in->sa_family = dst_addr->sa_family;
68962306a36Sopenharmony_ci	}
69062306a36Sopenharmony_ci
69162306a36Sopenharmony_ci	memcpy(dst_in, dst_addr, rdma_addr_size(dst_addr));
69262306a36Sopenharmony_ci	req->addr = addr;
69362306a36Sopenharmony_ci	req->callback = callback;
69462306a36Sopenharmony_ci	req->context = context;
69562306a36Sopenharmony_ci	req->resolve_by_gid_attr = resolve_by_gid_attr;
69662306a36Sopenharmony_ci	INIT_DELAYED_WORK(&req->work, process_one_req);
69762306a36Sopenharmony_ci	req->seq = (u32)atomic_inc_return(&ib_nl_addr_request_seq);
69862306a36Sopenharmony_ci
69962306a36Sopenharmony_ci	req->status = addr_resolve(src_in, dst_in, addr, true,
70062306a36Sopenharmony_ci				   req->resolve_by_gid_attr, req->seq);
70162306a36Sopenharmony_ci	switch (req->status) {
70262306a36Sopenharmony_ci	case 0:
70362306a36Sopenharmony_ci		req->timeout = jiffies;
70462306a36Sopenharmony_ci		queue_req(req);
70562306a36Sopenharmony_ci		break;
70662306a36Sopenharmony_ci	case -ENODATA:
70762306a36Sopenharmony_ci		req->timeout = msecs_to_jiffies(timeout_ms) + jiffies;
70862306a36Sopenharmony_ci		queue_req(req);
70962306a36Sopenharmony_ci		break;
71062306a36Sopenharmony_ci	default:
71162306a36Sopenharmony_ci		ret = req->status;
71262306a36Sopenharmony_ci		goto err;
71362306a36Sopenharmony_ci	}
71462306a36Sopenharmony_ci	return ret;
71562306a36Sopenharmony_cierr:
71662306a36Sopenharmony_ci	kfree(req);
71762306a36Sopenharmony_ci	return ret;
71862306a36Sopenharmony_ci}
71962306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_resolve_ip);
72062306a36Sopenharmony_ci
72162306a36Sopenharmony_ciint roce_resolve_route_from_path(struct sa_path_rec *rec,
72262306a36Sopenharmony_ci				 const struct ib_gid_attr *attr)
72362306a36Sopenharmony_ci{
72462306a36Sopenharmony_ci	union {
72562306a36Sopenharmony_ci		struct sockaddr     _sockaddr;
72662306a36Sopenharmony_ci		struct sockaddr_in  _sockaddr_in;
72762306a36Sopenharmony_ci		struct sockaddr_in6 _sockaddr_in6;
72862306a36Sopenharmony_ci	} sgid, dgid;
72962306a36Sopenharmony_ci	struct rdma_dev_addr dev_addr = {};
73062306a36Sopenharmony_ci	int ret;
73162306a36Sopenharmony_ci
73262306a36Sopenharmony_ci	might_sleep();
73362306a36Sopenharmony_ci
73462306a36Sopenharmony_ci	if (rec->roce.route_resolved)
73562306a36Sopenharmony_ci		return 0;
73662306a36Sopenharmony_ci
73762306a36Sopenharmony_ci	rdma_gid2ip((struct sockaddr *)&sgid, &rec->sgid);
73862306a36Sopenharmony_ci	rdma_gid2ip((struct sockaddr *)&dgid, &rec->dgid);
73962306a36Sopenharmony_ci
74062306a36Sopenharmony_ci	if (sgid._sockaddr.sa_family != dgid._sockaddr.sa_family)
74162306a36Sopenharmony_ci		return -EINVAL;
74262306a36Sopenharmony_ci
74362306a36Sopenharmony_ci	if (!attr || !attr->ndev)
74462306a36Sopenharmony_ci		return -EINVAL;
74562306a36Sopenharmony_ci
74662306a36Sopenharmony_ci	dev_addr.net = &init_net;
74762306a36Sopenharmony_ci	dev_addr.sgid_attr = attr;
74862306a36Sopenharmony_ci
74962306a36Sopenharmony_ci	ret = addr_resolve((struct sockaddr *)&sgid, (struct sockaddr *)&dgid,
75062306a36Sopenharmony_ci			   &dev_addr, false, true, 0);
75162306a36Sopenharmony_ci	if (ret)
75262306a36Sopenharmony_ci		return ret;
75362306a36Sopenharmony_ci
75462306a36Sopenharmony_ci	if ((dev_addr.network == RDMA_NETWORK_IPV4 ||
75562306a36Sopenharmony_ci	     dev_addr.network == RDMA_NETWORK_IPV6) &&
75662306a36Sopenharmony_ci	    rec->rec_type != SA_PATH_REC_TYPE_ROCE_V2)
75762306a36Sopenharmony_ci		return -EINVAL;
75862306a36Sopenharmony_ci
75962306a36Sopenharmony_ci	rec->roce.route_resolved = true;
76062306a36Sopenharmony_ci	return 0;
76162306a36Sopenharmony_ci}
76262306a36Sopenharmony_ci
76362306a36Sopenharmony_ci/**
76462306a36Sopenharmony_ci * rdma_addr_cancel - Cancel resolve ip request
76562306a36Sopenharmony_ci * @addr:	Pointer to address structure given previously
76662306a36Sopenharmony_ci *		during rdma_resolve_ip().
76762306a36Sopenharmony_ci * rdma_addr_cancel() is synchronous function which cancels any pending
76862306a36Sopenharmony_ci * request if there is any.
76962306a36Sopenharmony_ci */
77062306a36Sopenharmony_civoid rdma_addr_cancel(struct rdma_dev_addr *addr)
77162306a36Sopenharmony_ci{
77262306a36Sopenharmony_ci	struct addr_req *req, *temp_req;
77362306a36Sopenharmony_ci	struct addr_req *found = NULL;
77462306a36Sopenharmony_ci
77562306a36Sopenharmony_ci	spin_lock_bh(&lock);
77662306a36Sopenharmony_ci	list_for_each_entry_safe(req, temp_req, &req_list, list) {
77762306a36Sopenharmony_ci		if (req->addr == addr) {
77862306a36Sopenharmony_ci			/*
77962306a36Sopenharmony_ci			 * Removing from the list means we take ownership of
78062306a36Sopenharmony_ci			 * the req
78162306a36Sopenharmony_ci			 */
78262306a36Sopenharmony_ci			list_del_init(&req->list);
78362306a36Sopenharmony_ci			found = req;
78462306a36Sopenharmony_ci			break;
78562306a36Sopenharmony_ci		}
78662306a36Sopenharmony_ci	}
78762306a36Sopenharmony_ci	spin_unlock_bh(&lock);
78862306a36Sopenharmony_ci
78962306a36Sopenharmony_ci	if (!found)
79062306a36Sopenharmony_ci		return;
79162306a36Sopenharmony_ci
79262306a36Sopenharmony_ci	/*
79362306a36Sopenharmony_ci	 * sync canceling the work after removing it from the req_list
79462306a36Sopenharmony_ci	 * guarentees no work is running and none will be started.
79562306a36Sopenharmony_ci	 */
79662306a36Sopenharmony_ci	cancel_delayed_work_sync(&found->work);
79762306a36Sopenharmony_ci	kfree(found);
79862306a36Sopenharmony_ci}
79962306a36Sopenharmony_ciEXPORT_SYMBOL(rdma_addr_cancel);
80062306a36Sopenharmony_ci
80162306a36Sopenharmony_cistruct resolve_cb_context {
80262306a36Sopenharmony_ci	struct completion comp;
80362306a36Sopenharmony_ci	int status;
80462306a36Sopenharmony_ci};
80562306a36Sopenharmony_ci
80662306a36Sopenharmony_cistatic void resolve_cb(int status, struct sockaddr *src_addr,
80762306a36Sopenharmony_ci	     struct rdma_dev_addr *addr, void *context)
80862306a36Sopenharmony_ci{
80962306a36Sopenharmony_ci	((struct resolve_cb_context *)context)->status = status;
81062306a36Sopenharmony_ci	complete(&((struct resolve_cb_context *)context)->comp);
81162306a36Sopenharmony_ci}
81262306a36Sopenharmony_ci
81362306a36Sopenharmony_ciint rdma_addr_find_l2_eth_by_grh(const union ib_gid *sgid,
81462306a36Sopenharmony_ci				 const union ib_gid *dgid,
81562306a36Sopenharmony_ci				 u8 *dmac, const struct ib_gid_attr *sgid_attr,
81662306a36Sopenharmony_ci				 int *hoplimit)
81762306a36Sopenharmony_ci{
81862306a36Sopenharmony_ci	struct rdma_dev_addr dev_addr;
81962306a36Sopenharmony_ci	struct resolve_cb_context ctx;
82062306a36Sopenharmony_ci	union {
82162306a36Sopenharmony_ci		struct sockaddr_in  _sockaddr_in;
82262306a36Sopenharmony_ci		struct sockaddr_in6 _sockaddr_in6;
82362306a36Sopenharmony_ci	} sgid_addr, dgid_addr;
82462306a36Sopenharmony_ci	int ret;
82562306a36Sopenharmony_ci
82662306a36Sopenharmony_ci	rdma_gid2ip((struct sockaddr *)&sgid_addr, sgid);
82762306a36Sopenharmony_ci	rdma_gid2ip((struct sockaddr *)&dgid_addr, dgid);
82862306a36Sopenharmony_ci
82962306a36Sopenharmony_ci	memset(&dev_addr, 0, sizeof(dev_addr));
83062306a36Sopenharmony_ci	dev_addr.net = &init_net;
83162306a36Sopenharmony_ci	dev_addr.sgid_attr = sgid_attr;
83262306a36Sopenharmony_ci
83362306a36Sopenharmony_ci	init_completion(&ctx.comp);
83462306a36Sopenharmony_ci	ret = rdma_resolve_ip((struct sockaddr *)&sgid_addr,
83562306a36Sopenharmony_ci			      (struct sockaddr *)&dgid_addr, &dev_addr, 1000,
83662306a36Sopenharmony_ci			      resolve_cb, true, &ctx);
83762306a36Sopenharmony_ci	if (ret)
83862306a36Sopenharmony_ci		return ret;
83962306a36Sopenharmony_ci
84062306a36Sopenharmony_ci	wait_for_completion(&ctx.comp);
84162306a36Sopenharmony_ci
84262306a36Sopenharmony_ci	ret = ctx.status;
84362306a36Sopenharmony_ci	if (ret)
84462306a36Sopenharmony_ci		return ret;
84562306a36Sopenharmony_ci
84662306a36Sopenharmony_ci	memcpy(dmac, dev_addr.dst_dev_addr, ETH_ALEN);
84762306a36Sopenharmony_ci	*hoplimit = dev_addr.hoplimit;
84862306a36Sopenharmony_ci	return 0;
84962306a36Sopenharmony_ci}
85062306a36Sopenharmony_ci
85162306a36Sopenharmony_cistatic int netevent_callback(struct notifier_block *self, unsigned long event,
85262306a36Sopenharmony_ci	void *ctx)
85362306a36Sopenharmony_ci{
85462306a36Sopenharmony_ci	struct addr_req *req;
85562306a36Sopenharmony_ci
85662306a36Sopenharmony_ci	if (event == NETEVENT_NEIGH_UPDATE) {
85762306a36Sopenharmony_ci		struct neighbour *neigh = ctx;
85862306a36Sopenharmony_ci
85962306a36Sopenharmony_ci		if (neigh->nud_state & NUD_VALID) {
86062306a36Sopenharmony_ci			spin_lock_bh(&lock);
86162306a36Sopenharmony_ci			list_for_each_entry(req, &req_list, list)
86262306a36Sopenharmony_ci				set_timeout(req, jiffies);
86362306a36Sopenharmony_ci			spin_unlock_bh(&lock);
86462306a36Sopenharmony_ci		}
86562306a36Sopenharmony_ci	}
86662306a36Sopenharmony_ci	return 0;
86762306a36Sopenharmony_ci}
86862306a36Sopenharmony_ci
86962306a36Sopenharmony_cistatic struct notifier_block nb = {
87062306a36Sopenharmony_ci	.notifier_call = netevent_callback
87162306a36Sopenharmony_ci};
87262306a36Sopenharmony_ci
87362306a36Sopenharmony_ciint addr_init(void)
87462306a36Sopenharmony_ci{
87562306a36Sopenharmony_ci	addr_wq = alloc_ordered_workqueue("ib_addr", 0);
87662306a36Sopenharmony_ci	if (!addr_wq)
87762306a36Sopenharmony_ci		return -ENOMEM;
87862306a36Sopenharmony_ci
87962306a36Sopenharmony_ci	register_netevent_notifier(&nb);
88062306a36Sopenharmony_ci
88162306a36Sopenharmony_ci	return 0;
88262306a36Sopenharmony_ci}
88362306a36Sopenharmony_ci
88462306a36Sopenharmony_civoid addr_cleanup(void)
88562306a36Sopenharmony_ci{
88662306a36Sopenharmony_ci	unregister_netevent_notifier(&nb);
88762306a36Sopenharmony_ci	destroy_workqueue(addr_wq);
88862306a36Sopenharmony_ci	WARN_ON(!list_empty(&req_list));
88962306a36Sopenharmony_ci}
890