162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* AFS vlserver list management. 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * Copyright (C) 2018 Red Hat, Inc. All Rights Reserved. 562306a36Sopenharmony_ci * Written by David Howells (dhowells@redhat.com) 662306a36Sopenharmony_ci */ 762306a36Sopenharmony_ci 862306a36Sopenharmony_ci#include <linux/kernel.h> 962306a36Sopenharmony_ci#include <linux/slab.h> 1062306a36Sopenharmony_ci#include "internal.h" 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_cistruct afs_vlserver *afs_alloc_vlserver(const char *name, size_t name_len, 1362306a36Sopenharmony_ci unsigned short port) 1462306a36Sopenharmony_ci{ 1562306a36Sopenharmony_ci struct afs_vlserver *vlserver; 1662306a36Sopenharmony_ci 1762306a36Sopenharmony_ci vlserver = kzalloc(struct_size(vlserver, name, name_len + 1), 1862306a36Sopenharmony_ci GFP_KERNEL); 1962306a36Sopenharmony_ci if (vlserver) { 2062306a36Sopenharmony_ci refcount_set(&vlserver->ref, 1); 2162306a36Sopenharmony_ci rwlock_init(&vlserver->lock); 2262306a36Sopenharmony_ci init_waitqueue_head(&vlserver->probe_wq); 2362306a36Sopenharmony_ci spin_lock_init(&vlserver->probe_lock); 2462306a36Sopenharmony_ci vlserver->rtt = UINT_MAX; 2562306a36Sopenharmony_ci vlserver->name_len = name_len; 2662306a36Sopenharmony_ci vlserver->port = port; 2762306a36Sopenharmony_ci memcpy(vlserver->name, name, name_len); 2862306a36Sopenharmony_ci } 2962306a36Sopenharmony_ci return vlserver; 3062306a36Sopenharmony_ci} 3162306a36Sopenharmony_ci 3262306a36Sopenharmony_cistatic void afs_vlserver_rcu(struct rcu_head *rcu) 3362306a36Sopenharmony_ci{ 3462306a36Sopenharmony_ci struct afs_vlserver *vlserver = container_of(rcu, struct afs_vlserver, rcu); 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ci afs_put_addrlist(rcu_access_pointer(vlserver->addresses)); 3762306a36Sopenharmony_ci kfree_rcu(vlserver, rcu); 3862306a36Sopenharmony_ci} 3962306a36Sopenharmony_ci 4062306a36Sopenharmony_civoid afs_put_vlserver(struct afs_net *net, struct afs_vlserver *vlserver) 4162306a36Sopenharmony_ci{ 4262306a36Sopenharmony_ci if (vlserver && 4362306a36Sopenharmony_ci refcount_dec_and_test(&vlserver->ref)) 4462306a36Sopenharmony_ci call_rcu(&vlserver->rcu, afs_vlserver_rcu); 4562306a36Sopenharmony_ci} 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_cistruct afs_vlserver_list *afs_alloc_vlserver_list(unsigned int nr_servers) 4862306a36Sopenharmony_ci{ 4962306a36Sopenharmony_ci struct afs_vlserver_list *vllist; 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_ci vllist = kzalloc(struct_size(vllist, servers, nr_servers), GFP_KERNEL); 5262306a36Sopenharmony_ci if (vllist) { 5362306a36Sopenharmony_ci refcount_set(&vllist->ref, 1); 5462306a36Sopenharmony_ci rwlock_init(&vllist->lock); 5562306a36Sopenharmony_ci } 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci return vllist; 5862306a36Sopenharmony_ci} 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_civoid afs_put_vlserverlist(struct afs_net *net, struct afs_vlserver_list *vllist) 6162306a36Sopenharmony_ci{ 6262306a36Sopenharmony_ci if (vllist) { 6362306a36Sopenharmony_ci if (refcount_dec_and_test(&vllist->ref)) { 6462306a36Sopenharmony_ci int i; 6562306a36Sopenharmony_ci 6662306a36Sopenharmony_ci for (i = 0; i < vllist->nr_servers; i++) { 6762306a36Sopenharmony_ci afs_put_vlserver(net, vllist->servers[i].server); 6862306a36Sopenharmony_ci } 6962306a36Sopenharmony_ci kfree_rcu(vllist, rcu); 7062306a36Sopenharmony_ci } 7162306a36Sopenharmony_ci } 7262306a36Sopenharmony_ci} 7362306a36Sopenharmony_ci 7462306a36Sopenharmony_cistatic u16 afs_extract_le16(const u8 **_b) 7562306a36Sopenharmony_ci{ 7662306a36Sopenharmony_ci u16 val; 7762306a36Sopenharmony_ci 7862306a36Sopenharmony_ci val = (u16)*(*_b)++ << 0; 7962306a36Sopenharmony_ci val |= (u16)*(*_b)++ << 8; 8062306a36Sopenharmony_ci return val; 8162306a36Sopenharmony_ci} 8262306a36Sopenharmony_ci 8362306a36Sopenharmony_ci/* 8462306a36Sopenharmony_ci * Build a VL server address list from a DNS queried server list. 8562306a36Sopenharmony_ci */ 8662306a36Sopenharmony_cistatic struct afs_addr_list *afs_extract_vl_addrs(const u8 **_b, const u8 *end, 8762306a36Sopenharmony_ci u8 nr_addrs, u16 port) 8862306a36Sopenharmony_ci{ 8962306a36Sopenharmony_ci struct afs_addr_list *alist; 9062306a36Sopenharmony_ci const u8 *b = *_b; 9162306a36Sopenharmony_ci int ret = -EINVAL; 9262306a36Sopenharmony_ci 9362306a36Sopenharmony_ci alist = afs_alloc_addrlist(nr_addrs, VL_SERVICE, port); 9462306a36Sopenharmony_ci if (!alist) 9562306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 9662306a36Sopenharmony_ci if (nr_addrs == 0) 9762306a36Sopenharmony_ci return alist; 9862306a36Sopenharmony_ci 9962306a36Sopenharmony_ci for (; nr_addrs > 0 && end - b >= nr_addrs; nr_addrs--) { 10062306a36Sopenharmony_ci struct dns_server_list_v1_address hdr; 10162306a36Sopenharmony_ci __be32 x[4]; 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_ci hdr.address_type = *b++; 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_ci switch (hdr.address_type) { 10662306a36Sopenharmony_ci case DNS_ADDRESS_IS_IPV4: 10762306a36Sopenharmony_ci if (end - b < 4) { 10862306a36Sopenharmony_ci _leave(" = -EINVAL [short inet]"); 10962306a36Sopenharmony_ci goto error; 11062306a36Sopenharmony_ci } 11162306a36Sopenharmony_ci memcpy(x, b, 4); 11262306a36Sopenharmony_ci afs_merge_fs_addr4(alist, x[0], port); 11362306a36Sopenharmony_ci b += 4; 11462306a36Sopenharmony_ci break; 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_ci case DNS_ADDRESS_IS_IPV6: 11762306a36Sopenharmony_ci if (end - b < 16) { 11862306a36Sopenharmony_ci _leave(" = -EINVAL [short inet6]"); 11962306a36Sopenharmony_ci goto error; 12062306a36Sopenharmony_ci } 12162306a36Sopenharmony_ci memcpy(x, b, 16); 12262306a36Sopenharmony_ci afs_merge_fs_addr6(alist, x, port); 12362306a36Sopenharmony_ci b += 16; 12462306a36Sopenharmony_ci break; 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci default: 12762306a36Sopenharmony_ci _leave(" = -EADDRNOTAVAIL [unknown af %u]", 12862306a36Sopenharmony_ci hdr.address_type); 12962306a36Sopenharmony_ci ret = -EADDRNOTAVAIL; 13062306a36Sopenharmony_ci goto error; 13162306a36Sopenharmony_ci } 13262306a36Sopenharmony_ci } 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_ci /* Start with IPv6 if available. */ 13562306a36Sopenharmony_ci if (alist->nr_ipv4 < alist->nr_addrs) 13662306a36Sopenharmony_ci alist->preferred = alist->nr_ipv4; 13762306a36Sopenharmony_ci 13862306a36Sopenharmony_ci *_b = b; 13962306a36Sopenharmony_ci return alist; 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_cierror: 14262306a36Sopenharmony_ci *_b = b; 14362306a36Sopenharmony_ci afs_put_addrlist(alist); 14462306a36Sopenharmony_ci return ERR_PTR(ret); 14562306a36Sopenharmony_ci} 14662306a36Sopenharmony_ci 14762306a36Sopenharmony_ci/* 14862306a36Sopenharmony_ci * Build a VL server list from a DNS queried server list. 14962306a36Sopenharmony_ci */ 15062306a36Sopenharmony_cistruct afs_vlserver_list *afs_extract_vlserver_list(struct afs_cell *cell, 15162306a36Sopenharmony_ci const void *buffer, 15262306a36Sopenharmony_ci size_t buffer_size) 15362306a36Sopenharmony_ci{ 15462306a36Sopenharmony_ci const struct dns_server_list_v1_header *hdr = buffer; 15562306a36Sopenharmony_ci struct dns_server_list_v1_server bs; 15662306a36Sopenharmony_ci struct afs_vlserver_list *vllist, *previous; 15762306a36Sopenharmony_ci struct afs_addr_list *addrs; 15862306a36Sopenharmony_ci struct afs_vlserver *server; 15962306a36Sopenharmony_ci const u8 *b = buffer, *end = buffer + buffer_size; 16062306a36Sopenharmony_ci int ret = -ENOMEM, nr_servers, i, j; 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci _enter(""); 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_ci /* Check that it's a server list, v1 */ 16562306a36Sopenharmony_ci if (end - b < sizeof(*hdr) || 16662306a36Sopenharmony_ci hdr->hdr.content != DNS_PAYLOAD_IS_SERVER_LIST || 16762306a36Sopenharmony_ci hdr->hdr.version != 1) { 16862306a36Sopenharmony_ci pr_notice("kAFS: Got DNS record [%u,%u] len %zu\n", 16962306a36Sopenharmony_ci hdr->hdr.content, hdr->hdr.version, end - b); 17062306a36Sopenharmony_ci ret = -EDESTADDRREQ; 17162306a36Sopenharmony_ci goto dump; 17262306a36Sopenharmony_ci } 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_ci nr_servers = hdr->nr_servers; 17562306a36Sopenharmony_ci 17662306a36Sopenharmony_ci vllist = afs_alloc_vlserver_list(nr_servers); 17762306a36Sopenharmony_ci if (!vllist) 17862306a36Sopenharmony_ci return ERR_PTR(-ENOMEM); 17962306a36Sopenharmony_ci 18062306a36Sopenharmony_ci vllist->source = (hdr->source < NR__dns_record_source) ? 18162306a36Sopenharmony_ci hdr->source : NR__dns_record_source; 18262306a36Sopenharmony_ci vllist->status = (hdr->status < NR__dns_lookup_status) ? 18362306a36Sopenharmony_ci hdr->status : NR__dns_lookup_status; 18462306a36Sopenharmony_ci 18562306a36Sopenharmony_ci read_lock(&cell->vl_servers_lock); 18662306a36Sopenharmony_ci previous = afs_get_vlserverlist( 18762306a36Sopenharmony_ci rcu_dereference_protected(cell->vl_servers, 18862306a36Sopenharmony_ci lockdep_is_held(&cell->vl_servers_lock))); 18962306a36Sopenharmony_ci read_unlock(&cell->vl_servers_lock); 19062306a36Sopenharmony_ci 19162306a36Sopenharmony_ci b += sizeof(*hdr); 19262306a36Sopenharmony_ci while (end - b >= sizeof(bs)) { 19362306a36Sopenharmony_ci bs.name_len = afs_extract_le16(&b); 19462306a36Sopenharmony_ci bs.priority = afs_extract_le16(&b); 19562306a36Sopenharmony_ci bs.weight = afs_extract_le16(&b); 19662306a36Sopenharmony_ci bs.port = afs_extract_le16(&b); 19762306a36Sopenharmony_ci bs.source = *b++; 19862306a36Sopenharmony_ci bs.status = *b++; 19962306a36Sopenharmony_ci bs.protocol = *b++; 20062306a36Sopenharmony_ci bs.nr_addrs = *b++; 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ci _debug("extract %u %u %u %u %u %u %*.*s", 20362306a36Sopenharmony_ci bs.name_len, bs.priority, bs.weight, 20462306a36Sopenharmony_ci bs.port, bs.protocol, bs.nr_addrs, 20562306a36Sopenharmony_ci bs.name_len, bs.name_len, b); 20662306a36Sopenharmony_ci 20762306a36Sopenharmony_ci if (end - b < bs.name_len) 20862306a36Sopenharmony_ci break; 20962306a36Sopenharmony_ci 21062306a36Sopenharmony_ci ret = -EPROTONOSUPPORT; 21162306a36Sopenharmony_ci if (bs.protocol == DNS_SERVER_PROTOCOL_UNSPECIFIED) { 21262306a36Sopenharmony_ci bs.protocol = DNS_SERVER_PROTOCOL_UDP; 21362306a36Sopenharmony_ci } else if (bs.protocol != DNS_SERVER_PROTOCOL_UDP) { 21462306a36Sopenharmony_ci _leave(" = [proto %u]", bs.protocol); 21562306a36Sopenharmony_ci goto error; 21662306a36Sopenharmony_ci } 21762306a36Sopenharmony_ci 21862306a36Sopenharmony_ci if (bs.port == 0) 21962306a36Sopenharmony_ci bs.port = AFS_VL_PORT; 22062306a36Sopenharmony_ci if (bs.source > NR__dns_record_source) 22162306a36Sopenharmony_ci bs.source = NR__dns_record_source; 22262306a36Sopenharmony_ci if (bs.status > NR__dns_lookup_status) 22362306a36Sopenharmony_ci bs.status = NR__dns_lookup_status; 22462306a36Sopenharmony_ci 22562306a36Sopenharmony_ci /* See if we can update an old server record */ 22662306a36Sopenharmony_ci server = NULL; 22762306a36Sopenharmony_ci for (i = 0; i < previous->nr_servers; i++) { 22862306a36Sopenharmony_ci struct afs_vlserver *p = previous->servers[i].server; 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci if (p->name_len == bs.name_len && 23162306a36Sopenharmony_ci p->port == bs.port && 23262306a36Sopenharmony_ci strncasecmp(b, p->name, bs.name_len) == 0) { 23362306a36Sopenharmony_ci server = afs_get_vlserver(p); 23462306a36Sopenharmony_ci break; 23562306a36Sopenharmony_ci } 23662306a36Sopenharmony_ci } 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_ci if (!server) { 23962306a36Sopenharmony_ci ret = -ENOMEM; 24062306a36Sopenharmony_ci server = afs_alloc_vlserver(b, bs.name_len, bs.port); 24162306a36Sopenharmony_ci if (!server) 24262306a36Sopenharmony_ci goto error; 24362306a36Sopenharmony_ci } 24462306a36Sopenharmony_ci 24562306a36Sopenharmony_ci b += bs.name_len; 24662306a36Sopenharmony_ci 24762306a36Sopenharmony_ci /* Extract the addresses - note that we can't skip this as we 24862306a36Sopenharmony_ci * have to advance the payload pointer. 24962306a36Sopenharmony_ci */ 25062306a36Sopenharmony_ci addrs = afs_extract_vl_addrs(&b, end, bs.nr_addrs, bs.port); 25162306a36Sopenharmony_ci if (IS_ERR(addrs)) { 25262306a36Sopenharmony_ci ret = PTR_ERR(addrs); 25362306a36Sopenharmony_ci goto error_2; 25462306a36Sopenharmony_ci } 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci if (vllist->nr_servers >= nr_servers) { 25762306a36Sopenharmony_ci _debug("skip %u >= %u", vllist->nr_servers, nr_servers); 25862306a36Sopenharmony_ci afs_put_addrlist(addrs); 25962306a36Sopenharmony_ci afs_put_vlserver(cell->net, server); 26062306a36Sopenharmony_ci continue; 26162306a36Sopenharmony_ci } 26262306a36Sopenharmony_ci 26362306a36Sopenharmony_ci addrs->source = bs.source; 26462306a36Sopenharmony_ci addrs->status = bs.status; 26562306a36Sopenharmony_ci 26662306a36Sopenharmony_ci if (addrs->nr_addrs == 0) { 26762306a36Sopenharmony_ci afs_put_addrlist(addrs); 26862306a36Sopenharmony_ci if (!rcu_access_pointer(server->addresses)) { 26962306a36Sopenharmony_ci afs_put_vlserver(cell->net, server); 27062306a36Sopenharmony_ci continue; 27162306a36Sopenharmony_ci } 27262306a36Sopenharmony_ci } else { 27362306a36Sopenharmony_ci struct afs_addr_list *old = addrs; 27462306a36Sopenharmony_ci 27562306a36Sopenharmony_ci write_lock(&server->lock); 27662306a36Sopenharmony_ci old = rcu_replace_pointer(server->addresses, old, 27762306a36Sopenharmony_ci lockdep_is_held(&server->lock)); 27862306a36Sopenharmony_ci write_unlock(&server->lock); 27962306a36Sopenharmony_ci afs_put_addrlist(old); 28062306a36Sopenharmony_ci } 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_ci 28362306a36Sopenharmony_ci /* TODO: Might want to check for duplicates */ 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci /* Insertion-sort by priority and weight */ 28662306a36Sopenharmony_ci for (j = 0; j < vllist->nr_servers; j++) { 28762306a36Sopenharmony_ci if (bs.priority < vllist->servers[j].priority) 28862306a36Sopenharmony_ci break; /* Lower preferable */ 28962306a36Sopenharmony_ci if (bs.priority == vllist->servers[j].priority && 29062306a36Sopenharmony_ci bs.weight > vllist->servers[j].weight) 29162306a36Sopenharmony_ci break; /* Higher preferable */ 29262306a36Sopenharmony_ci } 29362306a36Sopenharmony_ci 29462306a36Sopenharmony_ci if (j < vllist->nr_servers) { 29562306a36Sopenharmony_ci memmove(vllist->servers + j + 1, 29662306a36Sopenharmony_ci vllist->servers + j, 29762306a36Sopenharmony_ci (vllist->nr_servers - j) * sizeof(struct afs_vlserver_entry)); 29862306a36Sopenharmony_ci } 29962306a36Sopenharmony_ci 30062306a36Sopenharmony_ci clear_bit(AFS_VLSERVER_FL_PROBED, &server->flags); 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_ci vllist->servers[j].priority = bs.priority; 30362306a36Sopenharmony_ci vllist->servers[j].weight = bs.weight; 30462306a36Sopenharmony_ci vllist->servers[j].server = server; 30562306a36Sopenharmony_ci vllist->nr_servers++; 30662306a36Sopenharmony_ci } 30762306a36Sopenharmony_ci 30862306a36Sopenharmony_ci if (b != end) { 30962306a36Sopenharmony_ci _debug("parse error %zd", b - end); 31062306a36Sopenharmony_ci goto error; 31162306a36Sopenharmony_ci } 31262306a36Sopenharmony_ci 31362306a36Sopenharmony_ci afs_put_vlserverlist(cell->net, previous); 31462306a36Sopenharmony_ci _leave(" = ok [%u]", vllist->nr_servers); 31562306a36Sopenharmony_ci return vllist; 31662306a36Sopenharmony_ci 31762306a36Sopenharmony_cierror_2: 31862306a36Sopenharmony_ci afs_put_vlserver(cell->net, server); 31962306a36Sopenharmony_cierror: 32062306a36Sopenharmony_ci afs_put_vlserverlist(cell->net, vllist); 32162306a36Sopenharmony_ci afs_put_vlserverlist(cell->net, previous); 32262306a36Sopenharmony_cidump: 32362306a36Sopenharmony_ci if (ret != -ENOMEM) { 32462306a36Sopenharmony_ci printk(KERN_DEBUG "DNS: at %zu\n", (const void *)b - buffer); 32562306a36Sopenharmony_ci print_hex_dump_bytes("DNS: ", DUMP_PREFIX_NONE, buffer, buffer_size); 32662306a36Sopenharmony_ci } 32762306a36Sopenharmony_ci return ERR_PTR(ret); 32862306a36Sopenharmony_ci} 329