1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /* Server address list management
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * Copyright (C) 2017 Red Hat, Inc. All Rights Reserved.
5*4882a593Smuzhiyun * Written by David Howells (dhowells@redhat.com)
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/slab.h>
9*4882a593Smuzhiyun #include <linux/ctype.h>
10*4882a593Smuzhiyun #include <linux/dns_resolver.h>
11*4882a593Smuzhiyun #include <linux/inet.h>
12*4882a593Smuzhiyun #include <keys/rxrpc-type.h>
13*4882a593Smuzhiyun #include "internal.h"
14*4882a593Smuzhiyun #include "afs_fs.h"
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun /*
17*4882a593Smuzhiyun * Release an address list.
18*4882a593Smuzhiyun */
afs_put_addrlist(struct afs_addr_list * alist)19*4882a593Smuzhiyun void afs_put_addrlist(struct afs_addr_list *alist)
20*4882a593Smuzhiyun {
21*4882a593Smuzhiyun if (alist && refcount_dec_and_test(&alist->usage))
22*4882a593Smuzhiyun kfree_rcu(alist, rcu);
23*4882a593Smuzhiyun }
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun /*
26*4882a593Smuzhiyun * Allocate an address list.
27*4882a593Smuzhiyun */
afs_alloc_addrlist(unsigned int nr,unsigned short service,unsigned short port)28*4882a593Smuzhiyun struct afs_addr_list *afs_alloc_addrlist(unsigned int nr,
29*4882a593Smuzhiyun unsigned short service,
30*4882a593Smuzhiyun unsigned short port)
31*4882a593Smuzhiyun {
32*4882a593Smuzhiyun struct afs_addr_list *alist;
33*4882a593Smuzhiyun unsigned int i;
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun _enter("%u,%u,%u", nr, service, port);
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun if (nr > AFS_MAX_ADDRESSES)
38*4882a593Smuzhiyun nr = AFS_MAX_ADDRESSES;
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun alist = kzalloc(struct_size(alist, addrs, nr), GFP_KERNEL);
41*4882a593Smuzhiyun if (!alist)
42*4882a593Smuzhiyun return NULL;
43*4882a593Smuzhiyun
44*4882a593Smuzhiyun refcount_set(&alist->usage, 1);
45*4882a593Smuzhiyun alist->max_addrs = nr;
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun for (i = 0; i < nr; i++) {
48*4882a593Smuzhiyun struct sockaddr_rxrpc *srx = &alist->addrs[i];
49*4882a593Smuzhiyun srx->srx_family = AF_RXRPC;
50*4882a593Smuzhiyun srx->srx_service = service;
51*4882a593Smuzhiyun srx->transport_type = SOCK_DGRAM;
52*4882a593Smuzhiyun srx->transport_len = sizeof(srx->transport.sin6);
53*4882a593Smuzhiyun srx->transport.sin6.sin6_family = AF_INET6;
54*4882a593Smuzhiyun srx->transport.sin6.sin6_port = htons(port);
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun
57*4882a593Smuzhiyun return alist;
58*4882a593Smuzhiyun }
59*4882a593Smuzhiyun
60*4882a593Smuzhiyun /*
61*4882a593Smuzhiyun * Parse a text string consisting of delimited addresses.
62*4882a593Smuzhiyun */
afs_parse_text_addrs(struct afs_net * net,const char * text,size_t len,char delim,unsigned short service,unsigned short port)63*4882a593Smuzhiyun struct afs_vlserver_list *afs_parse_text_addrs(struct afs_net *net,
64*4882a593Smuzhiyun const char *text, size_t len,
65*4882a593Smuzhiyun char delim,
66*4882a593Smuzhiyun unsigned short service,
67*4882a593Smuzhiyun unsigned short port)
68*4882a593Smuzhiyun {
69*4882a593Smuzhiyun struct afs_vlserver_list *vllist;
70*4882a593Smuzhiyun struct afs_addr_list *alist;
71*4882a593Smuzhiyun const char *p, *end = text + len;
72*4882a593Smuzhiyun const char *problem;
73*4882a593Smuzhiyun unsigned int nr = 0;
74*4882a593Smuzhiyun int ret = -ENOMEM;
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun _enter("%*.*s,%c", (int)len, (int)len, text, delim);
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun if (!len) {
79*4882a593Smuzhiyun _leave(" = -EDESTADDRREQ [empty]");
80*4882a593Smuzhiyun return ERR_PTR(-EDESTADDRREQ);
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun if (delim == ':' && (memchr(text, ',', len) || !memchr(text, '.', len)))
84*4882a593Smuzhiyun delim = ',';
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun /* Count the addresses */
87*4882a593Smuzhiyun p = text;
88*4882a593Smuzhiyun do {
89*4882a593Smuzhiyun if (!*p) {
90*4882a593Smuzhiyun problem = "nul";
91*4882a593Smuzhiyun goto inval;
92*4882a593Smuzhiyun }
93*4882a593Smuzhiyun if (*p == delim)
94*4882a593Smuzhiyun continue;
95*4882a593Smuzhiyun nr++;
96*4882a593Smuzhiyun if (*p == '[') {
97*4882a593Smuzhiyun p++;
98*4882a593Smuzhiyun if (p == end) {
99*4882a593Smuzhiyun problem = "brace1";
100*4882a593Smuzhiyun goto inval;
101*4882a593Smuzhiyun }
102*4882a593Smuzhiyun p = memchr(p, ']', end - p);
103*4882a593Smuzhiyun if (!p) {
104*4882a593Smuzhiyun problem = "brace2";
105*4882a593Smuzhiyun goto inval;
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun p++;
108*4882a593Smuzhiyun if (p >= end)
109*4882a593Smuzhiyun break;
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun p = memchr(p, delim, end - p);
113*4882a593Smuzhiyun if (!p)
114*4882a593Smuzhiyun break;
115*4882a593Smuzhiyun p++;
116*4882a593Smuzhiyun } while (p < end);
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun _debug("%u/%u addresses", nr, AFS_MAX_ADDRESSES);
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun vllist = afs_alloc_vlserver_list(1);
121*4882a593Smuzhiyun if (!vllist)
122*4882a593Smuzhiyun return ERR_PTR(-ENOMEM);
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun vllist->nr_servers = 1;
125*4882a593Smuzhiyun vllist->servers[0].server = afs_alloc_vlserver("<dummy>", 7, AFS_VL_PORT);
126*4882a593Smuzhiyun if (!vllist->servers[0].server)
127*4882a593Smuzhiyun goto error_vl;
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun alist = afs_alloc_addrlist(nr, service, AFS_VL_PORT);
130*4882a593Smuzhiyun if (!alist)
131*4882a593Smuzhiyun goto error;
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun /* Extract the addresses */
134*4882a593Smuzhiyun p = text;
135*4882a593Smuzhiyun do {
136*4882a593Smuzhiyun const char *q, *stop;
137*4882a593Smuzhiyun unsigned int xport = port;
138*4882a593Smuzhiyun __be32 x[4];
139*4882a593Smuzhiyun int family;
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun if (*p == delim) {
142*4882a593Smuzhiyun p++;
143*4882a593Smuzhiyun continue;
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun if (*p == '[') {
147*4882a593Smuzhiyun p++;
148*4882a593Smuzhiyun q = memchr(p, ']', end - p);
149*4882a593Smuzhiyun } else {
150*4882a593Smuzhiyun for (q = p; q < end; q++)
151*4882a593Smuzhiyun if (*q == '+' || *q == delim)
152*4882a593Smuzhiyun break;
153*4882a593Smuzhiyun }
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun if (in4_pton(p, q - p, (u8 *)&x[0], -1, &stop)) {
156*4882a593Smuzhiyun family = AF_INET;
157*4882a593Smuzhiyun } else if (in6_pton(p, q - p, (u8 *)x, -1, &stop)) {
158*4882a593Smuzhiyun family = AF_INET6;
159*4882a593Smuzhiyun } else {
160*4882a593Smuzhiyun problem = "family";
161*4882a593Smuzhiyun goto bad_address;
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun p = q;
165*4882a593Smuzhiyun if (stop != p) {
166*4882a593Smuzhiyun problem = "nostop";
167*4882a593Smuzhiyun goto bad_address;
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun if (q < end && *q == ']')
171*4882a593Smuzhiyun p++;
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun if (p < end) {
174*4882a593Smuzhiyun if (*p == '+') {
175*4882a593Smuzhiyun /* Port number specification "+1234" */
176*4882a593Smuzhiyun xport = 0;
177*4882a593Smuzhiyun p++;
178*4882a593Smuzhiyun if (p >= end || !isdigit(*p)) {
179*4882a593Smuzhiyun problem = "port";
180*4882a593Smuzhiyun goto bad_address;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun do {
183*4882a593Smuzhiyun xport *= 10;
184*4882a593Smuzhiyun xport += *p - '0';
185*4882a593Smuzhiyun if (xport > 65535) {
186*4882a593Smuzhiyun problem = "pval";
187*4882a593Smuzhiyun goto bad_address;
188*4882a593Smuzhiyun }
189*4882a593Smuzhiyun p++;
190*4882a593Smuzhiyun } while (p < end && isdigit(*p));
191*4882a593Smuzhiyun } else if (*p == delim) {
192*4882a593Smuzhiyun p++;
193*4882a593Smuzhiyun } else {
194*4882a593Smuzhiyun problem = "weird";
195*4882a593Smuzhiyun goto bad_address;
196*4882a593Smuzhiyun }
197*4882a593Smuzhiyun }
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun if (family == AF_INET)
200*4882a593Smuzhiyun afs_merge_fs_addr4(alist, x[0], xport);
201*4882a593Smuzhiyun else
202*4882a593Smuzhiyun afs_merge_fs_addr6(alist, x, xport);
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun } while (p < end);
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun rcu_assign_pointer(vllist->servers[0].server->addresses, alist);
207*4882a593Smuzhiyun _leave(" = [nr %u]", alist->nr_addrs);
208*4882a593Smuzhiyun return vllist;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun inval:
211*4882a593Smuzhiyun _leave(" = -EINVAL [%s %zu %*.*s]",
212*4882a593Smuzhiyun problem, p - text, (int)len, (int)len, text);
213*4882a593Smuzhiyun return ERR_PTR(-EINVAL);
214*4882a593Smuzhiyun bad_address:
215*4882a593Smuzhiyun _leave(" = -EINVAL [%s %zu %*.*s]",
216*4882a593Smuzhiyun problem, p - text, (int)len, (int)len, text);
217*4882a593Smuzhiyun ret = -EINVAL;
218*4882a593Smuzhiyun error:
219*4882a593Smuzhiyun afs_put_addrlist(alist);
220*4882a593Smuzhiyun error_vl:
221*4882a593Smuzhiyun afs_put_vlserverlist(net, vllist);
222*4882a593Smuzhiyun return ERR_PTR(ret);
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun /*
226*4882a593Smuzhiyun * Compare old and new address lists to see if there's been any change.
227*4882a593Smuzhiyun * - How to do this in better than O(Nlog(N)) time?
228*4882a593Smuzhiyun * - We don't really want to sort the address list, but would rather take the
229*4882a593Smuzhiyun * list as we got it so as not to undo record rotation by the DNS server.
230*4882a593Smuzhiyun */
/* NOTE(review): unimplemented placeholder - the #if 0 guard compiles it out and the body is empty. */
231*4882a593Smuzhiyun #if 0
232*4882a593Smuzhiyun static int afs_cmp_addr_list(const struct afs_addr_list *a1,
233*4882a593Smuzhiyun const struct afs_addr_list *a2)
234*4882a593Smuzhiyun {
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun #endif
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun /*
239*4882a593Smuzhiyun * Perform a DNS query for VL servers and build a up an address list.
240*4882a593Smuzhiyun */
afs_dns_query(struct afs_cell * cell,time64_t * _expiry)241*4882a593Smuzhiyun struct afs_vlserver_list *afs_dns_query(struct afs_cell *cell, time64_t *_expiry)
242*4882a593Smuzhiyun {
243*4882a593Smuzhiyun struct afs_vlserver_list *vllist;
244*4882a593Smuzhiyun char *result = NULL;
245*4882a593Smuzhiyun int ret;
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun _enter("%s", cell->name);
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun ret = dns_query(cell->net->net, "afsdb", cell->name, cell->name_len,
250*4882a593Smuzhiyun "srv=1", &result, _expiry, true);
251*4882a593Smuzhiyun if (ret < 0) {
252*4882a593Smuzhiyun _leave(" = %d [dns]", ret);
253*4882a593Smuzhiyun return ERR_PTR(ret);
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun
256*4882a593Smuzhiyun if (*_expiry == 0)
257*4882a593Smuzhiyun *_expiry = ktime_get_real_seconds() + 60;
258*4882a593Smuzhiyun
259*4882a593Smuzhiyun if (ret > 1 && result[0] == 0)
260*4882a593Smuzhiyun vllist = afs_extract_vlserver_list(cell, result, ret);
261*4882a593Smuzhiyun else
262*4882a593Smuzhiyun vllist = afs_parse_text_addrs(cell->net, result, ret, ',',
263*4882a593Smuzhiyun VL_SERVICE, AFS_VL_PORT);
264*4882a593Smuzhiyun kfree(result);
265*4882a593Smuzhiyun if (IS_ERR(vllist) && vllist != ERR_PTR(-ENOMEM))
266*4882a593Smuzhiyun pr_err("Failed to parse DNS data %ld\n", PTR_ERR(vllist));
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun return vllist;
269*4882a593Smuzhiyun }
270*4882a593Smuzhiyun
271*4882a593Smuzhiyun /*
272*4882a593Smuzhiyun * Merge an IPv4 entry into a fileserver address list.
273*4882a593Smuzhiyun */
afs_merge_fs_addr4(struct afs_addr_list * alist,__be32 xdr,u16 port)274*4882a593Smuzhiyun void afs_merge_fs_addr4(struct afs_addr_list *alist, __be32 xdr, u16 port)
275*4882a593Smuzhiyun {
276*4882a593Smuzhiyun struct sockaddr_rxrpc *srx;
277*4882a593Smuzhiyun u32 addr = ntohl(xdr);
278*4882a593Smuzhiyun int i;
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun if (alist->nr_addrs >= alist->max_addrs)
281*4882a593Smuzhiyun return;
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun for (i = 0; i < alist->nr_ipv4; i++) {
284*4882a593Smuzhiyun struct sockaddr_in *a = &alist->addrs[i].transport.sin;
285*4882a593Smuzhiyun u32 a_addr = ntohl(a->sin_addr.s_addr);
286*4882a593Smuzhiyun u16 a_port = ntohs(a->sin_port);
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun if (addr == a_addr && port == a_port)
289*4882a593Smuzhiyun return;
290*4882a593Smuzhiyun if (addr == a_addr && port < a_port)
291*4882a593Smuzhiyun break;
292*4882a593Smuzhiyun if (addr < a_addr)
293*4882a593Smuzhiyun break;
294*4882a593Smuzhiyun }
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun if (i < alist->nr_addrs)
297*4882a593Smuzhiyun memmove(alist->addrs + i + 1,
298*4882a593Smuzhiyun alist->addrs + i,
299*4882a593Smuzhiyun sizeof(alist->addrs[0]) * (alist->nr_addrs - i));
300*4882a593Smuzhiyun
301*4882a593Smuzhiyun srx = &alist->addrs[i];
302*4882a593Smuzhiyun srx->srx_family = AF_RXRPC;
303*4882a593Smuzhiyun srx->transport_type = SOCK_DGRAM;
304*4882a593Smuzhiyun srx->transport_len = sizeof(srx->transport.sin);
305*4882a593Smuzhiyun srx->transport.sin.sin_family = AF_INET;
306*4882a593Smuzhiyun srx->transport.sin.sin_port = htons(port);
307*4882a593Smuzhiyun srx->transport.sin.sin_addr.s_addr = xdr;
308*4882a593Smuzhiyun alist->nr_ipv4++;
309*4882a593Smuzhiyun alist->nr_addrs++;
310*4882a593Smuzhiyun }
311*4882a593Smuzhiyun
312*4882a593Smuzhiyun /*
313*4882a593Smuzhiyun * Merge an IPv6 entry into a fileserver address list.
314*4882a593Smuzhiyun */
afs_merge_fs_addr6(struct afs_addr_list * alist,__be32 * xdr,u16 port)315*4882a593Smuzhiyun void afs_merge_fs_addr6(struct afs_addr_list *alist, __be32 *xdr, u16 port)
316*4882a593Smuzhiyun {
317*4882a593Smuzhiyun struct sockaddr_rxrpc *srx;
318*4882a593Smuzhiyun int i, diff;
319*4882a593Smuzhiyun
320*4882a593Smuzhiyun if (alist->nr_addrs >= alist->max_addrs)
321*4882a593Smuzhiyun return;
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun for (i = alist->nr_ipv4; i < alist->nr_addrs; i++) {
324*4882a593Smuzhiyun struct sockaddr_in6 *a = &alist->addrs[i].transport.sin6;
325*4882a593Smuzhiyun u16 a_port = ntohs(a->sin6_port);
326*4882a593Smuzhiyun
327*4882a593Smuzhiyun diff = memcmp(xdr, &a->sin6_addr, 16);
328*4882a593Smuzhiyun if (diff == 0 && port == a_port)
329*4882a593Smuzhiyun return;
330*4882a593Smuzhiyun if (diff == 0 && port < a_port)
331*4882a593Smuzhiyun break;
332*4882a593Smuzhiyun if (diff < 0)
333*4882a593Smuzhiyun break;
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun
336*4882a593Smuzhiyun if (i < alist->nr_addrs)
337*4882a593Smuzhiyun memmove(alist->addrs + i + 1,
338*4882a593Smuzhiyun alist->addrs + i,
339*4882a593Smuzhiyun sizeof(alist->addrs[0]) * (alist->nr_addrs - i));
340*4882a593Smuzhiyun
341*4882a593Smuzhiyun srx = &alist->addrs[i];
342*4882a593Smuzhiyun srx->srx_family = AF_RXRPC;
343*4882a593Smuzhiyun srx->transport_type = SOCK_DGRAM;
344*4882a593Smuzhiyun srx->transport_len = sizeof(srx->transport.sin6);
345*4882a593Smuzhiyun srx->transport.sin6.sin6_family = AF_INET6;
346*4882a593Smuzhiyun srx->transport.sin6.sin6_port = htons(port);
347*4882a593Smuzhiyun memcpy(&srx->transport.sin6.sin6_addr, xdr, 16);
348*4882a593Smuzhiyun alist->nr_addrs++;
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun /*
352*4882a593Smuzhiyun * Get an address to try.
353*4882a593Smuzhiyun */
afs_iterate_addresses(struct afs_addr_cursor * ac)354*4882a593Smuzhiyun bool afs_iterate_addresses(struct afs_addr_cursor *ac)
355*4882a593Smuzhiyun {
356*4882a593Smuzhiyun unsigned long set, failed;
357*4882a593Smuzhiyun int index;
358*4882a593Smuzhiyun
359*4882a593Smuzhiyun if (!ac->alist)
360*4882a593Smuzhiyun return false;
361*4882a593Smuzhiyun
362*4882a593Smuzhiyun set = ac->alist->responded;
363*4882a593Smuzhiyun failed = ac->alist->failed;
364*4882a593Smuzhiyun _enter("%lx-%lx-%lx,%d", set, failed, ac->tried, ac->index);
365*4882a593Smuzhiyun
366*4882a593Smuzhiyun ac->nr_iterations++;
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun set &= ~(failed | ac->tried);
369*4882a593Smuzhiyun
370*4882a593Smuzhiyun if (!set)
371*4882a593Smuzhiyun return false;
372*4882a593Smuzhiyun
373*4882a593Smuzhiyun index = READ_ONCE(ac->alist->preferred);
374*4882a593Smuzhiyun if (test_bit(index, &set))
375*4882a593Smuzhiyun goto selected;
376*4882a593Smuzhiyun
377*4882a593Smuzhiyun index = __ffs(set);
378*4882a593Smuzhiyun
379*4882a593Smuzhiyun selected:
380*4882a593Smuzhiyun ac->index = index;
381*4882a593Smuzhiyun set_bit(index, &ac->tried);
382*4882a593Smuzhiyun ac->responded = false;
383*4882a593Smuzhiyun return true;
384*4882a593Smuzhiyun }
385*4882a593Smuzhiyun
386*4882a593Smuzhiyun /*
387*4882a593Smuzhiyun * Release an address list cursor.
388*4882a593Smuzhiyun */
afs_end_cursor(struct afs_addr_cursor * ac)389*4882a593Smuzhiyun int afs_end_cursor(struct afs_addr_cursor *ac)
390*4882a593Smuzhiyun {
391*4882a593Smuzhiyun struct afs_addr_list *alist;
392*4882a593Smuzhiyun
393*4882a593Smuzhiyun alist = ac->alist;
394*4882a593Smuzhiyun if (alist) {
395*4882a593Smuzhiyun if (ac->responded &&
396*4882a593Smuzhiyun ac->index != alist->preferred &&
397*4882a593Smuzhiyun test_bit(ac->alist->preferred, &ac->tried))
398*4882a593Smuzhiyun WRITE_ONCE(alist->preferred, ac->index);
399*4882a593Smuzhiyun afs_put_addrlist(alist);
400*4882a593Smuzhiyun ac->alist = NULL;
401*4882a593Smuzhiyun }
402*4882a593Smuzhiyun
403*4882a593Smuzhiyun return ac->error;
404*4882a593Smuzhiyun }
405