1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun #include <linux/errno.h>
3*4882a593Smuzhiyun #include <linux/ip.h>
4*4882a593Smuzhiyun #include <linux/kernel.h>
5*4882a593Smuzhiyun #include <linux/module.h>
6*4882a593Smuzhiyun #include <linux/skbuff.h>
7*4882a593Smuzhiyun #include <linux/socket.h>
8*4882a593Smuzhiyun #include <linux/types.h>
9*4882a593Smuzhiyun #include <net/checksum.h>
10*4882a593Smuzhiyun #include <net/dst_cache.h>
11*4882a593Smuzhiyun #include <net/ip.h>
12*4882a593Smuzhiyun #include <net/ip6_fib.h>
13*4882a593Smuzhiyun #include <net/ip6_route.h>
14*4882a593Smuzhiyun #include <net/lwtunnel.h>
15*4882a593Smuzhiyun #include <net/protocol.h>
16*4882a593Smuzhiyun #include <uapi/linux/ila.h>
17*4882a593Smuzhiyun #include "ila.h"
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun struct ila_lwt {
20*4882a593Smuzhiyun struct ila_params p;
21*4882a593Smuzhiyun struct dst_cache dst_cache;
22*4882a593Smuzhiyun u32 connected : 1;
23*4882a593Smuzhiyun u32 lwt_output : 1;
24*4882a593Smuzhiyun };
25*4882a593Smuzhiyun
ila_lwt_lwtunnel(struct lwtunnel_state * lwt)26*4882a593Smuzhiyun static inline struct ila_lwt *ila_lwt_lwtunnel(
27*4882a593Smuzhiyun struct lwtunnel_state *lwt)
28*4882a593Smuzhiyun {
29*4882a593Smuzhiyun return (struct ila_lwt *)lwt->data;
30*4882a593Smuzhiyun }
31*4882a593Smuzhiyun
ila_params_lwtunnel(struct lwtunnel_state * lwt)32*4882a593Smuzhiyun static inline struct ila_params *ila_params_lwtunnel(
33*4882a593Smuzhiyun struct lwtunnel_state *lwt)
34*4882a593Smuzhiyun {
35*4882a593Smuzhiyun return &ila_lwt_lwtunnel(lwt)->p;
36*4882a593Smuzhiyun }
37*4882a593Smuzhiyun
ila_output(struct net * net,struct sock * sk,struct sk_buff * skb)38*4882a593Smuzhiyun static int ila_output(struct net *net, struct sock *sk, struct sk_buff *skb)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun struct dst_entry *orig_dst = skb_dst(skb);
41*4882a593Smuzhiyun struct rt6_info *rt = (struct rt6_info *)orig_dst;
42*4882a593Smuzhiyun struct ila_lwt *ilwt = ila_lwt_lwtunnel(orig_dst->lwtstate);
43*4882a593Smuzhiyun struct dst_entry *dst;
44*4882a593Smuzhiyun int err = -EINVAL;
45*4882a593Smuzhiyun
46*4882a593Smuzhiyun if (skb->protocol != htons(ETH_P_IPV6))
47*4882a593Smuzhiyun goto drop;
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun if (ilwt->lwt_output)
50*4882a593Smuzhiyun ila_update_ipv6_locator(skb,
51*4882a593Smuzhiyun ila_params_lwtunnel(orig_dst->lwtstate),
52*4882a593Smuzhiyun true);
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun if (rt->rt6i_flags & (RTF_GATEWAY | RTF_CACHE)) {
55*4882a593Smuzhiyun /* Already have a next hop address in route, no need for
56*4882a593Smuzhiyun * dest cache route.
57*4882a593Smuzhiyun */
58*4882a593Smuzhiyun return orig_dst->lwtstate->orig_output(net, sk, skb);
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun dst = dst_cache_get(&ilwt->dst_cache);
62*4882a593Smuzhiyun if (unlikely(!dst)) {
63*4882a593Smuzhiyun struct ipv6hdr *ip6h = ipv6_hdr(skb);
64*4882a593Smuzhiyun struct flowi6 fl6;
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun /* Lookup a route for the new destination. Take into
67*4882a593Smuzhiyun * account that the base route may already have a gateway.
68*4882a593Smuzhiyun */
69*4882a593Smuzhiyun
70*4882a593Smuzhiyun memset(&fl6, 0, sizeof(fl6));
71*4882a593Smuzhiyun fl6.flowi6_oif = orig_dst->dev->ifindex;
72*4882a593Smuzhiyun fl6.flowi6_iif = LOOPBACK_IFINDEX;
73*4882a593Smuzhiyun fl6.daddr = *rt6_nexthop((struct rt6_info *)orig_dst,
74*4882a593Smuzhiyun &ip6h->daddr);
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun dst = ip6_route_output(net, NULL, &fl6);
77*4882a593Smuzhiyun if (dst->error) {
78*4882a593Smuzhiyun err = -EHOSTUNREACH;
79*4882a593Smuzhiyun dst_release(dst);
80*4882a593Smuzhiyun goto drop;
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun dst = xfrm_lookup(net, dst, flowi6_to_flowi(&fl6), NULL, 0);
84*4882a593Smuzhiyun if (IS_ERR(dst)) {
85*4882a593Smuzhiyun err = PTR_ERR(dst);
86*4882a593Smuzhiyun goto drop;
87*4882a593Smuzhiyun }
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun if (ilwt->connected)
90*4882a593Smuzhiyun dst_cache_set_ip6(&ilwt->dst_cache, dst, &fl6.saddr);
91*4882a593Smuzhiyun }
92*4882a593Smuzhiyun
93*4882a593Smuzhiyun skb_dst_set(skb, dst);
94*4882a593Smuzhiyun return dst_output(net, sk, skb);
95*4882a593Smuzhiyun
96*4882a593Smuzhiyun drop:
97*4882a593Smuzhiyun kfree_skb(skb);
98*4882a593Smuzhiyun return err;
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
ila_input(struct sk_buff * skb)101*4882a593Smuzhiyun static int ila_input(struct sk_buff *skb)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun struct dst_entry *dst = skb_dst(skb);
104*4882a593Smuzhiyun struct ila_lwt *ilwt = ila_lwt_lwtunnel(dst->lwtstate);
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun if (skb->protocol != htons(ETH_P_IPV6))
107*4882a593Smuzhiyun goto drop;
108*4882a593Smuzhiyun
109*4882a593Smuzhiyun if (!ilwt->lwt_output)
110*4882a593Smuzhiyun ila_update_ipv6_locator(skb,
111*4882a593Smuzhiyun ila_params_lwtunnel(dst->lwtstate),
112*4882a593Smuzhiyun false);
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun return dst->lwtstate->orig_input(skb);
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun drop:
117*4882a593Smuzhiyun kfree_skb(skb);
118*4882a593Smuzhiyun return -EINVAL;
119*4882a593Smuzhiyun }
120*4882a593Smuzhiyun
121*4882a593Smuzhiyun static const struct nla_policy ila_nl_policy[ILA_ATTR_MAX + 1] = {
122*4882a593Smuzhiyun [ILA_ATTR_LOCATOR] = { .type = NLA_U64, },
123*4882a593Smuzhiyun [ILA_ATTR_CSUM_MODE] = { .type = NLA_U8, },
124*4882a593Smuzhiyun [ILA_ATTR_IDENT_TYPE] = { .type = NLA_U8, },
125*4882a593Smuzhiyun [ILA_ATTR_HOOK_TYPE] = { .type = NLA_U8, },
126*4882a593Smuzhiyun };
127*4882a593Smuzhiyun
ila_build_state(struct net * net,struct nlattr * nla,unsigned int family,const void * cfg,struct lwtunnel_state ** ts,struct netlink_ext_ack * extack)128*4882a593Smuzhiyun static int ila_build_state(struct net *net, struct nlattr *nla,
129*4882a593Smuzhiyun unsigned int family, const void *cfg,
130*4882a593Smuzhiyun struct lwtunnel_state **ts,
131*4882a593Smuzhiyun struct netlink_ext_ack *extack)
132*4882a593Smuzhiyun {
133*4882a593Smuzhiyun struct ila_lwt *ilwt;
134*4882a593Smuzhiyun struct ila_params *p;
135*4882a593Smuzhiyun struct nlattr *tb[ILA_ATTR_MAX + 1];
136*4882a593Smuzhiyun struct lwtunnel_state *newts;
137*4882a593Smuzhiyun const struct fib6_config *cfg6 = cfg;
138*4882a593Smuzhiyun struct ila_addr *iaddr;
139*4882a593Smuzhiyun u8 ident_type = ILA_ATYPE_USE_FORMAT;
140*4882a593Smuzhiyun u8 hook_type = ILA_HOOK_ROUTE_OUTPUT;
141*4882a593Smuzhiyun u8 csum_mode = ILA_CSUM_NO_ACTION;
142*4882a593Smuzhiyun bool lwt_output = true;
143*4882a593Smuzhiyun u8 eff_ident_type;
144*4882a593Smuzhiyun int ret;
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun if (family != AF_INET6)
147*4882a593Smuzhiyun return -EINVAL;
148*4882a593Smuzhiyun
149*4882a593Smuzhiyun ret = nla_parse_nested_deprecated(tb, ILA_ATTR_MAX, nla,
150*4882a593Smuzhiyun ila_nl_policy, extack);
151*4882a593Smuzhiyun if (ret < 0)
152*4882a593Smuzhiyun return ret;
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun if (!tb[ILA_ATTR_LOCATOR])
155*4882a593Smuzhiyun return -EINVAL;
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun iaddr = (struct ila_addr *)&cfg6->fc_dst;
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun if (tb[ILA_ATTR_IDENT_TYPE])
160*4882a593Smuzhiyun ident_type = nla_get_u8(tb[ILA_ATTR_IDENT_TYPE]);
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun if (ident_type == ILA_ATYPE_USE_FORMAT) {
163*4882a593Smuzhiyun /* Infer identifier type from type field in formatted
164*4882a593Smuzhiyun * identifier.
165*4882a593Smuzhiyun */
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun if (cfg6->fc_dst_len < 8 * sizeof(struct ila_locator) + 3) {
168*4882a593Smuzhiyun /* Need to have full locator and at least type field
169*4882a593Smuzhiyun * included in destination
170*4882a593Smuzhiyun */
171*4882a593Smuzhiyun return -EINVAL;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun eff_ident_type = iaddr->ident.type;
175*4882a593Smuzhiyun } else {
176*4882a593Smuzhiyun eff_ident_type = ident_type;
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun switch (eff_ident_type) {
180*4882a593Smuzhiyun case ILA_ATYPE_IID:
181*4882a593Smuzhiyun /* Don't allow ILA for IID type */
182*4882a593Smuzhiyun return -EINVAL;
183*4882a593Smuzhiyun case ILA_ATYPE_LUID:
184*4882a593Smuzhiyun break;
185*4882a593Smuzhiyun case ILA_ATYPE_VIRT_V4:
186*4882a593Smuzhiyun case ILA_ATYPE_VIRT_UNI_V6:
187*4882a593Smuzhiyun case ILA_ATYPE_VIRT_MULTI_V6:
188*4882a593Smuzhiyun case ILA_ATYPE_NONLOCAL_ADDR:
189*4882a593Smuzhiyun /* These ILA formats are not supported yet. */
190*4882a593Smuzhiyun default:
191*4882a593Smuzhiyun return -EINVAL;
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun if (tb[ILA_ATTR_HOOK_TYPE])
195*4882a593Smuzhiyun hook_type = nla_get_u8(tb[ILA_ATTR_HOOK_TYPE]);
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun switch (hook_type) {
198*4882a593Smuzhiyun case ILA_HOOK_ROUTE_OUTPUT:
199*4882a593Smuzhiyun lwt_output = true;
200*4882a593Smuzhiyun break;
201*4882a593Smuzhiyun case ILA_HOOK_ROUTE_INPUT:
202*4882a593Smuzhiyun lwt_output = false;
203*4882a593Smuzhiyun break;
204*4882a593Smuzhiyun default:
205*4882a593Smuzhiyun return -EINVAL;
206*4882a593Smuzhiyun }
207*4882a593Smuzhiyun
208*4882a593Smuzhiyun if (tb[ILA_ATTR_CSUM_MODE])
209*4882a593Smuzhiyun csum_mode = nla_get_u8(tb[ILA_ATTR_CSUM_MODE]);
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun if (csum_mode == ILA_CSUM_NEUTRAL_MAP &&
212*4882a593Smuzhiyun ila_csum_neutral_set(iaddr->ident)) {
213*4882a593Smuzhiyun /* Don't allow translation if checksum neutral bit is
214*4882a593Smuzhiyun * configured and it's set in the SIR address.
215*4882a593Smuzhiyun */
216*4882a593Smuzhiyun return -EINVAL;
217*4882a593Smuzhiyun }
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun newts = lwtunnel_state_alloc(sizeof(*ilwt));
220*4882a593Smuzhiyun if (!newts)
221*4882a593Smuzhiyun return -ENOMEM;
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun ilwt = ila_lwt_lwtunnel(newts);
224*4882a593Smuzhiyun ret = dst_cache_init(&ilwt->dst_cache, GFP_ATOMIC);
225*4882a593Smuzhiyun if (ret) {
226*4882a593Smuzhiyun kfree(newts);
227*4882a593Smuzhiyun return ret;
228*4882a593Smuzhiyun }
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun ilwt->lwt_output = !!lwt_output;
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun p = ila_params_lwtunnel(newts);
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun p->csum_mode = csum_mode;
235*4882a593Smuzhiyun p->ident_type = ident_type;
236*4882a593Smuzhiyun p->locator.v64 = (__force __be64)nla_get_u64(tb[ILA_ATTR_LOCATOR]);
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun /* Precompute checksum difference for translation since we
239*4882a593Smuzhiyun * know both the old locator and the new one.
240*4882a593Smuzhiyun */
241*4882a593Smuzhiyun p->locator_match = iaddr->loc;
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun ila_init_saved_csum(p);
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun newts->type = LWTUNNEL_ENCAP_ILA;
246*4882a593Smuzhiyun newts->flags |= LWTUNNEL_STATE_OUTPUT_REDIRECT |
247*4882a593Smuzhiyun LWTUNNEL_STATE_INPUT_REDIRECT;
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun if (cfg6->fc_dst_len == 8 * sizeof(struct in6_addr))
250*4882a593Smuzhiyun ilwt->connected = 1;
251*4882a593Smuzhiyun
252*4882a593Smuzhiyun *ts = newts;
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun return 0;
255*4882a593Smuzhiyun }
256*4882a593Smuzhiyun
ila_destroy_state(struct lwtunnel_state * lwt)257*4882a593Smuzhiyun static void ila_destroy_state(struct lwtunnel_state *lwt)
258*4882a593Smuzhiyun {
259*4882a593Smuzhiyun dst_cache_destroy(&ila_lwt_lwtunnel(lwt)->dst_cache);
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun
ila_fill_encap_info(struct sk_buff * skb,struct lwtunnel_state * lwtstate)262*4882a593Smuzhiyun static int ila_fill_encap_info(struct sk_buff *skb,
263*4882a593Smuzhiyun struct lwtunnel_state *lwtstate)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun struct ila_params *p = ila_params_lwtunnel(lwtstate);
266*4882a593Smuzhiyun struct ila_lwt *ilwt = ila_lwt_lwtunnel(lwtstate);
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun if (nla_put_u64_64bit(skb, ILA_ATTR_LOCATOR, (__force u64)p->locator.v64,
269*4882a593Smuzhiyun ILA_ATTR_PAD))
270*4882a593Smuzhiyun goto nla_put_failure;
271*4882a593Smuzhiyun
272*4882a593Smuzhiyun if (nla_put_u8(skb, ILA_ATTR_CSUM_MODE, (__force u8)p->csum_mode))
273*4882a593Smuzhiyun goto nla_put_failure;
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun if (nla_put_u8(skb, ILA_ATTR_IDENT_TYPE, (__force u8)p->ident_type))
276*4882a593Smuzhiyun goto nla_put_failure;
277*4882a593Smuzhiyun
278*4882a593Smuzhiyun if (nla_put_u8(skb, ILA_ATTR_HOOK_TYPE,
279*4882a593Smuzhiyun ilwt->lwt_output ? ILA_HOOK_ROUTE_OUTPUT :
280*4882a593Smuzhiyun ILA_HOOK_ROUTE_INPUT))
281*4882a593Smuzhiyun goto nla_put_failure;
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun return 0;
284*4882a593Smuzhiyun
285*4882a593Smuzhiyun nla_put_failure:
286*4882a593Smuzhiyun return -EMSGSIZE;
287*4882a593Smuzhiyun }
288*4882a593Smuzhiyun
ila_encap_nlsize(struct lwtunnel_state * lwtstate)289*4882a593Smuzhiyun static int ila_encap_nlsize(struct lwtunnel_state *lwtstate)
290*4882a593Smuzhiyun {
291*4882a593Smuzhiyun return nla_total_size_64bit(sizeof(u64)) + /* ILA_ATTR_LOCATOR */
292*4882a593Smuzhiyun nla_total_size(sizeof(u8)) + /* ILA_ATTR_CSUM_MODE */
293*4882a593Smuzhiyun nla_total_size(sizeof(u8)) + /* ILA_ATTR_IDENT_TYPE */
294*4882a593Smuzhiyun nla_total_size(sizeof(u8)) + /* ILA_ATTR_HOOK_TYPE */
295*4882a593Smuzhiyun 0;
296*4882a593Smuzhiyun }
297*4882a593Smuzhiyun
ila_encap_cmp(struct lwtunnel_state * a,struct lwtunnel_state * b)298*4882a593Smuzhiyun static int ila_encap_cmp(struct lwtunnel_state *a, struct lwtunnel_state *b)
299*4882a593Smuzhiyun {
300*4882a593Smuzhiyun struct ila_params *a_p = ila_params_lwtunnel(a);
301*4882a593Smuzhiyun struct ila_params *b_p = ila_params_lwtunnel(b);
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun return (a_p->locator.v64 != b_p->locator.v64);
304*4882a593Smuzhiyun }
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun static const struct lwtunnel_encap_ops ila_encap_ops = {
307*4882a593Smuzhiyun .build_state = ila_build_state,
308*4882a593Smuzhiyun .destroy_state = ila_destroy_state,
309*4882a593Smuzhiyun .output = ila_output,
310*4882a593Smuzhiyun .input = ila_input,
311*4882a593Smuzhiyun .fill_encap = ila_fill_encap_info,
312*4882a593Smuzhiyun .get_encap_size = ila_encap_nlsize,
313*4882a593Smuzhiyun .cmp_encap = ila_encap_cmp,
314*4882a593Smuzhiyun .owner = THIS_MODULE,
315*4882a593Smuzhiyun };
316*4882a593Smuzhiyun
ila_lwt_init(void)317*4882a593Smuzhiyun int ila_lwt_init(void)
318*4882a593Smuzhiyun {
319*4882a593Smuzhiyun return lwtunnel_encap_add_ops(&ila_encap_ops, LWTUNNEL_ENCAP_ILA);
320*4882a593Smuzhiyun }
321*4882a593Smuzhiyun
ila_lwt_fini(void)322*4882a593Smuzhiyun void ila_lwt_fini(void)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun lwtunnel_encap_del_ops(&ila_encap_ops, LWTUNNEL_ENCAP_ILA);
325*4882a593Smuzhiyun }
326