xref: /OK3568_Linux_fs/kernel/samples/bpf/xdp_router_ipv4_kern.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* Copyright (C) 2017 Cavium, Inc.
2*4882a593Smuzhiyun  *
3*4882a593Smuzhiyun  * This program is free software; you can redistribute it and/or modify it
4*4882a593Smuzhiyun  * under the terms of version 2 of the GNU General Public License
5*4882a593Smuzhiyun  * as published by the Free Software Foundation.
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun #define KBUILD_MODNAME "foo"
8*4882a593Smuzhiyun #include <uapi/linux/bpf.h>
9*4882a593Smuzhiyun #include <linux/in.h>
10*4882a593Smuzhiyun #include <linux/if_ether.h>
11*4882a593Smuzhiyun #include <linux/if_packet.h>
12*4882a593Smuzhiyun #include <linux/if_vlan.h>
13*4882a593Smuzhiyun #include <linux/ip.h>
14*4882a593Smuzhiyun #include <linux/ipv6.h>
15*4882a593Smuzhiyun #include <bpf/bpf_helpers.h>
16*4882a593Smuzhiyun #include <linux/slab.h>
17*4882a593Smuzhiyun #include <net/ip_fib.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun struct trie_value {
20*4882a593Smuzhiyun 	__u8 prefix[4];
21*4882a593Smuzhiyun 	__be64 value;
22*4882a593Smuzhiyun 	int ifindex;
23*4882a593Smuzhiyun 	int metric;
24*4882a593Smuzhiyun 	__be32 gw;
25*4882a593Smuzhiyun };
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun /* Key for lpm_trie*/
28*4882a593Smuzhiyun union key_4 {
29*4882a593Smuzhiyun 	u32 b32[2];
30*4882a593Smuzhiyun 	u8 b8[8];
31*4882a593Smuzhiyun };
32*4882a593Smuzhiyun 
33*4882a593Smuzhiyun struct arp_entry {
34*4882a593Smuzhiyun 	__be64 mac;
35*4882a593Smuzhiyun 	__be32 dst;
36*4882a593Smuzhiyun };
37*4882a593Smuzhiyun 
38*4882a593Smuzhiyun struct direct_map {
39*4882a593Smuzhiyun 	struct arp_entry arp;
40*4882a593Smuzhiyun 	int ifindex;
41*4882a593Smuzhiyun 	__be64 mac;
42*4882a593Smuzhiyun };
43*4882a593Smuzhiyun 
44*4882a593Smuzhiyun /* Map for trie implementation*/
45*4882a593Smuzhiyun struct {
46*4882a593Smuzhiyun 	__uint(type, BPF_MAP_TYPE_LPM_TRIE);
47*4882a593Smuzhiyun 	__uint(key_size, 8);
48*4882a593Smuzhiyun 	__uint(value_size, sizeof(struct trie_value));
49*4882a593Smuzhiyun 	__uint(max_entries, 50);
50*4882a593Smuzhiyun 	__uint(map_flags, BPF_F_NO_PREALLOC);
51*4882a593Smuzhiyun } lpm_map SEC(".maps");
52*4882a593Smuzhiyun 
53*4882a593Smuzhiyun /* Map for counter*/
54*4882a593Smuzhiyun struct {
55*4882a593Smuzhiyun 	__uint(type, BPF_MAP_TYPE_PERCPU_ARRAY);
56*4882a593Smuzhiyun 	__type(key, u32);
57*4882a593Smuzhiyun 	__type(value, u64);
58*4882a593Smuzhiyun 	__uint(max_entries, 256);
59*4882a593Smuzhiyun } rxcnt SEC(".maps");
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun /* Map for ARP table*/
62*4882a593Smuzhiyun struct {
63*4882a593Smuzhiyun 	__uint(type, BPF_MAP_TYPE_HASH);
64*4882a593Smuzhiyun 	__type(key, __be32);
65*4882a593Smuzhiyun 	__type(value, __be64);
66*4882a593Smuzhiyun 	__uint(max_entries, 50);
67*4882a593Smuzhiyun } arp_table SEC(".maps");
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun /* Map to keep the exact match entries in the route table*/
70*4882a593Smuzhiyun struct {
71*4882a593Smuzhiyun 	__uint(type, BPF_MAP_TYPE_HASH);
72*4882a593Smuzhiyun 	__type(key, __be32);
73*4882a593Smuzhiyun 	__type(value, struct direct_map);
74*4882a593Smuzhiyun 	__uint(max_entries, 50);
75*4882a593Smuzhiyun } exact_match SEC(".maps");
76*4882a593Smuzhiyun 
77*4882a593Smuzhiyun struct {
78*4882a593Smuzhiyun 	__uint(type, BPF_MAP_TYPE_DEVMAP);
79*4882a593Smuzhiyun 	__uint(key_size, sizeof(int));
80*4882a593Smuzhiyun 	__uint(value_size, sizeof(int));
81*4882a593Smuzhiyun 	__uint(max_entries, 100);
82*4882a593Smuzhiyun } tx_port SEC(".maps");
83*4882a593Smuzhiyun 
/*
 * Overwrite the two MAC addresses at the start of an Ethernet frame.
 *
 * @data: start of the frame; bytes 0-5 receive the destination address and
 *        bytes 6-11 the source address
 * @src:  new source MAC; the first 6 bytes are read
 * @dst:  new destination MAC; the first 6 bytes are read
 *
 * All three pointers are accessed through 16-bit types, so they are
 * expected to be at least 2-byte aligned.
 */
static inline void set_src_dst_mac(void *data, void *src, void *dst)
{
	/* A MAC address is three 16-bit words. */
	enum { MAC_WORDS = 3 };
	unsigned short *hdr = data;
	unsigned short *new_dst = dst;
	unsigned short *new_src = src;

	/* Destination address comes first on the wire, source follows it. */
	__builtin_memcpy(&hdr[0], new_dst, MAC_WORDS * sizeof(*hdr));
	__builtin_memcpy(&hdr[MAC_WORDS], new_src, MAC_WORDS * sizeof(*hdr));
}
94*4882a593Smuzhiyun 
95*4882a593Smuzhiyun /* Parse IPV4 packet to get SRC, DST IP and protocol */
parse_ipv4(void * data,u64 nh_off,void * data_end,__be32 * src,__be32 * dest)96*4882a593Smuzhiyun static inline int parse_ipv4(void *data, u64 nh_off, void *data_end,
97*4882a593Smuzhiyun 			     __be32 *src, __be32 *dest)
98*4882a593Smuzhiyun {
99*4882a593Smuzhiyun 	struct iphdr *iph = data + nh_off;
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 	if (iph + 1 > data_end)
102*4882a593Smuzhiyun 		return 0;
103*4882a593Smuzhiyun 	*src = iph->saddr;
104*4882a593Smuzhiyun 	*dest = iph->daddr;
105*4882a593Smuzhiyun 	return iph->protocol;
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun SEC("xdp_router_ipv4")
xdp_router_ipv4_prog(struct xdp_md * ctx)109*4882a593Smuzhiyun int xdp_router_ipv4_prog(struct xdp_md *ctx)
110*4882a593Smuzhiyun {
111*4882a593Smuzhiyun 	void *data_end = (void *)(long)ctx->data_end;
112*4882a593Smuzhiyun 	__be64 *dest_mac = NULL, *src_mac = NULL;
113*4882a593Smuzhiyun 	void *data = (void *)(long)ctx->data;
114*4882a593Smuzhiyun 	struct trie_value *prefix_value;
115*4882a593Smuzhiyun 	int rc = XDP_DROP, forward_to;
116*4882a593Smuzhiyun 	struct ethhdr *eth = data;
117*4882a593Smuzhiyun 	union key_4 key4;
118*4882a593Smuzhiyun 	long *value;
119*4882a593Smuzhiyun 	u16 h_proto;
120*4882a593Smuzhiyun 	u32 ipproto;
121*4882a593Smuzhiyun 	u64 nh_off;
122*4882a593Smuzhiyun 
123*4882a593Smuzhiyun 	nh_off = sizeof(*eth);
124*4882a593Smuzhiyun 	if (data + nh_off > data_end)
125*4882a593Smuzhiyun 		return rc;
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun 	h_proto = eth->h_proto;
128*4882a593Smuzhiyun 
129*4882a593Smuzhiyun 	if (h_proto == htons(ETH_P_8021Q) || h_proto == htons(ETH_P_8021AD)) {
130*4882a593Smuzhiyun 		struct vlan_hdr *vhdr;
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 		vhdr = data + nh_off;
133*4882a593Smuzhiyun 		nh_off += sizeof(struct vlan_hdr);
134*4882a593Smuzhiyun 		if (data + nh_off > data_end)
135*4882a593Smuzhiyun 			return rc;
136*4882a593Smuzhiyun 		h_proto = vhdr->h_vlan_encapsulated_proto;
137*4882a593Smuzhiyun 	}
138*4882a593Smuzhiyun 	if (h_proto == htons(ETH_P_ARP)) {
139*4882a593Smuzhiyun 		return XDP_PASS;
140*4882a593Smuzhiyun 	} else if (h_proto == htons(ETH_P_IP)) {
141*4882a593Smuzhiyun 		struct direct_map *direct_entry;
142*4882a593Smuzhiyun 		__be32 src_ip = 0, dest_ip = 0;
143*4882a593Smuzhiyun 
144*4882a593Smuzhiyun 		ipproto = parse_ipv4(data, nh_off, data_end, &src_ip, &dest_ip);
145*4882a593Smuzhiyun 		direct_entry = bpf_map_lookup_elem(&exact_match, &dest_ip);
146*4882a593Smuzhiyun 		/* Check for exact match, this would give a faster lookup*/
147*4882a593Smuzhiyun 		if (direct_entry && direct_entry->mac && direct_entry->arp.mac) {
148*4882a593Smuzhiyun 			src_mac = &direct_entry->mac;
149*4882a593Smuzhiyun 			dest_mac = &direct_entry->arp.mac;
150*4882a593Smuzhiyun 			forward_to = direct_entry->ifindex;
151*4882a593Smuzhiyun 		} else {
152*4882a593Smuzhiyun 			/* Look up in the trie for lpm*/
153*4882a593Smuzhiyun 			key4.b32[0] = 32;
154*4882a593Smuzhiyun 			key4.b8[4] = dest_ip & 0xff;
155*4882a593Smuzhiyun 			key4.b8[5] = (dest_ip >> 8) & 0xff;
156*4882a593Smuzhiyun 			key4.b8[6] = (dest_ip >> 16) & 0xff;
157*4882a593Smuzhiyun 			key4.b8[7] = (dest_ip >> 24) & 0xff;
158*4882a593Smuzhiyun 			prefix_value = bpf_map_lookup_elem(&lpm_map, &key4);
159*4882a593Smuzhiyun 			if (!prefix_value)
160*4882a593Smuzhiyun 				return XDP_DROP;
161*4882a593Smuzhiyun 			src_mac = &prefix_value->value;
162*4882a593Smuzhiyun 			if (!src_mac)
163*4882a593Smuzhiyun 				return XDP_DROP;
164*4882a593Smuzhiyun 			dest_mac = bpf_map_lookup_elem(&arp_table, &dest_ip);
165*4882a593Smuzhiyun 			if (!dest_mac) {
166*4882a593Smuzhiyun 				if (!prefix_value->gw)
167*4882a593Smuzhiyun 					return XDP_DROP;
168*4882a593Smuzhiyun 				dest_ip = prefix_value->gw;
169*4882a593Smuzhiyun 				dest_mac = bpf_map_lookup_elem(&arp_table, &dest_ip);
170*4882a593Smuzhiyun 			}
171*4882a593Smuzhiyun 			forward_to = prefix_value->ifindex;
172*4882a593Smuzhiyun 		}
173*4882a593Smuzhiyun 	} else {
174*4882a593Smuzhiyun 		ipproto = 0;
175*4882a593Smuzhiyun 	}
176*4882a593Smuzhiyun 	if (src_mac && dest_mac) {
177*4882a593Smuzhiyun 		set_src_dst_mac(data, src_mac, dest_mac);
178*4882a593Smuzhiyun 		value = bpf_map_lookup_elem(&rxcnt, &ipproto);
179*4882a593Smuzhiyun 		if (value)
180*4882a593Smuzhiyun 			*value += 1;
181*4882a593Smuzhiyun 		return  bpf_redirect_map(&tx_port, forward_to, 0);
182*4882a593Smuzhiyun 	}
183*4882a593Smuzhiyun 	return rc;
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun 
186*4882a593Smuzhiyun char _license[] SEC("license") = "GPL";
187