xref: /OK3568_Linux_fs/kernel/tools/testing/selftests/net/msg_zerocopy.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* Evaluate MSG_ZEROCOPY
2*4882a593Smuzhiyun  *
3*4882a593Smuzhiyun  * Send traffic between two processes over one of the supported
4*4882a593Smuzhiyun  * protocols and modes:
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * PF_INET/PF_INET6
7*4882a593Smuzhiyun  * - SOCK_STREAM
8*4882a593Smuzhiyun  * - SOCK_DGRAM
9*4882a593Smuzhiyun  * - SOCK_DGRAM with UDP_CORK
10*4882a593Smuzhiyun  * - SOCK_RAW
11*4882a593Smuzhiyun  * - SOCK_RAW with IP_HDRINCL
12*4882a593Smuzhiyun  *
13*4882a593Smuzhiyun  * PF_PACKET
14*4882a593Smuzhiyun  * - SOCK_DGRAM
15*4882a593Smuzhiyun  * - SOCK_RAW
16*4882a593Smuzhiyun  *
17*4882a593Smuzhiyun  * PF_RDS
18*4882a593Smuzhiyun  * - SOCK_SEQPACKET
19*4882a593Smuzhiyun  *
20*4882a593Smuzhiyun  * Start this program on two connected hosts, one in send mode and
21*4882a593Smuzhiyun  * the other with option '-r' to put it in receiver mode.
22*4882a593Smuzhiyun  *
23*4882a593Smuzhiyun  * If zerocopy mode ('-z') is enabled, the sender will verify that
24*4882a593Smuzhiyun  * the kernel queues completions on the error queue for all zerocopy
25*4882a593Smuzhiyun  * transfers.
26*4882a593Smuzhiyun  */
27*4882a593Smuzhiyun 
28*4882a593Smuzhiyun #define _GNU_SOURCE
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun #include <arpa/inet.h>
31*4882a593Smuzhiyun #include <error.h>
32*4882a593Smuzhiyun #include <errno.h>
33*4882a593Smuzhiyun #include <limits.h>
34*4882a593Smuzhiyun #include <linux/errqueue.h>
35*4882a593Smuzhiyun #include <linux/if_packet.h>
36*4882a593Smuzhiyun #include <linux/ipv6.h>
37*4882a593Smuzhiyun #include <linux/socket.h>
38*4882a593Smuzhiyun #include <linux/sockios.h>
39*4882a593Smuzhiyun #include <net/ethernet.h>
40*4882a593Smuzhiyun #include <net/if.h>
41*4882a593Smuzhiyun #include <netinet/ip.h>
42*4882a593Smuzhiyun #include <netinet/ip6.h>
43*4882a593Smuzhiyun #include <netinet/tcp.h>
44*4882a593Smuzhiyun #include <netinet/udp.h>
45*4882a593Smuzhiyun #include <poll.h>
46*4882a593Smuzhiyun #include <sched.h>
47*4882a593Smuzhiyun #include <stdbool.h>
48*4882a593Smuzhiyun #include <stdio.h>
49*4882a593Smuzhiyun #include <stdint.h>
50*4882a593Smuzhiyun #include <stdlib.h>
51*4882a593Smuzhiyun #include <string.h>
52*4882a593Smuzhiyun #include <sys/ioctl.h>
53*4882a593Smuzhiyun #include <sys/socket.h>
54*4882a593Smuzhiyun #include <sys/stat.h>
55*4882a593Smuzhiyun #include <sys/time.h>
56*4882a593Smuzhiyun #include <sys/types.h>
57*4882a593Smuzhiyun #include <sys/wait.h>
58*4882a593Smuzhiyun #include <unistd.h>
59*4882a593Smuzhiyun #include <linux/rds.h>
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun #ifndef SO_EE_ORIGIN_ZEROCOPY
62*4882a593Smuzhiyun #define SO_EE_ORIGIN_ZEROCOPY		5
63*4882a593Smuzhiyun #endif
64*4882a593Smuzhiyun 
65*4882a593Smuzhiyun #ifndef SO_ZEROCOPY
66*4882a593Smuzhiyun #define SO_ZEROCOPY	60
67*4882a593Smuzhiyun #endif
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun #ifndef SO_EE_CODE_ZEROCOPY_COPIED
70*4882a593Smuzhiyun #define SO_EE_CODE_ZEROCOPY_COPIED	1
71*4882a593Smuzhiyun #endif
72*4882a593Smuzhiyun 
73*4882a593Smuzhiyun #ifndef MSG_ZEROCOPY
74*4882a593Smuzhiyun #define MSG_ZEROCOPY	0x4000000
75*4882a593Smuzhiyun #endif
76*4882a593Smuzhiyun 
/* Test configuration. The values below are the built-in defaults;
 * parse_opts() overrides at least the family, address length and
 * payload length.
 */

/* mode selection */
static bool cfg_rx;				/* run as receiver */
static bool cfg_zerocopy;			/* send with MSG_ZEROCOPY */
static int  cfg_cork;				/* sends per corked datagram */
static bool cfg_cork_mixed;			/* alternate copy/zerocopy frags */
static int  cfg_verbose;

/* addressing */
static int  cfg_family = PF_UNSPEC;
static int  cfg_port = 8000;
static int  cfg_ifindex = 1;			/* used for PF_PACKET sends */
static socklen_t cfg_alen;
static struct sockaddr_storage cfg_dst_addr;
static struct sockaddr_storage cfg_src_addr;

/* sizing, timing and placement */
static int  cfg_payload_len;
static int  cfg_runtime_ms = 4200;
static int  cfg_waittime_ms = 500;		/* poll timeout */
static int  cfg_cpu = -1;			/* default: pin to last cpu */

/* payload source buffer; do_test() fills it with a repeating a..z pattern */
static char payload[IP_MAXPACKET];

/* running statistics */
static long packets;
static long bytes;
static long completions;
static long expected_completions;
static uint32_t next_completion;		/* next expected notification id */
static int  zerocopied = -1;			/* -1 until first notification */
98*4882a593Smuzhiyun 
/* Return the current time of day, as reported by gettimeofday(),
 * expressed in milliseconds.
 */
static unsigned long gettimeofday_ms(void)
{
	struct timeval now;
	time_t sec_as_ms;
	suseconds_t usec_as_ms;

	gettimeofday(&now, NULL);

	sec_as_ms = now.tv_sec * 1000;
	usec_as_ms = now.tv_usec / 1000;

	return sec_as_ms + usec_as_ms;
}
106*4882a593Smuzhiyun 
/* Compute the one's-complement checksum over @num_words 16-bit words
 * starting at @start: add all words, fold the carries back into the low
 * 16 bits, and return the bitwise complement of the result.
 */
static uint16_t get_ip_csum(const uint16_t *start, int num_words)
{
	const uint16_t *word = start;
	unsigned long acc = 0;
	int remaining;

	for (remaining = num_words; remaining > 0; remaining--)
		acc += *word++;

	/* fold until nothing is left above bit 15 */
	for (; acc >> 16; )
		acc = (acc >> 16) + (acc & 0xFFFF);

	return ~acc;
}
120*4882a593Smuzhiyun 
do_setcpu(int cpu)121*4882a593Smuzhiyun static int do_setcpu(int cpu)
122*4882a593Smuzhiyun {
123*4882a593Smuzhiyun 	cpu_set_t mask;
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun 	CPU_ZERO(&mask);
126*4882a593Smuzhiyun 	CPU_SET(cpu, &mask);
127*4882a593Smuzhiyun 	if (sched_setaffinity(0, sizeof(mask), &mask))
128*4882a593Smuzhiyun 		fprintf(stderr, "cpu: unable to pin, may increase variance.\n");
129*4882a593Smuzhiyun 	else if (cfg_verbose)
130*4882a593Smuzhiyun 		fprintf(stderr, "cpu: %u\n", cpu);
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	return 0;
133*4882a593Smuzhiyun }
134*4882a593Smuzhiyun 
/* Set an integer-valued socket option on @fd.
 * Terminates the program through error() if setsockopt() fails.
 */
static void do_setsockopt(int fd, int level, int optname, int val)
{
	const int rc = setsockopt(fd, level, optname, &val, sizeof(val));

	if (rc != 0)
		error(1, errno, "setsockopt %d.%d: %d", level, optname, val);
}
140*4882a593Smuzhiyun 
do_poll(int fd,int events)141*4882a593Smuzhiyun static int do_poll(int fd, int events)
142*4882a593Smuzhiyun {
143*4882a593Smuzhiyun 	struct pollfd pfd;
144*4882a593Smuzhiyun 	int ret;
145*4882a593Smuzhiyun 
146*4882a593Smuzhiyun 	pfd.events = events;
147*4882a593Smuzhiyun 	pfd.revents = 0;
148*4882a593Smuzhiyun 	pfd.fd = fd;
149*4882a593Smuzhiyun 
150*4882a593Smuzhiyun 	ret = poll(&pfd, 1, cfg_waittime_ms);
151*4882a593Smuzhiyun 	if (ret == -1)
152*4882a593Smuzhiyun 		error(1, errno, "poll");
153*4882a593Smuzhiyun 
154*4882a593Smuzhiyun 	return ret && (pfd.revents & events);
155*4882a593Smuzhiyun }
156*4882a593Smuzhiyun 
/* Accept one connection on listening socket @fd, then close the
 * listening socket. Returns the connected socket. Any failure
 * terminates the program.
 */
static int do_accept(int fd)
{
	const int listen_fd = fd;
	int conn_fd;

	conn_fd = accept(listen_fd, NULL, NULL);
	if (conn_fd == -1)
		error(1, errno, "accept");

	if (close(listen_fd) != 0)
		error(1, errno, "close listen sock");

	return conn_fd;
}
169*4882a593Smuzhiyun 
/* Write an RDS zerocopy cookie control message into @msg.
 *
 * @msg:    message whose msg_control buffer receives the cmsg. The buffer
 *          must already be attached; it is written from its start.
 * @cookie: value stored as the cmsg payload.
 *
 * A missing control buffer is a programming error and terminates the
 * program. No errno is reported for it, because no system call failed.
 */
static void add_zcopy_cookie(struct msghdr *msg, uint32_t cookie)
{
	struct cmsghdr *cm;

	if (!msg->msg_control)
		error(1, 0, "NULL cookie");

	cm = msg->msg_control;
	cm->cmsg_len = CMSG_LEN(sizeof(cookie));
	cm->cmsg_level = SOL_RDS;
	cm->cmsg_type = RDS_CMSG_ZCOPY_COOKIE;
	/* CMSG_DATA() is only byte-aligned by contract, so copy, don't cast */
	memcpy(CMSG_DATA(cm), &cookie, sizeof(cookie));
}
182*4882a593Smuzhiyun 
do_sendmsg(int fd,struct msghdr * msg,bool do_zerocopy,int domain)183*4882a593Smuzhiyun static bool do_sendmsg(int fd, struct msghdr *msg, bool do_zerocopy, int domain)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun 	int ret, len, i, flags;
186*4882a593Smuzhiyun 	static uint32_t cookie;
187*4882a593Smuzhiyun 	char ckbuf[CMSG_SPACE(sizeof(cookie))];
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	len = 0;
190*4882a593Smuzhiyun 	for (i = 0; i < msg->msg_iovlen; i++)
191*4882a593Smuzhiyun 		len += msg->msg_iov[i].iov_len;
192*4882a593Smuzhiyun 
193*4882a593Smuzhiyun 	flags = MSG_DONTWAIT;
194*4882a593Smuzhiyun 	if (do_zerocopy) {
195*4882a593Smuzhiyun 		flags |= MSG_ZEROCOPY;
196*4882a593Smuzhiyun 		if (domain == PF_RDS) {
197*4882a593Smuzhiyun 			memset(&msg->msg_control, 0, sizeof(msg->msg_control));
198*4882a593Smuzhiyun 			msg->msg_controllen = CMSG_SPACE(sizeof(cookie));
199*4882a593Smuzhiyun 			msg->msg_control = (struct cmsghdr *)ckbuf;
200*4882a593Smuzhiyun 			add_zcopy_cookie(msg, ++cookie);
201*4882a593Smuzhiyun 		}
202*4882a593Smuzhiyun 	}
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun 	ret = sendmsg(fd, msg, flags);
205*4882a593Smuzhiyun 	if (ret == -1 && errno == EAGAIN)
206*4882a593Smuzhiyun 		return false;
207*4882a593Smuzhiyun 	if (ret == -1)
208*4882a593Smuzhiyun 		error(1, errno, "send");
209*4882a593Smuzhiyun 	if (cfg_verbose && ret != len)
210*4882a593Smuzhiyun 		fprintf(stderr, "send: ret=%u != %u\n", ret, len);
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 	if (len) {
213*4882a593Smuzhiyun 		packets++;
214*4882a593Smuzhiyun 		bytes += ret;
215*4882a593Smuzhiyun 		if (do_zerocopy && ret)
216*4882a593Smuzhiyun 			expected_completions++;
217*4882a593Smuzhiyun 	}
218*4882a593Smuzhiyun 	if (do_zerocopy && domain == PF_RDS) {
219*4882a593Smuzhiyun 		msg->msg_control = NULL;
220*4882a593Smuzhiyun 		msg->msg_controllen = 0;
221*4882a593Smuzhiyun 	}
222*4882a593Smuzhiyun 
223*4882a593Smuzhiyun 	return true;
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun 
do_sendmsg_corked(int fd,struct msghdr * msg)226*4882a593Smuzhiyun static void do_sendmsg_corked(int fd, struct msghdr *msg)
227*4882a593Smuzhiyun {
228*4882a593Smuzhiyun 	bool do_zerocopy = cfg_zerocopy;
229*4882a593Smuzhiyun 	int i, payload_len, extra_len;
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun 	/* split up the packet. for non-multiple, make first buffer longer */
232*4882a593Smuzhiyun 	payload_len = cfg_payload_len / cfg_cork;
233*4882a593Smuzhiyun 	extra_len = cfg_payload_len - (cfg_cork * payload_len);
234*4882a593Smuzhiyun 
235*4882a593Smuzhiyun 	do_setsockopt(fd, IPPROTO_UDP, UDP_CORK, 1);
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun 	for (i = 0; i < cfg_cork; i++) {
238*4882a593Smuzhiyun 
239*4882a593Smuzhiyun 		/* in mixed-frags mode, alternate zerocopy and copy frags
240*4882a593Smuzhiyun 		 * start with non-zerocopy, to ensure attach later works
241*4882a593Smuzhiyun 		 */
242*4882a593Smuzhiyun 		if (cfg_cork_mixed)
243*4882a593Smuzhiyun 			do_zerocopy = (i & 1);
244*4882a593Smuzhiyun 
245*4882a593Smuzhiyun 		msg->msg_iov[0].iov_len = payload_len + extra_len;
246*4882a593Smuzhiyun 		extra_len = 0;
247*4882a593Smuzhiyun 
248*4882a593Smuzhiyun 		do_sendmsg(fd, msg, do_zerocopy,
249*4882a593Smuzhiyun 			   (cfg_dst_addr.ss_family == AF_INET ?
250*4882a593Smuzhiyun 			    PF_INET : PF_INET6));
251*4882a593Smuzhiyun 	}
252*4882a593Smuzhiyun 
253*4882a593Smuzhiyun 	do_setsockopt(fd, IPPROTO_UDP, UDP_CORK, 0);
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun 
setup_iph(struct iphdr * iph,uint16_t payload_len)256*4882a593Smuzhiyun static int setup_iph(struct iphdr *iph, uint16_t payload_len)
257*4882a593Smuzhiyun {
258*4882a593Smuzhiyun 	struct sockaddr_in *daddr = (void *) &cfg_dst_addr;
259*4882a593Smuzhiyun 	struct sockaddr_in *saddr = (void *) &cfg_src_addr;
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 	memset(iph, 0, sizeof(*iph));
262*4882a593Smuzhiyun 
263*4882a593Smuzhiyun 	iph->version	= 4;
264*4882a593Smuzhiyun 	iph->tos	= 0;
265*4882a593Smuzhiyun 	iph->ihl	= 5;
266*4882a593Smuzhiyun 	iph->ttl	= 2;
267*4882a593Smuzhiyun 	iph->saddr	= saddr->sin_addr.s_addr;
268*4882a593Smuzhiyun 	iph->daddr	= daddr->sin_addr.s_addr;
269*4882a593Smuzhiyun 	iph->protocol	= IPPROTO_EGP;
270*4882a593Smuzhiyun 	iph->tot_len	= htons(sizeof(*iph) + payload_len);
271*4882a593Smuzhiyun 	iph->check	= get_ip_csum((void *) iph, iph->ihl << 1);
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun 	return sizeof(*iph);
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun 
setup_ip6h(struct ipv6hdr * ip6h,uint16_t payload_len)276*4882a593Smuzhiyun static int setup_ip6h(struct ipv6hdr *ip6h, uint16_t payload_len)
277*4882a593Smuzhiyun {
278*4882a593Smuzhiyun 	struct sockaddr_in6 *daddr = (void *) &cfg_dst_addr;
279*4882a593Smuzhiyun 	struct sockaddr_in6 *saddr = (void *) &cfg_src_addr;
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	memset(ip6h, 0, sizeof(*ip6h));
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun 	ip6h->version		= 6;
284*4882a593Smuzhiyun 	ip6h->payload_len	= htons(payload_len);
285*4882a593Smuzhiyun 	ip6h->nexthdr		= IPPROTO_EGP;
286*4882a593Smuzhiyun 	ip6h->hop_limit		= 2;
287*4882a593Smuzhiyun 	ip6h->saddr		= saddr->sin6_addr;
288*4882a593Smuzhiyun 	ip6h->daddr		= daddr->sin6_addr;
289*4882a593Smuzhiyun 
290*4882a593Smuzhiyun 	return sizeof(*ip6h);
291*4882a593Smuzhiyun }
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 
setup_sockaddr(int domain,const char * str_addr,struct sockaddr_storage * sockaddr)294*4882a593Smuzhiyun static void setup_sockaddr(int domain, const char *str_addr,
295*4882a593Smuzhiyun 			   struct sockaddr_storage *sockaddr)
296*4882a593Smuzhiyun {
297*4882a593Smuzhiyun 	struct sockaddr_in6 *addr6 = (void *) sockaddr;
298*4882a593Smuzhiyun 	struct sockaddr_in *addr4 = (void *) sockaddr;
299*4882a593Smuzhiyun 
300*4882a593Smuzhiyun 	switch (domain) {
301*4882a593Smuzhiyun 	case PF_INET:
302*4882a593Smuzhiyun 		memset(addr4, 0, sizeof(*addr4));
303*4882a593Smuzhiyun 		addr4->sin_family = AF_INET;
304*4882a593Smuzhiyun 		addr4->sin_port = htons(cfg_port);
305*4882a593Smuzhiyun 		if (str_addr &&
306*4882a593Smuzhiyun 		    inet_pton(AF_INET, str_addr, &(addr4->sin_addr)) != 1)
307*4882a593Smuzhiyun 			error(1, 0, "ipv4 parse error: %s", str_addr);
308*4882a593Smuzhiyun 		break;
309*4882a593Smuzhiyun 	case PF_INET6:
310*4882a593Smuzhiyun 		memset(addr6, 0, sizeof(*addr6));
311*4882a593Smuzhiyun 		addr6->sin6_family = AF_INET6;
312*4882a593Smuzhiyun 		addr6->sin6_port = htons(cfg_port);
313*4882a593Smuzhiyun 		if (str_addr &&
314*4882a593Smuzhiyun 		    inet_pton(AF_INET6, str_addr, &(addr6->sin6_addr)) != 1)
315*4882a593Smuzhiyun 			error(1, 0, "ipv6 parse error: %s", str_addr);
316*4882a593Smuzhiyun 		break;
317*4882a593Smuzhiyun 	default:
318*4882a593Smuzhiyun 		error(1, 0, "illegal domain");
319*4882a593Smuzhiyun 	}
320*4882a593Smuzhiyun }
321*4882a593Smuzhiyun 
do_setup_tx(int domain,int type,int protocol)322*4882a593Smuzhiyun static int do_setup_tx(int domain, int type, int protocol)
323*4882a593Smuzhiyun {
324*4882a593Smuzhiyun 	int fd;
325*4882a593Smuzhiyun 
326*4882a593Smuzhiyun 	fd = socket(domain, type, protocol);
327*4882a593Smuzhiyun 	if (fd == -1)
328*4882a593Smuzhiyun 		error(1, errno, "socket t");
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	do_setsockopt(fd, SOL_SOCKET, SO_SNDBUF, 1 << 21);
331*4882a593Smuzhiyun 	if (cfg_zerocopy)
332*4882a593Smuzhiyun 		do_setsockopt(fd, SOL_SOCKET, SO_ZEROCOPY, 1);
333*4882a593Smuzhiyun 
334*4882a593Smuzhiyun 	if (domain != PF_PACKET && domain != PF_RDS)
335*4882a593Smuzhiyun 		if (connect(fd, (void *) &cfg_dst_addr, cfg_alen))
336*4882a593Smuzhiyun 			error(1, errno, "connect");
337*4882a593Smuzhiyun 
338*4882a593Smuzhiyun 	if (domain == PF_RDS) {
339*4882a593Smuzhiyun 		if (bind(fd, (void *) &cfg_src_addr, cfg_alen))
340*4882a593Smuzhiyun 			error(1, errno, "bind");
341*4882a593Smuzhiyun 	}
342*4882a593Smuzhiyun 
343*4882a593Smuzhiyun 	return fd;
344*4882a593Smuzhiyun }
345*4882a593Smuzhiyun 
do_process_zerocopy_cookies(struct rds_zcopy_cookies * ck)346*4882a593Smuzhiyun static uint32_t do_process_zerocopy_cookies(struct rds_zcopy_cookies *ck)
347*4882a593Smuzhiyun {
348*4882a593Smuzhiyun 	int i;
349*4882a593Smuzhiyun 
350*4882a593Smuzhiyun 	if (ck->num > RDS_MAX_ZCOOKIES)
351*4882a593Smuzhiyun 		error(1, 0, "Returned %d cookies, max expected %d\n",
352*4882a593Smuzhiyun 		      ck->num, RDS_MAX_ZCOOKIES);
353*4882a593Smuzhiyun 	for (i = 0; i < ck->num; i++)
354*4882a593Smuzhiyun 		if (cfg_verbose >= 2)
355*4882a593Smuzhiyun 			fprintf(stderr, "%d\n", ck->cookies[i]);
356*4882a593Smuzhiyun 	return ck->num;
357*4882a593Smuzhiyun }
358*4882a593Smuzhiyun 
do_recvmsg_completion(int fd)359*4882a593Smuzhiyun static bool do_recvmsg_completion(int fd)
360*4882a593Smuzhiyun {
361*4882a593Smuzhiyun 	char cmsgbuf[CMSG_SPACE(sizeof(struct rds_zcopy_cookies))];
362*4882a593Smuzhiyun 	struct rds_zcopy_cookies *ck;
363*4882a593Smuzhiyun 	struct cmsghdr *cmsg;
364*4882a593Smuzhiyun 	struct msghdr msg;
365*4882a593Smuzhiyun 	bool ret = false;
366*4882a593Smuzhiyun 
367*4882a593Smuzhiyun 	memset(&msg, 0, sizeof(msg));
368*4882a593Smuzhiyun 	msg.msg_control = cmsgbuf;
369*4882a593Smuzhiyun 	msg.msg_controllen = sizeof(cmsgbuf);
370*4882a593Smuzhiyun 
371*4882a593Smuzhiyun 	if (recvmsg(fd, &msg, MSG_DONTWAIT))
372*4882a593Smuzhiyun 		return ret;
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	if (msg.msg_flags & MSG_CTRUNC)
375*4882a593Smuzhiyun 		error(1, errno, "recvmsg notification: truncated");
376*4882a593Smuzhiyun 
377*4882a593Smuzhiyun 	for (cmsg = CMSG_FIRSTHDR(&msg); cmsg; cmsg = CMSG_NXTHDR(&msg, cmsg)) {
378*4882a593Smuzhiyun 		if (cmsg->cmsg_level == SOL_RDS &&
379*4882a593Smuzhiyun 		    cmsg->cmsg_type == RDS_CMSG_ZCOPY_COMPLETION) {
380*4882a593Smuzhiyun 
381*4882a593Smuzhiyun 			ck = (struct rds_zcopy_cookies *)CMSG_DATA(cmsg);
382*4882a593Smuzhiyun 			completions += do_process_zerocopy_cookies(ck);
383*4882a593Smuzhiyun 			ret = true;
384*4882a593Smuzhiyun 			break;
385*4882a593Smuzhiyun 		}
386*4882a593Smuzhiyun 		error(0, 0, "ignoring cmsg at level %d type %d\n",
387*4882a593Smuzhiyun 			    cmsg->cmsg_level, cmsg->cmsg_type);
388*4882a593Smuzhiyun 	}
389*4882a593Smuzhiyun 	return ret;
390*4882a593Smuzhiyun }
391*4882a593Smuzhiyun 
do_recv_completion(int fd,int domain)392*4882a593Smuzhiyun static bool do_recv_completion(int fd, int domain)
393*4882a593Smuzhiyun {
394*4882a593Smuzhiyun 	struct sock_extended_err *serr;
395*4882a593Smuzhiyun 	struct msghdr msg = {};
396*4882a593Smuzhiyun 	struct cmsghdr *cm;
397*4882a593Smuzhiyun 	uint32_t hi, lo, range;
398*4882a593Smuzhiyun 	int ret, zerocopy;
399*4882a593Smuzhiyun 	char control[100];
400*4882a593Smuzhiyun 
401*4882a593Smuzhiyun 	if (domain == PF_RDS)
402*4882a593Smuzhiyun 		return do_recvmsg_completion(fd);
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun 	msg.msg_control = control;
405*4882a593Smuzhiyun 	msg.msg_controllen = sizeof(control);
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 	ret = recvmsg(fd, &msg, MSG_ERRQUEUE);
408*4882a593Smuzhiyun 	if (ret == -1 && errno == EAGAIN)
409*4882a593Smuzhiyun 		return false;
410*4882a593Smuzhiyun 	if (ret == -1)
411*4882a593Smuzhiyun 		error(1, errno, "recvmsg notification");
412*4882a593Smuzhiyun 	if (msg.msg_flags & MSG_CTRUNC)
413*4882a593Smuzhiyun 		error(1, errno, "recvmsg notification: truncated");
414*4882a593Smuzhiyun 
415*4882a593Smuzhiyun 	cm = CMSG_FIRSTHDR(&msg);
416*4882a593Smuzhiyun 	if (!cm)
417*4882a593Smuzhiyun 		error(1, 0, "cmsg: no cmsg");
418*4882a593Smuzhiyun 	if (!((cm->cmsg_level == SOL_IP && cm->cmsg_type == IP_RECVERR) ||
419*4882a593Smuzhiyun 	      (cm->cmsg_level == SOL_IPV6 && cm->cmsg_type == IPV6_RECVERR) ||
420*4882a593Smuzhiyun 	      (cm->cmsg_level == SOL_PACKET && cm->cmsg_type == PACKET_TX_TIMESTAMP)))
421*4882a593Smuzhiyun 		error(1, 0, "serr: wrong type: %d.%d",
422*4882a593Smuzhiyun 		      cm->cmsg_level, cm->cmsg_type);
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	serr = (void *) CMSG_DATA(cm);
425*4882a593Smuzhiyun 
426*4882a593Smuzhiyun 	if (serr->ee_origin != SO_EE_ORIGIN_ZEROCOPY)
427*4882a593Smuzhiyun 		error(1, 0, "serr: wrong origin: %u", serr->ee_origin);
428*4882a593Smuzhiyun 	if (serr->ee_errno != 0)
429*4882a593Smuzhiyun 		error(1, 0, "serr: wrong error code: %u", serr->ee_errno);
430*4882a593Smuzhiyun 
431*4882a593Smuzhiyun 	hi = serr->ee_data;
432*4882a593Smuzhiyun 	lo = serr->ee_info;
433*4882a593Smuzhiyun 	range = hi - lo + 1;
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	/* Detect notification gaps. These should not happen often, if at all.
436*4882a593Smuzhiyun 	 * Gaps can occur due to drops, reordering and retransmissions.
437*4882a593Smuzhiyun 	 */
438*4882a593Smuzhiyun 	if (lo != next_completion)
439*4882a593Smuzhiyun 		fprintf(stderr, "gap: %u..%u does not append to %u\n",
440*4882a593Smuzhiyun 			lo, hi, next_completion);
441*4882a593Smuzhiyun 	next_completion = hi + 1;
442*4882a593Smuzhiyun 
443*4882a593Smuzhiyun 	zerocopy = !(serr->ee_code & SO_EE_CODE_ZEROCOPY_COPIED);
444*4882a593Smuzhiyun 	if (zerocopied == -1)
445*4882a593Smuzhiyun 		zerocopied = zerocopy;
446*4882a593Smuzhiyun 	else if (zerocopied != zerocopy) {
447*4882a593Smuzhiyun 		fprintf(stderr, "serr: inconsistent\n");
448*4882a593Smuzhiyun 		zerocopied = zerocopy;
449*4882a593Smuzhiyun 	}
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	if (cfg_verbose >= 2)
452*4882a593Smuzhiyun 		fprintf(stderr, "completed: %u (h=%u l=%u)\n",
453*4882a593Smuzhiyun 			range, hi, lo);
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun 	completions += range;
456*4882a593Smuzhiyun 	return true;
457*4882a593Smuzhiyun }
458*4882a593Smuzhiyun 
/* Drain the errqueue: keep reading notifications until none is left */
static void do_recv_completions(int fd, int domain)
{
	bool more;

	do {
		more = do_recv_completion(fd, domain);
	} while (more);
}
464*4882a593Smuzhiyun 
465*4882a593Smuzhiyun /* Wait for all remaining completions on the errqueue */
do_recv_remaining_completions(int fd,int domain)466*4882a593Smuzhiyun static void do_recv_remaining_completions(int fd, int domain)
467*4882a593Smuzhiyun {
468*4882a593Smuzhiyun 	int64_t tstop = gettimeofday_ms() + cfg_waittime_ms;
469*4882a593Smuzhiyun 
470*4882a593Smuzhiyun 	while (completions < expected_completions &&
471*4882a593Smuzhiyun 	       gettimeofday_ms() < tstop) {
472*4882a593Smuzhiyun 		if (do_poll(fd, domain == PF_RDS ? POLLIN : POLLERR))
473*4882a593Smuzhiyun 			do_recv_completions(fd, domain);
474*4882a593Smuzhiyun 	}
475*4882a593Smuzhiyun 
476*4882a593Smuzhiyun 	if (completions < expected_completions)
477*4882a593Smuzhiyun 		fprintf(stderr, "missing notifications: %lu < %lu\n",
478*4882a593Smuzhiyun 			completions, expected_completions);
479*4882a593Smuzhiyun }
480*4882a593Smuzhiyun 
do_tx(int domain,int type,int protocol)481*4882a593Smuzhiyun static void do_tx(int domain, int type, int protocol)
482*4882a593Smuzhiyun {
483*4882a593Smuzhiyun 	struct iovec iov[3] = { {0} };
484*4882a593Smuzhiyun 	struct sockaddr_ll laddr;
485*4882a593Smuzhiyun 	struct msghdr msg = {0};
486*4882a593Smuzhiyun 	struct ethhdr eth;
487*4882a593Smuzhiyun 	union {
488*4882a593Smuzhiyun 		struct ipv6hdr ip6h;
489*4882a593Smuzhiyun 		struct iphdr iph;
490*4882a593Smuzhiyun 	} nh;
491*4882a593Smuzhiyun 	uint64_t tstop;
492*4882a593Smuzhiyun 	int fd;
493*4882a593Smuzhiyun 
494*4882a593Smuzhiyun 	fd = do_setup_tx(domain, type, protocol);
495*4882a593Smuzhiyun 
496*4882a593Smuzhiyun 	if (domain == PF_PACKET) {
497*4882a593Smuzhiyun 		uint16_t proto = cfg_family == PF_INET ? ETH_P_IP : ETH_P_IPV6;
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 		/* sock_raw passes ll header as data */
500*4882a593Smuzhiyun 		if (type == SOCK_RAW) {
501*4882a593Smuzhiyun 			memset(eth.h_dest, 0x06, ETH_ALEN);
502*4882a593Smuzhiyun 			memset(eth.h_source, 0x02, ETH_ALEN);
503*4882a593Smuzhiyun 			eth.h_proto = htons(proto);
504*4882a593Smuzhiyun 			iov[0].iov_base = &eth;
505*4882a593Smuzhiyun 			iov[0].iov_len = sizeof(eth);
506*4882a593Smuzhiyun 			msg.msg_iovlen++;
507*4882a593Smuzhiyun 		}
508*4882a593Smuzhiyun 
509*4882a593Smuzhiyun 		/* both sock_raw and sock_dgram expect name */
510*4882a593Smuzhiyun 		memset(&laddr, 0, sizeof(laddr));
511*4882a593Smuzhiyun 		laddr.sll_family	= AF_PACKET;
512*4882a593Smuzhiyun 		laddr.sll_ifindex	= cfg_ifindex;
513*4882a593Smuzhiyun 		laddr.sll_protocol	= htons(proto);
514*4882a593Smuzhiyun 		laddr.sll_halen		= ETH_ALEN;
515*4882a593Smuzhiyun 
516*4882a593Smuzhiyun 		memset(laddr.sll_addr, 0x06, ETH_ALEN);
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 		msg.msg_name		= &laddr;
519*4882a593Smuzhiyun 		msg.msg_namelen		= sizeof(laddr);
520*4882a593Smuzhiyun 	}
521*4882a593Smuzhiyun 
522*4882a593Smuzhiyun 	/* packet and raw sockets with hdrincl must pass network header */
523*4882a593Smuzhiyun 	if (domain == PF_PACKET || protocol == IPPROTO_RAW) {
524*4882a593Smuzhiyun 		if (cfg_family == PF_INET)
525*4882a593Smuzhiyun 			iov[1].iov_len = setup_iph(&nh.iph, cfg_payload_len);
526*4882a593Smuzhiyun 		else
527*4882a593Smuzhiyun 			iov[1].iov_len = setup_ip6h(&nh.ip6h, cfg_payload_len);
528*4882a593Smuzhiyun 
529*4882a593Smuzhiyun 		iov[1].iov_base = (void *) &nh;
530*4882a593Smuzhiyun 		msg.msg_iovlen++;
531*4882a593Smuzhiyun 	}
532*4882a593Smuzhiyun 
533*4882a593Smuzhiyun 	if (domain == PF_RDS) {
534*4882a593Smuzhiyun 		msg.msg_name = &cfg_dst_addr;
535*4882a593Smuzhiyun 		msg.msg_namelen =  (cfg_dst_addr.ss_family == AF_INET ?
536*4882a593Smuzhiyun 				    sizeof(struct sockaddr_in) :
537*4882a593Smuzhiyun 				    sizeof(struct sockaddr_in6));
538*4882a593Smuzhiyun 	}
539*4882a593Smuzhiyun 
540*4882a593Smuzhiyun 	iov[2].iov_base = payload;
541*4882a593Smuzhiyun 	iov[2].iov_len = cfg_payload_len;
542*4882a593Smuzhiyun 	msg.msg_iovlen++;
543*4882a593Smuzhiyun 	msg.msg_iov = &iov[3 - msg.msg_iovlen];
544*4882a593Smuzhiyun 
545*4882a593Smuzhiyun 	tstop = gettimeofday_ms() + cfg_runtime_ms;
546*4882a593Smuzhiyun 	do {
547*4882a593Smuzhiyun 		if (cfg_cork)
548*4882a593Smuzhiyun 			do_sendmsg_corked(fd, &msg);
549*4882a593Smuzhiyun 		else
550*4882a593Smuzhiyun 			do_sendmsg(fd, &msg, cfg_zerocopy, domain);
551*4882a593Smuzhiyun 
552*4882a593Smuzhiyun 		while (!do_poll(fd, POLLOUT)) {
553*4882a593Smuzhiyun 			if (cfg_zerocopy)
554*4882a593Smuzhiyun 				do_recv_completions(fd, domain);
555*4882a593Smuzhiyun 		}
556*4882a593Smuzhiyun 
557*4882a593Smuzhiyun 	} while (gettimeofday_ms() < tstop);
558*4882a593Smuzhiyun 
559*4882a593Smuzhiyun 	if (cfg_zerocopy)
560*4882a593Smuzhiyun 		do_recv_remaining_completions(fd, domain);
561*4882a593Smuzhiyun 
562*4882a593Smuzhiyun 	if (close(fd))
563*4882a593Smuzhiyun 		error(1, errno, "close");
564*4882a593Smuzhiyun 
565*4882a593Smuzhiyun 	fprintf(stderr, "tx=%lu (%lu MB) txc=%lu zc=%c\n",
566*4882a593Smuzhiyun 		packets, bytes >> 20, completions,
567*4882a593Smuzhiyun 		zerocopied == 1 ? 'y' : 'n');
568*4882a593Smuzhiyun }
569*4882a593Smuzhiyun 
do_setup_rx(int domain,int type,int protocol)570*4882a593Smuzhiyun static int do_setup_rx(int domain, int type, int protocol)
571*4882a593Smuzhiyun {
572*4882a593Smuzhiyun 	int fd;
573*4882a593Smuzhiyun 
574*4882a593Smuzhiyun 	/* If tx over PF_PACKET, rx over PF_INET(6)/SOCK_RAW,
575*4882a593Smuzhiyun 	 * to recv the only copy of the packet, not a clone
576*4882a593Smuzhiyun 	 */
577*4882a593Smuzhiyun 	if (domain == PF_PACKET)
578*4882a593Smuzhiyun 		error(1, 0, "Use PF_INET/SOCK_RAW to read");
579*4882a593Smuzhiyun 
580*4882a593Smuzhiyun 	if (type == SOCK_RAW && protocol == IPPROTO_RAW)
581*4882a593Smuzhiyun 		error(1, 0, "IPPROTO_RAW: not supported on Rx");
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 	fd = socket(domain, type, protocol);
584*4882a593Smuzhiyun 	if (fd == -1)
585*4882a593Smuzhiyun 		error(1, errno, "socket r");
586*4882a593Smuzhiyun 
587*4882a593Smuzhiyun 	do_setsockopt(fd, SOL_SOCKET, SO_RCVBUF, 1 << 21);
588*4882a593Smuzhiyun 	do_setsockopt(fd, SOL_SOCKET, SO_RCVLOWAT, 1 << 16);
589*4882a593Smuzhiyun 	do_setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, 1);
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 	if (bind(fd, (void *) &cfg_dst_addr, cfg_alen))
592*4882a593Smuzhiyun 		error(1, errno, "bind");
593*4882a593Smuzhiyun 
594*4882a593Smuzhiyun 	if (type == SOCK_STREAM) {
595*4882a593Smuzhiyun 		if (listen(fd, 1))
596*4882a593Smuzhiyun 			error(1, errno, "listen");
597*4882a593Smuzhiyun 		fd = do_accept(fd);
598*4882a593Smuzhiyun 	}
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun 	return fd;
601*4882a593Smuzhiyun }
602*4882a593Smuzhiyun 
603*4882a593Smuzhiyun /* Flush all outstanding bytes for the tcp receive queue */
do_flush_tcp(int fd)604*4882a593Smuzhiyun static void do_flush_tcp(int fd)
605*4882a593Smuzhiyun {
606*4882a593Smuzhiyun 	int ret;
607*4882a593Smuzhiyun 
608*4882a593Smuzhiyun 	/* MSG_TRUNC flushes up to len bytes */
609*4882a593Smuzhiyun 	ret = recv(fd, NULL, 1 << 21, MSG_TRUNC | MSG_DONTWAIT);
610*4882a593Smuzhiyun 	if (ret == -1 && errno == EAGAIN)
611*4882a593Smuzhiyun 		return;
612*4882a593Smuzhiyun 	if (ret == -1)
613*4882a593Smuzhiyun 		error(1, errno, "flush");
614*4882a593Smuzhiyun 	if (!ret)
615*4882a593Smuzhiyun 		return;
616*4882a593Smuzhiyun 
617*4882a593Smuzhiyun 	packets++;
618*4882a593Smuzhiyun 	bytes += ret;
619*4882a593Smuzhiyun }
620*4882a593Smuzhiyun 
621*4882a593Smuzhiyun /* Flush all outstanding datagrams. Verify first few bytes of each. */
do_flush_datagram(int fd,int type)622*4882a593Smuzhiyun static void do_flush_datagram(int fd, int type)
623*4882a593Smuzhiyun {
624*4882a593Smuzhiyun 	int ret, off = 0;
625*4882a593Smuzhiyun 	char buf[64];
626*4882a593Smuzhiyun 
627*4882a593Smuzhiyun 	/* MSG_TRUNC will return full datagram length */
628*4882a593Smuzhiyun 	ret = recv(fd, buf, sizeof(buf), MSG_DONTWAIT | MSG_TRUNC);
629*4882a593Smuzhiyun 	if (ret == -1 && errno == EAGAIN)
630*4882a593Smuzhiyun 		return;
631*4882a593Smuzhiyun 
632*4882a593Smuzhiyun 	/* raw ipv4 return with header, raw ipv6 without */
633*4882a593Smuzhiyun 	if (cfg_family == PF_INET && type == SOCK_RAW) {
634*4882a593Smuzhiyun 		off += sizeof(struct iphdr);
635*4882a593Smuzhiyun 		ret -= sizeof(struct iphdr);
636*4882a593Smuzhiyun 	}
637*4882a593Smuzhiyun 
638*4882a593Smuzhiyun 	if (ret == -1)
639*4882a593Smuzhiyun 		error(1, errno, "recv");
640*4882a593Smuzhiyun 	if (ret != cfg_payload_len)
641*4882a593Smuzhiyun 		error(1, 0, "recv: ret=%u != %u", ret, cfg_payload_len);
642*4882a593Smuzhiyun 	if (ret > sizeof(buf) - off)
643*4882a593Smuzhiyun 		ret = sizeof(buf) - off;
644*4882a593Smuzhiyun 	if (memcmp(buf + off, payload, ret))
645*4882a593Smuzhiyun 		error(1, 0, "recv: data mismatch");
646*4882a593Smuzhiyun 
647*4882a593Smuzhiyun 	packets++;
648*4882a593Smuzhiyun 	bytes += cfg_payload_len;
649*4882a593Smuzhiyun }
650*4882a593Smuzhiyun 
do_rx(int domain,int type,int protocol)651*4882a593Smuzhiyun static void do_rx(int domain, int type, int protocol)
652*4882a593Smuzhiyun {
653*4882a593Smuzhiyun 	const int cfg_receiver_wait_ms = 400;
654*4882a593Smuzhiyun 	uint64_t tstop;
655*4882a593Smuzhiyun 	int fd;
656*4882a593Smuzhiyun 
657*4882a593Smuzhiyun 	fd = do_setup_rx(domain, type, protocol);
658*4882a593Smuzhiyun 
659*4882a593Smuzhiyun 	tstop = gettimeofday_ms() + cfg_runtime_ms + cfg_receiver_wait_ms;
660*4882a593Smuzhiyun 	do {
661*4882a593Smuzhiyun 		if (type == SOCK_STREAM)
662*4882a593Smuzhiyun 			do_flush_tcp(fd);
663*4882a593Smuzhiyun 		else
664*4882a593Smuzhiyun 			do_flush_datagram(fd, type);
665*4882a593Smuzhiyun 
666*4882a593Smuzhiyun 		do_poll(fd, POLLIN);
667*4882a593Smuzhiyun 
668*4882a593Smuzhiyun 	} while (gettimeofday_ms() < tstop);
669*4882a593Smuzhiyun 
670*4882a593Smuzhiyun 	if (close(fd))
671*4882a593Smuzhiyun 		error(1, errno, "close");
672*4882a593Smuzhiyun 
673*4882a593Smuzhiyun 	fprintf(stderr, "rx=%lu (%lu MB)\n", packets, bytes >> 20);
674*4882a593Smuzhiyun }
675*4882a593Smuzhiyun 
do_test(int domain,int type,int protocol)676*4882a593Smuzhiyun static void do_test(int domain, int type, int protocol)
677*4882a593Smuzhiyun {
678*4882a593Smuzhiyun 	int i;
679*4882a593Smuzhiyun 
680*4882a593Smuzhiyun 	if (cfg_cork && (domain == PF_PACKET || type != SOCK_DGRAM))
681*4882a593Smuzhiyun 		error(1, 0, "can only cork udp sockets");
682*4882a593Smuzhiyun 
683*4882a593Smuzhiyun 	do_setcpu(cfg_cpu);
684*4882a593Smuzhiyun 
685*4882a593Smuzhiyun 	for (i = 0; i < IP_MAXPACKET; i++)
686*4882a593Smuzhiyun 		payload[i] = 'a' + (i % 26);
687*4882a593Smuzhiyun 
688*4882a593Smuzhiyun 	if (cfg_rx)
689*4882a593Smuzhiyun 		do_rx(domain, type, protocol);
690*4882a593Smuzhiyun 	else
691*4882a593Smuzhiyun 		do_tx(domain, type, protocol);
692*4882a593Smuzhiyun }
693*4882a593Smuzhiyun 
usage(const char * filepath)694*4882a593Smuzhiyun static void usage(const char *filepath)
695*4882a593Smuzhiyun {
696*4882a593Smuzhiyun 	error(1, 0, "Usage: %s [options] <test>", filepath);
697*4882a593Smuzhiyun }
698*4882a593Smuzhiyun 
parse_opts(int argc,char ** argv)699*4882a593Smuzhiyun static void parse_opts(int argc, char **argv)
700*4882a593Smuzhiyun {
701*4882a593Smuzhiyun 	const int max_payload_len = sizeof(payload) -
702*4882a593Smuzhiyun 				    sizeof(struct ipv6hdr) -
703*4882a593Smuzhiyun 				    sizeof(struct tcphdr) -
704*4882a593Smuzhiyun 				    40 /* max tcp options */;
705*4882a593Smuzhiyun 	int c;
706*4882a593Smuzhiyun 	char *daddr = NULL, *saddr = NULL;
707*4882a593Smuzhiyun 	char *cfg_test;
708*4882a593Smuzhiyun 
709*4882a593Smuzhiyun 	cfg_payload_len = max_payload_len;
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun 	while ((c = getopt(argc, argv, "46c:C:D:i:mp:rs:S:t:vz")) != -1) {
712*4882a593Smuzhiyun 		switch (c) {
713*4882a593Smuzhiyun 		case '4':
714*4882a593Smuzhiyun 			if (cfg_family != PF_UNSPEC)
715*4882a593Smuzhiyun 				error(1, 0, "Pass one of -4 or -6");
716*4882a593Smuzhiyun 			cfg_family = PF_INET;
717*4882a593Smuzhiyun 			cfg_alen = sizeof(struct sockaddr_in);
718*4882a593Smuzhiyun 			break;
719*4882a593Smuzhiyun 		case '6':
720*4882a593Smuzhiyun 			if (cfg_family != PF_UNSPEC)
721*4882a593Smuzhiyun 				error(1, 0, "Pass one of -4 or -6");
722*4882a593Smuzhiyun 			cfg_family = PF_INET6;
723*4882a593Smuzhiyun 			cfg_alen = sizeof(struct sockaddr_in6);
724*4882a593Smuzhiyun 			break;
725*4882a593Smuzhiyun 		case 'c':
726*4882a593Smuzhiyun 			cfg_cork = strtol(optarg, NULL, 0);
727*4882a593Smuzhiyun 			break;
728*4882a593Smuzhiyun 		case 'C':
729*4882a593Smuzhiyun 			cfg_cpu = strtol(optarg, NULL, 0);
730*4882a593Smuzhiyun 			break;
731*4882a593Smuzhiyun 		case 'D':
732*4882a593Smuzhiyun 			daddr = optarg;
733*4882a593Smuzhiyun 			break;
734*4882a593Smuzhiyun 		case 'i':
735*4882a593Smuzhiyun 			cfg_ifindex = if_nametoindex(optarg);
736*4882a593Smuzhiyun 			if (cfg_ifindex == 0)
737*4882a593Smuzhiyun 				error(1, errno, "invalid iface: %s", optarg);
738*4882a593Smuzhiyun 			break;
739*4882a593Smuzhiyun 		case 'm':
740*4882a593Smuzhiyun 			cfg_cork_mixed = true;
741*4882a593Smuzhiyun 			break;
742*4882a593Smuzhiyun 		case 'p':
743*4882a593Smuzhiyun 			cfg_port = strtoul(optarg, NULL, 0);
744*4882a593Smuzhiyun 			break;
745*4882a593Smuzhiyun 		case 'r':
746*4882a593Smuzhiyun 			cfg_rx = true;
747*4882a593Smuzhiyun 			break;
748*4882a593Smuzhiyun 		case 's':
749*4882a593Smuzhiyun 			cfg_payload_len = strtoul(optarg, NULL, 0);
750*4882a593Smuzhiyun 			break;
751*4882a593Smuzhiyun 		case 'S':
752*4882a593Smuzhiyun 			saddr = optarg;
753*4882a593Smuzhiyun 			break;
754*4882a593Smuzhiyun 		case 't':
755*4882a593Smuzhiyun 			cfg_runtime_ms = 200 + strtoul(optarg, NULL, 10) * 1000;
756*4882a593Smuzhiyun 			break;
757*4882a593Smuzhiyun 		case 'v':
758*4882a593Smuzhiyun 			cfg_verbose++;
759*4882a593Smuzhiyun 			break;
760*4882a593Smuzhiyun 		case 'z':
761*4882a593Smuzhiyun 			cfg_zerocopy = true;
762*4882a593Smuzhiyun 			break;
763*4882a593Smuzhiyun 		}
764*4882a593Smuzhiyun 	}
765*4882a593Smuzhiyun 
766*4882a593Smuzhiyun 	cfg_test = argv[argc - 1];
767*4882a593Smuzhiyun 	if (strcmp(cfg_test, "rds") == 0) {
768*4882a593Smuzhiyun 		if (!daddr)
769*4882a593Smuzhiyun 			error(1, 0, "-D <server addr> required for PF_RDS\n");
770*4882a593Smuzhiyun 		if (!cfg_rx && !saddr)
771*4882a593Smuzhiyun 			error(1, 0, "-S <client addr> required for PF_RDS\n");
772*4882a593Smuzhiyun 	}
773*4882a593Smuzhiyun 	setup_sockaddr(cfg_family, daddr, &cfg_dst_addr);
774*4882a593Smuzhiyun 	setup_sockaddr(cfg_family, saddr, &cfg_src_addr);
775*4882a593Smuzhiyun 
776*4882a593Smuzhiyun 	if (cfg_payload_len > max_payload_len)
777*4882a593Smuzhiyun 		error(1, 0, "-s: payload exceeds max (%d)", max_payload_len);
778*4882a593Smuzhiyun 	if (cfg_cork_mixed && (!cfg_zerocopy || !cfg_cork))
779*4882a593Smuzhiyun 		error(1, 0, "-m: cork_mixed requires corking and zerocopy");
780*4882a593Smuzhiyun 
781*4882a593Smuzhiyun 	if (optind != argc - 1)
782*4882a593Smuzhiyun 		usage(argv[0]);
783*4882a593Smuzhiyun }
784*4882a593Smuzhiyun 
main(int argc,char ** argv)785*4882a593Smuzhiyun int main(int argc, char **argv)
786*4882a593Smuzhiyun {
787*4882a593Smuzhiyun 	const char *cfg_test;
788*4882a593Smuzhiyun 
789*4882a593Smuzhiyun 	parse_opts(argc, argv);
790*4882a593Smuzhiyun 
791*4882a593Smuzhiyun 	cfg_test = argv[argc - 1];
792*4882a593Smuzhiyun 
793*4882a593Smuzhiyun 	if (!strcmp(cfg_test, "packet"))
794*4882a593Smuzhiyun 		do_test(PF_PACKET, SOCK_RAW, 0);
795*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "packet_dgram"))
796*4882a593Smuzhiyun 		do_test(PF_PACKET, SOCK_DGRAM, 0);
797*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "raw"))
798*4882a593Smuzhiyun 		do_test(cfg_family, SOCK_RAW, IPPROTO_EGP);
799*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "raw_hdrincl"))
800*4882a593Smuzhiyun 		do_test(cfg_family, SOCK_RAW, IPPROTO_RAW);
801*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "tcp"))
802*4882a593Smuzhiyun 		do_test(cfg_family, SOCK_STREAM, 0);
803*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "udp"))
804*4882a593Smuzhiyun 		do_test(cfg_family, SOCK_DGRAM, 0);
805*4882a593Smuzhiyun 	else if (!strcmp(cfg_test, "rds"))
806*4882a593Smuzhiyun 		do_test(PF_RDS, SOCK_SEQPACKET, 0);
807*4882a593Smuzhiyun 	else
808*4882a593Smuzhiyun 		error(1, 0, "unknown cfg_test %s", cfg_test);
809*4882a593Smuzhiyun 
810*4882a593Smuzhiyun 	return 0;
811*4882a593Smuzhiyun }
812