xref: /OK3568_Linux_fs/kernel/tools/testing/selftests/net/udpgso_bench_tx.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun 
3*4882a593Smuzhiyun #define _GNU_SOURCE
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun #include <arpa/inet.h>
6*4882a593Smuzhiyun #include <errno.h>
7*4882a593Smuzhiyun #include <error.h>
8*4882a593Smuzhiyun #include <linux/errqueue.h>
9*4882a593Smuzhiyun #include <linux/net_tstamp.h>
10*4882a593Smuzhiyun #include <netinet/if_ether.h>
11*4882a593Smuzhiyun #include <netinet/in.h>
12*4882a593Smuzhiyun #include <netinet/ip.h>
13*4882a593Smuzhiyun #include <netinet/ip6.h>
14*4882a593Smuzhiyun #include <netinet/udp.h>
15*4882a593Smuzhiyun #include <poll.h>
16*4882a593Smuzhiyun #include <sched.h>
17*4882a593Smuzhiyun #include <signal.h>
18*4882a593Smuzhiyun #include <stdbool.h>
19*4882a593Smuzhiyun #include <stdio.h>
20*4882a593Smuzhiyun #include <stdlib.h>
21*4882a593Smuzhiyun #include <string.h>
22*4882a593Smuzhiyun #include <sys/socket.h>
23*4882a593Smuzhiyun #include <sys/time.h>
24*4882a593Smuzhiyun #include <sys/poll.h>
25*4882a593Smuzhiyun #include <sys/types.h>
26*4882a593Smuzhiyun #include <unistd.h>
27*4882a593Smuzhiyun 
28*4882a593Smuzhiyun #include "../kselftest.h"
29*4882a593Smuzhiyun 
/* Fallback values for constants the installed headers may not provide. */
#ifndef ETH_MAX_MTU
#define ETH_MAX_MTU 0xFFFFU
#endif

#ifndef UDP_SEGMENT
#define UDP_SEGMENT		103
#endif

#ifndef SO_ZEROCOPY
#define SO_ZEROCOPY	60
#endif

#ifndef SO_EE_ORIGIN_ZEROCOPY
#define SO_EE_ORIGIN_ZEROCOPY 5
#endif

#ifndef MSG_ZEROCOPY
#define MSG_ZEROCOPY	0x4000000
#endif

#ifndef ENOTSUPP
#define ENOTSUPP	524
#endif

/* Number of payload buffers in buf[] */
#define NUM_PKT		100

/* Configuration, set from the command line by parse_opts() */
static bool	cfg_cache_trash;
static int	cfg_cpu		= -1;	/* -1: do not pin to a CPU */
static bool	cfg_connected	= true;
static int	cfg_family	= PF_UNSPEC;
static uint16_t	cfg_mss;
static int	cfg_payload_len	= (1472 * 42);
static int	cfg_port	= 8000;
static int	cfg_runtime_ms	= -1;	/* -1: run until interrupted */
static bool	cfg_poll;
static bool	cfg_segment;
static bool	cfg_sendmmsg;
static bool	cfg_tcp;
static uint32_t	cfg_tx_ts = SOF_TIMESTAMPING_TX_SOFTWARE;
static bool	cfg_tx_tstamp;
static bool	cfg_audit;
static bool	cfg_verbose;
static bool	cfg_zerocopy;
static int	cfg_msg_nr;
static uint16_t	cfg_gso_size;

/* Run-wide counters and timestamps used by the audit report */
static unsigned long total_num_msgs;
static unsigned long total_num_sends;
static unsigned long stat_tx_ts;
static unsigned long stat_tx_ts_errors;
static unsigned long tstart;
static unsigned long tend;
static unsigned long stat_zcopies;

/* Destination address and its length, as passed to connect()/sendto() */
static socklen_t cfg_alen;
static struct sockaddr_storage cfg_dst_addr;

/* Written by the SIGINT handler, read by the send loop in main() */
static volatile sig_atomic_t interrupted;
static char buf[NUM_PKT][ETH_MAX_MTU];
88*4882a593Smuzhiyun 
sigint_handler(int signum)89*4882a593Smuzhiyun static void sigint_handler(int signum)
90*4882a593Smuzhiyun {
91*4882a593Smuzhiyun 	if (signum == SIGINT)
92*4882a593Smuzhiyun 		interrupted = true;
93*4882a593Smuzhiyun }
94*4882a593Smuzhiyun 
/* Return the time reported by gettimeofday(), converted to milliseconds. */
static unsigned long gettimeofday_ms(void)
{
	struct timeval now;

	gettimeofday(&now, NULL);

	/* sub-second part scaled down, whole seconds scaled up */
	return (now.tv_usec / 1000) + (now.tv_sec * 1000);
}
102*4882a593Smuzhiyun 
/*
 * Restrict the calling process to run on @cpu only.
 *
 * Exits with status 1, reporting the errno from sched_setaffinity(), if the
 * affinity cannot be applied. Returns 0 otherwise.
 */
static int set_cpu(int cpu)
{
	cpu_set_t mask;

	CPU_ZERO(&mask);
	CPU_SET(cpu, &mask);
	if (sched_setaffinity(0, sizeof(mask), &mask))
		error(1, errno, "setaffinity %d", cpu);

	return 0;
}
114*4882a593Smuzhiyun 
setup_sockaddr(int domain,const char * str_addr,void * sockaddr)115*4882a593Smuzhiyun static void setup_sockaddr(int domain, const char *str_addr, void *sockaddr)
116*4882a593Smuzhiyun {
117*4882a593Smuzhiyun 	struct sockaddr_in6 *addr6 = (void *) sockaddr;
118*4882a593Smuzhiyun 	struct sockaddr_in *addr4 = (void *) sockaddr;
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun 	switch (domain) {
121*4882a593Smuzhiyun 	case PF_INET:
122*4882a593Smuzhiyun 		addr4->sin_family = AF_INET;
123*4882a593Smuzhiyun 		addr4->sin_port = htons(cfg_port);
124*4882a593Smuzhiyun 		if (inet_pton(AF_INET, str_addr, &(addr4->sin_addr)) != 1)
125*4882a593Smuzhiyun 			error(1, 0, "ipv4 parse error: %s", str_addr);
126*4882a593Smuzhiyun 		break;
127*4882a593Smuzhiyun 	case PF_INET6:
128*4882a593Smuzhiyun 		addr6->sin6_family = AF_INET6;
129*4882a593Smuzhiyun 		addr6->sin6_port = htons(cfg_port);
130*4882a593Smuzhiyun 		if (inet_pton(AF_INET6, str_addr, &(addr6->sin6_addr)) != 1)
131*4882a593Smuzhiyun 			error(1, 0, "ipv6 parse error: %s", str_addr);
132*4882a593Smuzhiyun 		break;
133*4882a593Smuzhiyun 	default:
134*4882a593Smuzhiyun 		error(1, 0, "illegal domain");
135*4882a593Smuzhiyun 	}
136*4882a593Smuzhiyun }
137*4882a593Smuzhiyun 
flush_cmsg(struct cmsghdr * cmsg)138*4882a593Smuzhiyun static void flush_cmsg(struct cmsghdr *cmsg)
139*4882a593Smuzhiyun {
140*4882a593Smuzhiyun 	struct sock_extended_err *err;
141*4882a593Smuzhiyun 	struct scm_timestamping *tss;
142*4882a593Smuzhiyun 	__u32 lo;
143*4882a593Smuzhiyun 	__u32 hi;
144*4882a593Smuzhiyun 	int i;
145*4882a593Smuzhiyun 
146*4882a593Smuzhiyun 	switch (cmsg->cmsg_level) {
147*4882a593Smuzhiyun 	case SOL_SOCKET:
148*4882a593Smuzhiyun 		if (cmsg->cmsg_type == SO_TIMESTAMPING) {
149*4882a593Smuzhiyun 			i = (cfg_tx_ts == SOF_TIMESTAMPING_TX_HARDWARE) ? 2 : 0;
150*4882a593Smuzhiyun 			tss = (struct scm_timestamping *)CMSG_DATA(cmsg);
151*4882a593Smuzhiyun 			if (tss->ts[i].tv_sec == 0)
152*4882a593Smuzhiyun 				stat_tx_ts_errors++;
153*4882a593Smuzhiyun 		} else {
154*4882a593Smuzhiyun 			error(1, 0, "unknown SOL_SOCKET cmsg type=%u\n",
155*4882a593Smuzhiyun 			      cmsg->cmsg_type);
156*4882a593Smuzhiyun 		}
157*4882a593Smuzhiyun 		break;
158*4882a593Smuzhiyun 	case SOL_IP:
159*4882a593Smuzhiyun 	case SOL_IPV6:
160*4882a593Smuzhiyun 		switch (cmsg->cmsg_type) {
161*4882a593Smuzhiyun 		case IP_RECVERR:
162*4882a593Smuzhiyun 		case IPV6_RECVERR:
163*4882a593Smuzhiyun 		{
164*4882a593Smuzhiyun 			err = (struct sock_extended_err *)CMSG_DATA(cmsg);
165*4882a593Smuzhiyun 			switch (err->ee_origin) {
166*4882a593Smuzhiyun 			case SO_EE_ORIGIN_TIMESTAMPING:
167*4882a593Smuzhiyun 				/* Got a TX timestamp from error queue */
168*4882a593Smuzhiyun 				stat_tx_ts++;
169*4882a593Smuzhiyun 				break;
170*4882a593Smuzhiyun 			case SO_EE_ORIGIN_ICMP:
171*4882a593Smuzhiyun 			case SO_EE_ORIGIN_ICMP6:
172*4882a593Smuzhiyun 				if (cfg_verbose)
173*4882a593Smuzhiyun 					fprintf(stderr,
174*4882a593Smuzhiyun 						"received ICMP error: type=%u, code=%u\n",
175*4882a593Smuzhiyun 						err->ee_type, err->ee_code);
176*4882a593Smuzhiyun 				break;
177*4882a593Smuzhiyun 			case SO_EE_ORIGIN_ZEROCOPY:
178*4882a593Smuzhiyun 			{
179*4882a593Smuzhiyun 				lo = err->ee_info;
180*4882a593Smuzhiyun 				hi = err->ee_data;
181*4882a593Smuzhiyun 				/* range of IDs acknowledged */
182*4882a593Smuzhiyun 				stat_zcopies += hi - lo + 1;
183*4882a593Smuzhiyun 				break;
184*4882a593Smuzhiyun 			}
185*4882a593Smuzhiyun 			case SO_EE_ORIGIN_LOCAL:
186*4882a593Smuzhiyun 				if (cfg_verbose)
187*4882a593Smuzhiyun 					fprintf(stderr,
188*4882a593Smuzhiyun 						"received packet with local origin: %u\n",
189*4882a593Smuzhiyun 						err->ee_origin);
190*4882a593Smuzhiyun 				break;
191*4882a593Smuzhiyun 			default:
192*4882a593Smuzhiyun 				error(0, 1, "received packet with origin: %u",
193*4882a593Smuzhiyun 				      err->ee_origin);
194*4882a593Smuzhiyun 			}
195*4882a593Smuzhiyun 			break;
196*4882a593Smuzhiyun 		}
197*4882a593Smuzhiyun 		default:
198*4882a593Smuzhiyun 			error(0, 1, "unknown IP msg type=%u\n",
199*4882a593Smuzhiyun 			      cmsg->cmsg_type);
200*4882a593Smuzhiyun 			break;
201*4882a593Smuzhiyun 		}
202*4882a593Smuzhiyun 		break;
203*4882a593Smuzhiyun 	default:
204*4882a593Smuzhiyun 		error(0, 1, "unknown cmsg level=%u\n",
205*4882a593Smuzhiyun 		      cmsg->cmsg_level);
206*4882a593Smuzhiyun 	}
207*4882a593Smuzhiyun }
208*4882a593Smuzhiyun 
flush_errqueue_recv(int fd)209*4882a593Smuzhiyun static void flush_errqueue_recv(int fd)
210*4882a593Smuzhiyun {
211*4882a593Smuzhiyun 	char control[CMSG_SPACE(sizeof(struct scm_timestamping)) +
212*4882a593Smuzhiyun 		     CMSG_SPACE(sizeof(struct sock_extended_err)) +
213*4882a593Smuzhiyun 		     CMSG_SPACE(sizeof(struct sockaddr_in6))] = {0};
214*4882a593Smuzhiyun 	struct msghdr msg = {0};
215*4882a593Smuzhiyun 	struct cmsghdr *cmsg;
216*4882a593Smuzhiyun 	int ret;
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 	while (1) {
219*4882a593Smuzhiyun 		msg.msg_control = control;
220*4882a593Smuzhiyun 		msg.msg_controllen = sizeof(control);
221*4882a593Smuzhiyun 		ret = recvmsg(fd, &msg, MSG_ERRQUEUE);
222*4882a593Smuzhiyun 		if (ret == -1 && errno == EAGAIN)
223*4882a593Smuzhiyun 			break;
224*4882a593Smuzhiyun 		if (ret == -1)
225*4882a593Smuzhiyun 			error(1, errno, "errqueue");
226*4882a593Smuzhiyun 		if (msg.msg_flags != MSG_ERRQUEUE)
227*4882a593Smuzhiyun 			error(1, 0, "errqueue: flags 0x%x\n", msg.msg_flags);
228*4882a593Smuzhiyun 		if (cfg_audit) {
229*4882a593Smuzhiyun 			for (cmsg = CMSG_FIRSTHDR(&msg);
230*4882a593Smuzhiyun 					cmsg;
231*4882a593Smuzhiyun 					cmsg = CMSG_NXTHDR(&msg, cmsg))
232*4882a593Smuzhiyun 				flush_cmsg(cmsg);
233*4882a593Smuzhiyun 		}
234*4882a593Smuzhiyun 		msg.msg_flags = 0;
235*4882a593Smuzhiyun 	}
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun 
flush_errqueue(int fd,const bool do_poll)238*4882a593Smuzhiyun static void flush_errqueue(int fd, const bool do_poll)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun 	if (do_poll) {
241*4882a593Smuzhiyun 		struct pollfd fds = {0};
242*4882a593Smuzhiyun 		int ret;
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun 		fds.fd = fd;
245*4882a593Smuzhiyun 		ret = poll(&fds, 1, 500);
246*4882a593Smuzhiyun 		if (ret == 0) {
247*4882a593Smuzhiyun 			if (cfg_verbose)
248*4882a593Smuzhiyun 				fprintf(stderr, "poll timeout\n");
249*4882a593Smuzhiyun 		} else if (ret < 0) {
250*4882a593Smuzhiyun 			error(1, errno, "poll");
251*4882a593Smuzhiyun 		}
252*4882a593Smuzhiyun 	}
253*4882a593Smuzhiyun 
254*4882a593Smuzhiyun 	flush_errqueue_recv(fd);
255*4882a593Smuzhiyun }
256*4882a593Smuzhiyun 
send_tcp(int fd,char * data)257*4882a593Smuzhiyun static int send_tcp(int fd, char *data)
258*4882a593Smuzhiyun {
259*4882a593Smuzhiyun 	int ret, done = 0, count = 0;
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 	while (done < cfg_payload_len) {
262*4882a593Smuzhiyun 		ret = send(fd, data + done, cfg_payload_len - done,
263*4882a593Smuzhiyun 			   cfg_zerocopy ? MSG_ZEROCOPY : 0);
264*4882a593Smuzhiyun 		if (ret == -1)
265*4882a593Smuzhiyun 			error(1, errno, "write");
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 		done += ret;
268*4882a593Smuzhiyun 		count++;
269*4882a593Smuzhiyun 	}
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun 	return count;
272*4882a593Smuzhiyun }
273*4882a593Smuzhiyun 
send_udp(int fd,char * data)274*4882a593Smuzhiyun static int send_udp(int fd, char *data)
275*4882a593Smuzhiyun {
276*4882a593Smuzhiyun 	int ret, total_len, len, count = 0;
277*4882a593Smuzhiyun 
278*4882a593Smuzhiyun 	total_len = cfg_payload_len;
279*4882a593Smuzhiyun 
280*4882a593Smuzhiyun 	while (total_len) {
281*4882a593Smuzhiyun 		len = total_len < cfg_mss ? total_len : cfg_mss;
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun 		ret = sendto(fd, data, len, cfg_zerocopy ? MSG_ZEROCOPY : 0,
284*4882a593Smuzhiyun 			     cfg_connected ? NULL : (void *)&cfg_dst_addr,
285*4882a593Smuzhiyun 			     cfg_connected ? 0 : cfg_alen);
286*4882a593Smuzhiyun 		if (ret == -1)
287*4882a593Smuzhiyun 			error(1, errno, "write");
288*4882a593Smuzhiyun 		if (ret != len)
289*4882a593Smuzhiyun 			error(1, errno, "write: %uB != %uB\n", ret, len);
290*4882a593Smuzhiyun 
291*4882a593Smuzhiyun 		total_len -= len;
292*4882a593Smuzhiyun 		count++;
293*4882a593Smuzhiyun 	}
294*4882a593Smuzhiyun 
295*4882a593Smuzhiyun 	return count;
296*4882a593Smuzhiyun }
297*4882a593Smuzhiyun 
send_ts_cmsg(struct cmsghdr * cm)298*4882a593Smuzhiyun static void send_ts_cmsg(struct cmsghdr *cm)
299*4882a593Smuzhiyun {
300*4882a593Smuzhiyun 	uint32_t *valp;
301*4882a593Smuzhiyun 
302*4882a593Smuzhiyun 	cm->cmsg_level = SOL_SOCKET;
303*4882a593Smuzhiyun 	cm->cmsg_type = SO_TIMESTAMPING;
304*4882a593Smuzhiyun 	cm->cmsg_len = CMSG_LEN(sizeof(cfg_tx_ts));
305*4882a593Smuzhiyun 	valp = (void *)CMSG_DATA(cm);
306*4882a593Smuzhiyun 	*valp = cfg_tx_ts;
307*4882a593Smuzhiyun }
308*4882a593Smuzhiyun 
send_udp_sendmmsg(int fd,char * data)309*4882a593Smuzhiyun static int send_udp_sendmmsg(int fd, char *data)
310*4882a593Smuzhiyun {
311*4882a593Smuzhiyun 	char control[CMSG_SPACE(sizeof(cfg_tx_ts))] = {0};
312*4882a593Smuzhiyun 	const int max_nr_msg = ETH_MAX_MTU / ETH_DATA_LEN;
313*4882a593Smuzhiyun 	struct mmsghdr mmsgs[max_nr_msg];
314*4882a593Smuzhiyun 	struct iovec iov[max_nr_msg];
315*4882a593Smuzhiyun 	unsigned int off = 0, left;
316*4882a593Smuzhiyun 	size_t msg_controllen = 0;
317*4882a593Smuzhiyun 	int i = 0, ret;
318*4882a593Smuzhiyun 
319*4882a593Smuzhiyun 	memset(mmsgs, 0, sizeof(mmsgs));
320*4882a593Smuzhiyun 
321*4882a593Smuzhiyun 	if (cfg_tx_tstamp) {
322*4882a593Smuzhiyun 		struct msghdr msg = {0};
323*4882a593Smuzhiyun 		struct cmsghdr *cmsg;
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 		msg.msg_control = control;
326*4882a593Smuzhiyun 		msg.msg_controllen = sizeof(control);
327*4882a593Smuzhiyun 		cmsg = CMSG_FIRSTHDR(&msg);
328*4882a593Smuzhiyun 		send_ts_cmsg(cmsg);
329*4882a593Smuzhiyun 		msg_controllen += CMSG_SPACE(sizeof(cfg_tx_ts));
330*4882a593Smuzhiyun 	}
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun 	left = cfg_payload_len;
333*4882a593Smuzhiyun 	while (left) {
334*4882a593Smuzhiyun 		if (i == max_nr_msg)
335*4882a593Smuzhiyun 			error(1, 0, "sendmmsg: exceeds max_nr_msg");
336*4882a593Smuzhiyun 
337*4882a593Smuzhiyun 		iov[i].iov_base = data + off;
338*4882a593Smuzhiyun 		iov[i].iov_len = cfg_mss < left ? cfg_mss : left;
339*4882a593Smuzhiyun 
340*4882a593Smuzhiyun 		mmsgs[i].msg_hdr.msg_iov = iov + i;
341*4882a593Smuzhiyun 		mmsgs[i].msg_hdr.msg_iovlen = 1;
342*4882a593Smuzhiyun 
343*4882a593Smuzhiyun 		mmsgs[i].msg_hdr.msg_name = (void *)&cfg_dst_addr;
344*4882a593Smuzhiyun 		mmsgs[i].msg_hdr.msg_namelen = cfg_alen;
345*4882a593Smuzhiyun 		if (msg_controllen) {
346*4882a593Smuzhiyun 			mmsgs[i].msg_hdr.msg_control = control;
347*4882a593Smuzhiyun 			mmsgs[i].msg_hdr.msg_controllen = msg_controllen;
348*4882a593Smuzhiyun 		}
349*4882a593Smuzhiyun 
350*4882a593Smuzhiyun 		off += iov[i].iov_len;
351*4882a593Smuzhiyun 		left -= iov[i].iov_len;
352*4882a593Smuzhiyun 		i++;
353*4882a593Smuzhiyun 	}
354*4882a593Smuzhiyun 
355*4882a593Smuzhiyun 	ret = sendmmsg(fd, mmsgs, i, cfg_zerocopy ? MSG_ZEROCOPY : 0);
356*4882a593Smuzhiyun 	if (ret == -1)
357*4882a593Smuzhiyun 		error(1, errno, "sendmmsg");
358*4882a593Smuzhiyun 
359*4882a593Smuzhiyun 	return ret;
360*4882a593Smuzhiyun }
361*4882a593Smuzhiyun 
send_udp_segment_cmsg(struct cmsghdr * cm)362*4882a593Smuzhiyun static void send_udp_segment_cmsg(struct cmsghdr *cm)
363*4882a593Smuzhiyun {
364*4882a593Smuzhiyun 	uint16_t *valp;
365*4882a593Smuzhiyun 
366*4882a593Smuzhiyun 	cm->cmsg_level = SOL_UDP;
367*4882a593Smuzhiyun 	cm->cmsg_type = UDP_SEGMENT;
368*4882a593Smuzhiyun 	cm->cmsg_len = CMSG_LEN(sizeof(cfg_gso_size));
369*4882a593Smuzhiyun 	valp = (void *)CMSG_DATA(cm);
370*4882a593Smuzhiyun 	*valp = cfg_gso_size;
371*4882a593Smuzhiyun }
372*4882a593Smuzhiyun 
send_udp_segment(int fd,char * data)373*4882a593Smuzhiyun static int send_udp_segment(int fd, char *data)
374*4882a593Smuzhiyun {
375*4882a593Smuzhiyun 	char control[CMSG_SPACE(sizeof(cfg_gso_size)) +
376*4882a593Smuzhiyun 		     CMSG_SPACE(sizeof(cfg_tx_ts))] = {0};
377*4882a593Smuzhiyun 	struct msghdr msg = {0};
378*4882a593Smuzhiyun 	struct iovec iov = {0};
379*4882a593Smuzhiyun 	size_t msg_controllen;
380*4882a593Smuzhiyun 	struct cmsghdr *cmsg;
381*4882a593Smuzhiyun 	int ret;
382*4882a593Smuzhiyun 
383*4882a593Smuzhiyun 	iov.iov_base = data;
384*4882a593Smuzhiyun 	iov.iov_len = cfg_payload_len;
385*4882a593Smuzhiyun 
386*4882a593Smuzhiyun 	msg.msg_iov = &iov;
387*4882a593Smuzhiyun 	msg.msg_iovlen = 1;
388*4882a593Smuzhiyun 
389*4882a593Smuzhiyun 	msg.msg_control = control;
390*4882a593Smuzhiyun 	msg.msg_controllen = sizeof(control);
391*4882a593Smuzhiyun 	cmsg = CMSG_FIRSTHDR(&msg);
392*4882a593Smuzhiyun 	send_udp_segment_cmsg(cmsg);
393*4882a593Smuzhiyun 	msg_controllen = CMSG_SPACE(sizeof(cfg_mss));
394*4882a593Smuzhiyun 	if (cfg_tx_tstamp) {
395*4882a593Smuzhiyun 		cmsg = CMSG_NXTHDR(&msg, cmsg);
396*4882a593Smuzhiyun 		send_ts_cmsg(cmsg);
397*4882a593Smuzhiyun 		msg_controllen += CMSG_SPACE(sizeof(cfg_tx_ts));
398*4882a593Smuzhiyun 	}
399*4882a593Smuzhiyun 
400*4882a593Smuzhiyun 	msg.msg_controllen = msg_controllen;
401*4882a593Smuzhiyun 	msg.msg_name = (void *)&cfg_dst_addr;
402*4882a593Smuzhiyun 	msg.msg_namelen = cfg_alen;
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun 	ret = sendmsg(fd, &msg, cfg_zerocopy ? MSG_ZEROCOPY : 0);
405*4882a593Smuzhiyun 	if (ret == -1)
406*4882a593Smuzhiyun 		error(1, errno, "sendmsg");
407*4882a593Smuzhiyun 	if (ret != iov.iov_len)
408*4882a593Smuzhiyun 		error(1, 0, "sendmsg: %u != %llu\n", ret,
409*4882a593Smuzhiyun 			(unsigned long long)iov.iov_len);
410*4882a593Smuzhiyun 
411*4882a593Smuzhiyun 	return 1;
412*4882a593Smuzhiyun }
413*4882a593Smuzhiyun 
/* Print the command line synopsis for @filepath and exit with status 1. */
static void usage(const char *filepath)
{
	error(1, 0,
	      "Usage: %s [-46acmHPtTuvz] [-C cpu] [-D dst ip] [-l secs] "
	      "[-M messagenr] [-p port] [-s sendsize] [-S gsosize]",
	      filepath);
}
419*4882a593Smuzhiyun 
parse_opts(int argc,char ** argv)420*4882a593Smuzhiyun static void parse_opts(int argc, char **argv)
421*4882a593Smuzhiyun {
422*4882a593Smuzhiyun 	const char *bind_addr = NULL;
423*4882a593Smuzhiyun 	int max_len, hdrlen;
424*4882a593Smuzhiyun 	int c;
425*4882a593Smuzhiyun 
426*4882a593Smuzhiyun 	while ((c = getopt(argc, argv, "46acC:D:Hl:mM:p:s:PS:tTuvz")) != -1) {
427*4882a593Smuzhiyun 		switch (c) {
428*4882a593Smuzhiyun 		case '4':
429*4882a593Smuzhiyun 			if (cfg_family != PF_UNSPEC)
430*4882a593Smuzhiyun 				error(1, 0, "Pass one of -4 or -6");
431*4882a593Smuzhiyun 			cfg_family = PF_INET;
432*4882a593Smuzhiyun 			cfg_alen = sizeof(struct sockaddr_in);
433*4882a593Smuzhiyun 			break;
434*4882a593Smuzhiyun 		case '6':
435*4882a593Smuzhiyun 			if (cfg_family != PF_UNSPEC)
436*4882a593Smuzhiyun 				error(1, 0, "Pass one of -4 or -6");
437*4882a593Smuzhiyun 			cfg_family = PF_INET6;
438*4882a593Smuzhiyun 			cfg_alen = sizeof(struct sockaddr_in6);
439*4882a593Smuzhiyun 			break;
440*4882a593Smuzhiyun 		case 'a':
441*4882a593Smuzhiyun 			cfg_audit = true;
442*4882a593Smuzhiyun 			break;
443*4882a593Smuzhiyun 		case 'c':
444*4882a593Smuzhiyun 			cfg_cache_trash = true;
445*4882a593Smuzhiyun 			break;
446*4882a593Smuzhiyun 		case 'C':
447*4882a593Smuzhiyun 			cfg_cpu = strtol(optarg, NULL, 0);
448*4882a593Smuzhiyun 			break;
449*4882a593Smuzhiyun 		case 'D':
450*4882a593Smuzhiyun 			bind_addr = optarg;
451*4882a593Smuzhiyun 			break;
452*4882a593Smuzhiyun 		case 'l':
453*4882a593Smuzhiyun 			cfg_runtime_ms = strtoul(optarg, NULL, 10) * 1000;
454*4882a593Smuzhiyun 			break;
455*4882a593Smuzhiyun 		case 'm':
456*4882a593Smuzhiyun 			cfg_sendmmsg = true;
457*4882a593Smuzhiyun 			break;
458*4882a593Smuzhiyun 		case 'M':
459*4882a593Smuzhiyun 			cfg_msg_nr = strtoul(optarg, NULL, 10);
460*4882a593Smuzhiyun 			break;
461*4882a593Smuzhiyun 		case 'p':
462*4882a593Smuzhiyun 			cfg_port = strtoul(optarg, NULL, 0);
463*4882a593Smuzhiyun 			break;
464*4882a593Smuzhiyun 		case 'P':
465*4882a593Smuzhiyun 			cfg_poll = true;
466*4882a593Smuzhiyun 			break;
467*4882a593Smuzhiyun 		case 's':
468*4882a593Smuzhiyun 			cfg_payload_len = strtoul(optarg, NULL, 0);
469*4882a593Smuzhiyun 			break;
470*4882a593Smuzhiyun 		case 'S':
471*4882a593Smuzhiyun 			cfg_gso_size = strtoul(optarg, NULL, 0);
472*4882a593Smuzhiyun 			cfg_segment = true;
473*4882a593Smuzhiyun 			break;
474*4882a593Smuzhiyun 		case 'H':
475*4882a593Smuzhiyun 			cfg_tx_ts = SOF_TIMESTAMPING_TX_HARDWARE;
476*4882a593Smuzhiyun 			cfg_tx_tstamp = true;
477*4882a593Smuzhiyun 			break;
478*4882a593Smuzhiyun 		case 't':
479*4882a593Smuzhiyun 			cfg_tcp = true;
480*4882a593Smuzhiyun 			break;
481*4882a593Smuzhiyun 		case 'T':
482*4882a593Smuzhiyun 			cfg_tx_tstamp = true;
483*4882a593Smuzhiyun 			break;
484*4882a593Smuzhiyun 		case 'u':
485*4882a593Smuzhiyun 			cfg_connected = false;
486*4882a593Smuzhiyun 			break;
487*4882a593Smuzhiyun 		case 'v':
488*4882a593Smuzhiyun 			cfg_verbose = true;
489*4882a593Smuzhiyun 			break;
490*4882a593Smuzhiyun 		case 'z':
491*4882a593Smuzhiyun 			cfg_zerocopy = true;
492*4882a593Smuzhiyun 			break;
493*4882a593Smuzhiyun 		}
494*4882a593Smuzhiyun 	}
495*4882a593Smuzhiyun 
496*4882a593Smuzhiyun 	if (!bind_addr)
497*4882a593Smuzhiyun 		bind_addr = cfg_family == PF_INET6 ? "::" : "0.0.0.0";
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 	setup_sockaddr(cfg_family, bind_addr, &cfg_dst_addr);
500*4882a593Smuzhiyun 
501*4882a593Smuzhiyun 	if (optind != argc)
502*4882a593Smuzhiyun 		usage(argv[0]);
503*4882a593Smuzhiyun 
504*4882a593Smuzhiyun 	if (cfg_family == PF_UNSPEC)
505*4882a593Smuzhiyun 		error(1, 0, "must pass one of -4 or -6");
506*4882a593Smuzhiyun 	if (cfg_tcp && !cfg_connected)
507*4882a593Smuzhiyun 		error(1, 0, "connectionless tcp makes no sense");
508*4882a593Smuzhiyun 	if (cfg_segment && cfg_sendmmsg)
509*4882a593Smuzhiyun 		error(1, 0, "cannot combine segment offload and sendmmsg");
510*4882a593Smuzhiyun 	if (cfg_tx_tstamp && !(cfg_segment || cfg_sendmmsg))
511*4882a593Smuzhiyun 		error(1, 0, "Options -T and -H require either -S or -m option");
512*4882a593Smuzhiyun 
513*4882a593Smuzhiyun 	if (cfg_family == PF_INET)
514*4882a593Smuzhiyun 		hdrlen = sizeof(struct iphdr) + sizeof(struct udphdr);
515*4882a593Smuzhiyun 	else
516*4882a593Smuzhiyun 		hdrlen = sizeof(struct ip6_hdr) + sizeof(struct udphdr);
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 	cfg_mss = ETH_DATA_LEN - hdrlen;
519*4882a593Smuzhiyun 	max_len = ETH_MAX_MTU - hdrlen;
520*4882a593Smuzhiyun 	if (!cfg_gso_size)
521*4882a593Smuzhiyun 		cfg_gso_size = cfg_mss;
522*4882a593Smuzhiyun 
523*4882a593Smuzhiyun 	if (cfg_payload_len > max_len)
524*4882a593Smuzhiyun 		error(1, 0, "payload length %u exceeds max %u",
525*4882a593Smuzhiyun 		      cfg_payload_len, max_len);
526*4882a593Smuzhiyun }
527*4882a593Smuzhiyun 
/*
 * Set the path MTU discovery mode of @fd to the *_PMTUDISC_DO value, through
 * the IPv4 socket option when @is_ipv4 is true and the IPv6 one otherwise.
 * A setsockopt() failure is fatal.
 */
static void set_pmtu_discover(int fd, bool is_ipv4)
{
	const int level = is_ipv4 ? SOL_IP : SOL_IPV6;
	const int name = is_ipv4 ? IP_MTU_DISCOVER : IPV6_MTU_DISCOVER;
	int val = is_ipv4 ? IP_PMTUDISC_DO : IPV6_PMTUDISC_DO;

	if (setsockopt(fd, level, name, &val, sizeof(val)) != 0)
		error(1, errno, "setsockopt path mtu");
}
545*4882a593Smuzhiyun 
set_tx_timestamping(int fd)546*4882a593Smuzhiyun static void set_tx_timestamping(int fd)
547*4882a593Smuzhiyun {
548*4882a593Smuzhiyun 	int val = SOF_TIMESTAMPING_OPT_CMSG | SOF_TIMESTAMPING_OPT_ID |
549*4882a593Smuzhiyun 			SOF_TIMESTAMPING_OPT_TSONLY;
550*4882a593Smuzhiyun 
551*4882a593Smuzhiyun 	if (cfg_tx_ts == SOF_TIMESTAMPING_TX_SOFTWARE)
552*4882a593Smuzhiyun 		val |= SOF_TIMESTAMPING_SOFTWARE;
553*4882a593Smuzhiyun 	else
554*4882a593Smuzhiyun 		val |= SOF_TIMESTAMPING_RAW_HARDWARE;
555*4882a593Smuzhiyun 
556*4882a593Smuzhiyun 	if (setsockopt(fd, SOL_SOCKET, SO_TIMESTAMPING, &val, sizeof(val)))
557*4882a593Smuzhiyun 		error(1, errno, "setsockopt tx timestamping");
558*4882a593Smuzhiyun }
559*4882a593Smuzhiyun 
print_audit_report(unsigned long num_msgs,unsigned long num_sends)560*4882a593Smuzhiyun static void print_audit_report(unsigned long num_msgs, unsigned long num_sends)
561*4882a593Smuzhiyun {
562*4882a593Smuzhiyun 	unsigned long tdelta;
563*4882a593Smuzhiyun 
564*4882a593Smuzhiyun 	tdelta = tend - tstart;
565*4882a593Smuzhiyun 	if (!tdelta)
566*4882a593Smuzhiyun 		return;
567*4882a593Smuzhiyun 
568*4882a593Smuzhiyun 	fprintf(stderr, "Summary over %lu.%03lu seconds...\n",
569*4882a593Smuzhiyun 			tdelta / 1000, tdelta % 1000);
570*4882a593Smuzhiyun 	fprintf(stderr,
571*4882a593Smuzhiyun 		"sum %s tx: %6lu MB/s %10lu calls (%lu/s) %10lu msgs (%lu/s)\n",
572*4882a593Smuzhiyun 		cfg_tcp ? "tcp" : "udp",
573*4882a593Smuzhiyun 		((num_msgs * cfg_payload_len) >> 10) / tdelta,
574*4882a593Smuzhiyun 		num_sends, num_sends * 1000 / tdelta,
575*4882a593Smuzhiyun 		num_msgs, num_msgs * 1000 / tdelta);
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun 	if (cfg_tx_tstamp) {
578*4882a593Smuzhiyun 		if (stat_tx_ts_errors)
579*4882a593Smuzhiyun 			error(1, 0,
580*4882a593Smuzhiyun 			      "Expected clean TX Timestamps: %9lu msgs received %6lu errors",
581*4882a593Smuzhiyun 			      stat_tx_ts, stat_tx_ts_errors);
582*4882a593Smuzhiyun 		if (stat_tx_ts != num_sends)
583*4882a593Smuzhiyun 			error(1, 0,
584*4882a593Smuzhiyun 			      "Unexpected number of TX Timestamps: %9lu expected %9lu received",
585*4882a593Smuzhiyun 			      num_sends, stat_tx_ts);
586*4882a593Smuzhiyun 		fprintf(stderr,
587*4882a593Smuzhiyun 			"Tx Timestamps: %19lu received %17lu errors\n",
588*4882a593Smuzhiyun 			stat_tx_ts, stat_tx_ts_errors);
589*4882a593Smuzhiyun 	}
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 	if (cfg_zerocopy) {
592*4882a593Smuzhiyun 		if (stat_zcopies != num_sends)
593*4882a593Smuzhiyun 			error(1, 0, "Unexpected number of Zerocopy completions: %9lu expected %9lu received",
594*4882a593Smuzhiyun 			      num_sends, stat_zcopies);
595*4882a593Smuzhiyun 		fprintf(stderr,
596*4882a593Smuzhiyun 			"Zerocopy acks: %19lu\n",
597*4882a593Smuzhiyun 			stat_zcopies);
598*4882a593Smuzhiyun 	}
599*4882a593Smuzhiyun }
600*4882a593Smuzhiyun 
print_report(unsigned long num_msgs,unsigned long num_sends)601*4882a593Smuzhiyun static void print_report(unsigned long num_msgs, unsigned long num_sends)
602*4882a593Smuzhiyun {
603*4882a593Smuzhiyun 	fprintf(stderr,
604*4882a593Smuzhiyun 		"%s tx: %6lu MB/s %8lu calls/s %6lu msg/s\n",
605*4882a593Smuzhiyun 		cfg_tcp ? "tcp" : "udp",
606*4882a593Smuzhiyun 		(num_msgs * cfg_payload_len) >> 20,
607*4882a593Smuzhiyun 		num_sends, num_msgs);
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	if (cfg_audit) {
610*4882a593Smuzhiyun 		total_num_msgs += num_msgs;
611*4882a593Smuzhiyun 		total_num_sends += num_sends;
612*4882a593Smuzhiyun 	}
613*4882a593Smuzhiyun }
614*4882a593Smuzhiyun 
main(int argc,char ** argv)615*4882a593Smuzhiyun int main(int argc, char **argv)
616*4882a593Smuzhiyun {
617*4882a593Smuzhiyun 	unsigned long num_msgs, num_sends;
618*4882a593Smuzhiyun 	unsigned long tnow, treport, tstop;
619*4882a593Smuzhiyun 	int fd, i, val, ret;
620*4882a593Smuzhiyun 
621*4882a593Smuzhiyun 	parse_opts(argc, argv);
622*4882a593Smuzhiyun 
623*4882a593Smuzhiyun 	if (cfg_cpu > 0)
624*4882a593Smuzhiyun 		set_cpu(cfg_cpu);
625*4882a593Smuzhiyun 
626*4882a593Smuzhiyun 	for (i = 0; i < sizeof(buf[0]); i++)
627*4882a593Smuzhiyun 		buf[0][i] = 'a' + (i % 26);
628*4882a593Smuzhiyun 	for (i = 1; i < NUM_PKT; i++)
629*4882a593Smuzhiyun 		memcpy(buf[i], buf[0], sizeof(buf[0]));
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun 	signal(SIGINT, sigint_handler);
632*4882a593Smuzhiyun 
633*4882a593Smuzhiyun 	fd = socket(cfg_family, cfg_tcp ? SOCK_STREAM : SOCK_DGRAM, 0);
634*4882a593Smuzhiyun 	if (fd == -1)
635*4882a593Smuzhiyun 		error(1, errno, "socket");
636*4882a593Smuzhiyun 
637*4882a593Smuzhiyun 	if (cfg_zerocopy) {
638*4882a593Smuzhiyun 		val = 1;
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 		ret = setsockopt(fd, SOL_SOCKET, SO_ZEROCOPY,
641*4882a593Smuzhiyun 				 &val, sizeof(val));
642*4882a593Smuzhiyun 		if (ret) {
643*4882a593Smuzhiyun 			if (errno == ENOPROTOOPT || errno == ENOTSUPP) {
644*4882a593Smuzhiyun 				fprintf(stderr, "SO_ZEROCOPY not supported");
645*4882a593Smuzhiyun 				exit(KSFT_SKIP);
646*4882a593Smuzhiyun 			}
647*4882a593Smuzhiyun 			error(1, errno, "setsockopt zerocopy");
648*4882a593Smuzhiyun 		}
649*4882a593Smuzhiyun 	}
650*4882a593Smuzhiyun 
651*4882a593Smuzhiyun 	if (cfg_connected &&
652*4882a593Smuzhiyun 	    connect(fd, (void *)&cfg_dst_addr, cfg_alen))
653*4882a593Smuzhiyun 		error(1, errno, "connect");
654*4882a593Smuzhiyun 
655*4882a593Smuzhiyun 	if (cfg_segment)
656*4882a593Smuzhiyun 		set_pmtu_discover(fd, cfg_family == PF_INET);
657*4882a593Smuzhiyun 
658*4882a593Smuzhiyun 	if (cfg_tx_tstamp)
659*4882a593Smuzhiyun 		set_tx_timestamping(fd);
660*4882a593Smuzhiyun 
661*4882a593Smuzhiyun 	num_msgs = num_sends = 0;
662*4882a593Smuzhiyun 	tnow = gettimeofday_ms();
663*4882a593Smuzhiyun 	tstart = tnow;
664*4882a593Smuzhiyun 	tend = tnow;
665*4882a593Smuzhiyun 	tstop = tnow + cfg_runtime_ms;
666*4882a593Smuzhiyun 	treport = tnow + 1000;
667*4882a593Smuzhiyun 
668*4882a593Smuzhiyun 	i = 0;
669*4882a593Smuzhiyun 	do {
670*4882a593Smuzhiyun 		if (cfg_tcp)
671*4882a593Smuzhiyun 			num_sends += send_tcp(fd, buf[i]);
672*4882a593Smuzhiyun 		else if (cfg_segment)
673*4882a593Smuzhiyun 			num_sends += send_udp_segment(fd, buf[i]);
674*4882a593Smuzhiyun 		else if (cfg_sendmmsg)
675*4882a593Smuzhiyun 			num_sends += send_udp_sendmmsg(fd, buf[i]);
676*4882a593Smuzhiyun 		else
677*4882a593Smuzhiyun 			num_sends += send_udp(fd, buf[i]);
678*4882a593Smuzhiyun 		num_msgs++;
679*4882a593Smuzhiyun 		if ((cfg_zerocopy && ((num_msgs & 0xF) == 0)) || cfg_tx_tstamp)
680*4882a593Smuzhiyun 			flush_errqueue(fd, cfg_poll);
681*4882a593Smuzhiyun 
682*4882a593Smuzhiyun 		if (cfg_msg_nr && num_msgs >= cfg_msg_nr)
683*4882a593Smuzhiyun 			break;
684*4882a593Smuzhiyun 
685*4882a593Smuzhiyun 		tnow = gettimeofday_ms();
686*4882a593Smuzhiyun 		if (tnow >= treport) {
687*4882a593Smuzhiyun 			print_report(num_msgs, num_sends);
688*4882a593Smuzhiyun 			num_msgs = num_sends = 0;
689*4882a593Smuzhiyun 			treport = tnow + 1000;
690*4882a593Smuzhiyun 		}
691*4882a593Smuzhiyun 
692*4882a593Smuzhiyun 		/* cold cache when writing buffer */
693*4882a593Smuzhiyun 		if (cfg_cache_trash)
694*4882a593Smuzhiyun 			i = ++i < NUM_PKT ? i : 0;
695*4882a593Smuzhiyun 
696*4882a593Smuzhiyun 	} while (!interrupted && (cfg_runtime_ms == -1 || tnow < tstop));
697*4882a593Smuzhiyun 
698*4882a593Smuzhiyun 	if (cfg_zerocopy || cfg_tx_tstamp)
699*4882a593Smuzhiyun 		flush_errqueue(fd, true);
700*4882a593Smuzhiyun 
701*4882a593Smuzhiyun 	if (close(fd))
702*4882a593Smuzhiyun 		error(1, errno, "close");
703*4882a593Smuzhiyun 
704*4882a593Smuzhiyun 	if (cfg_audit) {
705*4882a593Smuzhiyun 		tend = tnow;
706*4882a593Smuzhiyun 		total_num_msgs += num_msgs;
707*4882a593Smuzhiyun 		total_num_sends += num_sends;
708*4882a593Smuzhiyun 		print_audit_report(total_num_msgs, total_num_sends);
709*4882a593Smuzhiyun 	}
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun 	return 0;
712*4882a593Smuzhiyun }
713