xref: /OK3568_Linux_fs/kernel/net/tipc/socket.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
/*
 * net/tipc/socket.c: TIPC socket API
 *
 * Copyright (c) 2001-2007, 2012-2017, Ericsson AB
 * Copyright (c) 2004-2008, 2010-2013, Wind River Systems
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the names of the copyright holders nor the names of its
 *    contributors may be used to endorse or promote products derived from
 *    this software without specific prior written permission.
 *
 * Alternatively, this software may be distributed under the terms of the
 * GNU General Public License ("GPL") version 2 as published by the Free
 * Software Foundation.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun #include <linux/rhashtable.h>
38*4882a593Smuzhiyun #include <linux/sched/signal.h>
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun #include "core.h"
41*4882a593Smuzhiyun #include "name_table.h"
42*4882a593Smuzhiyun #include "node.h"
43*4882a593Smuzhiyun #include "link.h"
44*4882a593Smuzhiyun #include "name_distr.h"
45*4882a593Smuzhiyun #include "socket.h"
46*4882a593Smuzhiyun #include "bcast.h"
47*4882a593Smuzhiyun #include "netlink.h"
48*4882a593Smuzhiyun #include "group.h"
49*4882a593Smuzhiyun #include "trace.h"
50*4882a593Smuzhiyun 
/* Nagle: value tipc_sock::nagle_start is created with, and presumably its
 * upper bound (the latter is not referenced in this part of the file)
 */
#define NAGLE_START_INIT	4
#define NAGLE_START_MAX		1024

/* Connection timing */
#define CONN_TIMEOUT_DEFAULT	8000	/* default connect timeout [ms] = 8 s */
#define CONN_PROBING_INTV	msecs_to_jiffies(60 * 60 * 1000) /* [ms] => 1 h */

/* Port number range */
#define TIPC_MIN_PORT		1
#define TIPC_MAX_PORT		0xffffffff

#define TIPC_ACK_RATE		4	/* ACK at 1/4 of rcv window size */
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun enum {
60*4882a593Smuzhiyun 	TIPC_LISTEN = TCP_LISTEN,
61*4882a593Smuzhiyun 	TIPC_ESTABLISHED = TCP_ESTABLISHED,
62*4882a593Smuzhiyun 	TIPC_OPEN = TCP_CLOSE,
63*4882a593Smuzhiyun 	TIPC_DISCONNECTING = TCP_CLOSE_WAIT,
64*4882a593Smuzhiyun 	TIPC_CONNECTING = TCP_SYN_SENT,
65*4882a593Smuzhiyun };
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun struct sockaddr_pair {
68*4882a593Smuzhiyun 	struct sockaddr_tipc sock;
69*4882a593Smuzhiyun 	struct sockaddr_tipc member;
70*4882a593Smuzhiyun };
71*4882a593Smuzhiyun 
72*4882a593Smuzhiyun /**
73*4882a593Smuzhiyun  * struct tipc_sock - TIPC socket structure
74*4882a593Smuzhiyun  * @sk: socket - interacts with 'port' and with user via the socket API
75*4882a593Smuzhiyun  * @conn_type: TIPC type used when connection was established
76*4882a593Smuzhiyun  * @conn_instance: TIPC instance used when connection was established
77*4882a593Smuzhiyun  * @published: non-zero if port has one or more associated names
78*4882a593Smuzhiyun  * @max_pkt: maximum packet size "hint" used when building messages sent by port
79*4882a593Smuzhiyun  * @maxnagle: maximum size of msg which can be subject to nagle
80*4882a593Smuzhiyun  * @portid: unique port identity in TIPC socket hash table
81*4882a593Smuzhiyun  * @phdr: preformatted message header used when sending messages
82*4882a593Smuzhiyun  * #cong_links: list of congested links
83*4882a593Smuzhiyun  * @publications: list of publications for port
84*4882a593Smuzhiyun  * @blocking_link: address of the congested link we are currently sleeping on
85*4882a593Smuzhiyun  * @pub_count: total # of publications port has made during its lifetime
86*4882a593Smuzhiyun  * @conn_timeout: the time we can wait for an unresponded setup request
87*4882a593Smuzhiyun  * @dupl_rcvcnt: number of bytes counted twice, in both backlog and rcv queue
88*4882a593Smuzhiyun  * @cong_link_cnt: number of congested links
89*4882a593Smuzhiyun  * @snt_unacked: # messages sent by socket, and not yet acked by peer
90*4882a593Smuzhiyun  * @rcv_unacked: # messages read by user, but not yet acked back to peer
91*4882a593Smuzhiyun  * @peer: 'connected' peer for dgram/rdm
92*4882a593Smuzhiyun  * @node: hash table node
93*4882a593Smuzhiyun  * @mc_method: cookie for use between socket and broadcast layer
94*4882a593Smuzhiyun  * @rcu: rcu struct for tipc_sock
95*4882a593Smuzhiyun  */
96*4882a593Smuzhiyun struct tipc_sock {
97*4882a593Smuzhiyun 	struct sock sk;
98*4882a593Smuzhiyun 	u32 conn_type;
99*4882a593Smuzhiyun 	u32 conn_instance;
100*4882a593Smuzhiyun 	int published;
101*4882a593Smuzhiyun 	u32 max_pkt;
102*4882a593Smuzhiyun 	u32 maxnagle;
103*4882a593Smuzhiyun 	u32 portid;
104*4882a593Smuzhiyun 	struct tipc_msg phdr;
105*4882a593Smuzhiyun 	struct list_head cong_links;
106*4882a593Smuzhiyun 	struct list_head publications;
107*4882a593Smuzhiyun 	u32 pub_count;
108*4882a593Smuzhiyun 	atomic_t dupl_rcvcnt;
109*4882a593Smuzhiyun 	u16 conn_timeout;
110*4882a593Smuzhiyun 	bool probe_unacked;
111*4882a593Smuzhiyun 	u16 cong_link_cnt;
112*4882a593Smuzhiyun 	u16 snt_unacked;
113*4882a593Smuzhiyun 	u16 snd_win;
114*4882a593Smuzhiyun 	u16 peer_caps;
115*4882a593Smuzhiyun 	u16 rcv_unacked;
116*4882a593Smuzhiyun 	u16 rcv_win;
117*4882a593Smuzhiyun 	struct sockaddr_tipc peer;
118*4882a593Smuzhiyun 	struct rhash_head node;
119*4882a593Smuzhiyun 	struct tipc_mc_method mc_method;
120*4882a593Smuzhiyun 	struct rcu_head rcu;
121*4882a593Smuzhiyun 	struct tipc_group *group;
122*4882a593Smuzhiyun 	u32 oneway;
123*4882a593Smuzhiyun 	u32 nagle_start;
124*4882a593Smuzhiyun 	u16 snd_backlog;
125*4882a593Smuzhiyun 	u16 msg_acc;
126*4882a593Smuzhiyun 	u16 pkt_cnt;
127*4882a593Smuzhiyun 	bool expect_ack;
128*4882a593Smuzhiyun 	bool nodelay;
129*4882a593Smuzhiyun 	bool group_is_open;
130*4882a593Smuzhiyun };
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun static int tipc_sk_backlog_rcv(struct sock *sk, struct sk_buff *skb);
133*4882a593Smuzhiyun static void tipc_data_ready(struct sock *sk);
134*4882a593Smuzhiyun static void tipc_write_space(struct sock *sk);
135*4882a593Smuzhiyun static void tipc_sock_destruct(struct sock *sk);
136*4882a593Smuzhiyun static int tipc_release(struct socket *sock);
137*4882a593Smuzhiyun static int tipc_accept(struct socket *sock, struct socket *new_sock, int flags,
138*4882a593Smuzhiyun 		       bool kern);
139*4882a593Smuzhiyun static void tipc_sk_timeout(struct timer_list *t);
140*4882a593Smuzhiyun static int tipc_sk_publish(struct tipc_sock *tsk, uint scope,
141*4882a593Smuzhiyun 			   struct tipc_name_seq const *seq);
142*4882a593Smuzhiyun static int tipc_sk_withdraw(struct tipc_sock *tsk, uint scope,
143*4882a593Smuzhiyun 			    struct tipc_name_seq const *seq);
144*4882a593Smuzhiyun static int tipc_sk_leave(struct tipc_sock *tsk);
145*4882a593Smuzhiyun static struct tipc_sock *tipc_sk_lookup(struct net *net, u32 portid);
146*4882a593Smuzhiyun static int tipc_sk_insert(struct tipc_sock *tsk);
147*4882a593Smuzhiyun static void tipc_sk_remove(struct tipc_sock *tsk);
148*4882a593Smuzhiyun static int __tipc_sendstream(struct socket *sock, struct msghdr *m, size_t dsz);
149*4882a593Smuzhiyun static int __tipc_sendmsg(struct socket *sock, struct msghdr *m, size_t dsz);
150*4882a593Smuzhiyun static void tipc_sk_push_backlog(struct tipc_sock *tsk, bool nagle_ack);
151*4882a593Smuzhiyun static int tipc_wait_for_connect(struct socket *sock, long *timeo_p);
152*4882a593Smuzhiyun 
153*4882a593Smuzhiyun static const struct proto_ops packet_ops;
154*4882a593Smuzhiyun static const struct proto_ops stream_ops;
155*4882a593Smuzhiyun static const struct proto_ops msg_ops;
156*4882a593Smuzhiyun static struct proto tipc_proto;
157*4882a593Smuzhiyun static const struct rhashtable_params tsk_rht_params;
158*4882a593Smuzhiyun 
tsk_own_node(struct tipc_sock * tsk)159*4882a593Smuzhiyun static u32 tsk_own_node(struct tipc_sock *tsk)
160*4882a593Smuzhiyun {
161*4882a593Smuzhiyun 	return msg_prevnode(&tsk->phdr);
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun 
tsk_peer_node(struct tipc_sock * tsk)164*4882a593Smuzhiyun static u32 tsk_peer_node(struct tipc_sock *tsk)
165*4882a593Smuzhiyun {
166*4882a593Smuzhiyun 	return msg_destnode(&tsk->phdr);
167*4882a593Smuzhiyun }
168*4882a593Smuzhiyun 
tsk_peer_port(struct tipc_sock * tsk)169*4882a593Smuzhiyun static u32 tsk_peer_port(struct tipc_sock *tsk)
170*4882a593Smuzhiyun {
171*4882a593Smuzhiyun 	return msg_destport(&tsk->phdr);
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun 
tsk_unreliable(struct tipc_sock * tsk)174*4882a593Smuzhiyun static  bool tsk_unreliable(struct tipc_sock *tsk)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun 	return msg_src_droppable(&tsk->phdr) != 0;
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun 
/* tsk_set_unreliable - set (1) or clear (0) the 'source droppable' flag in
 * the socket's preformatted header
 */
static void tsk_set_unreliable(struct tipc_sock *tsk, bool unreliable)
{
	if (unreliable)
		msg_set_src_droppable(&tsk->phdr, 1);
	else
		msg_set_src_droppable(&tsk->phdr, 0);
}
183*4882a593Smuzhiyun 
tsk_unreturnable(struct tipc_sock * tsk)184*4882a593Smuzhiyun static bool tsk_unreturnable(struct tipc_sock *tsk)
185*4882a593Smuzhiyun {
186*4882a593Smuzhiyun 	return msg_dest_droppable(&tsk->phdr) != 0;
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun 
/* tsk_set_unreturnable - set (1) or clear (0) the 'destination droppable'
 * flag in the socket's preformatted header
 */
static void tsk_set_unreturnable(struct tipc_sock *tsk, bool unreturnable)
{
	if (unreturnable)
		msg_set_dest_droppable(&tsk->phdr, 1);
	else
		msg_set_dest_droppable(&tsk->phdr, 0);
}
193*4882a593Smuzhiyun 
tsk_importance(struct tipc_sock * tsk)194*4882a593Smuzhiyun static int tsk_importance(struct tipc_sock *tsk)
195*4882a593Smuzhiyun {
196*4882a593Smuzhiyun 	return msg_importance(&tsk->phdr);
197*4882a593Smuzhiyun }
198*4882a593Smuzhiyun 
tipc_sk(const struct sock * sk)199*4882a593Smuzhiyun static struct tipc_sock *tipc_sk(const struct sock *sk)
200*4882a593Smuzhiyun {
201*4882a593Smuzhiyun 	return container_of(sk, struct tipc_sock, sk);
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun 
tsk_set_importance(struct sock * sk,int imp)204*4882a593Smuzhiyun int tsk_set_importance(struct sock *sk, int imp)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun 	if (imp > TIPC_CRITICAL_IMPORTANCE)
207*4882a593Smuzhiyun 		return -EINVAL;
208*4882a593Smuzhiyun 	msg_set_importance(&tipc_sk(sk)->phdr, (u32)imp);
209*4882a593Smuzhiyun 	return 0;
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun 
tsk_conn_cong(struct tipc_sock * tsk)212*4882a593Smuzhiyun static bool tsk_conn_cong(struct tipc_sock *tsk)
213*4882a593Smuzhiyun {
214*4882a593Smuzhiyun 	return tsk->snt_unacked > tsk->snd_win;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun 
tsk_blocks(int len)217*4882a593Smuzhiyun static u16 tsk_blocks(int len)
218*4882a593Smuzhiyun {
219*4882a593Smuzhiyun 	return ((len / FLOWCTL_BLK_SZ) + 1);
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun 
222*4882a593Smuzhiyun /* tsk_blocks(): translate a buffer size in bytes to number of
223*4882a593Smuzhiyun  * advertisable blocks, taking into account the ratio truesize(len)/len
224*4882a593Smuzhiyun  * We can trust that this ratio is always < 4 for len >= FLOWCTL_BLK_SZ
225*4882a593Smuzhiyun  */
tsk_adv_blocks(int len)226*4882a593Smuzhiyun static u16 tsk_adv_blocks(int len)
227*4882a593Smuzhiyun {
228*4882a593Smuzhiyun 	return len / FLOWCTL_BLK_SZ / 4;
229*4882a593Smuzhiyun }
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun /* tsk_inc(): increment counter for sent or received data
232*4882a593Smuzhiyun  * - If block based flow control is not supported by peer we
233*4882a593Smuzhiyun  *   fall back to message based ditto, incrementing the counter
234*4882a593Smuzhiyun  */
tsk_inc(struct tipc_sock * tsk,int msglen)235*4882a593Smuzhiyun static u16 tsk_inc(struct tipc_sock *tsk, int msglen)
236*4882a593Smuzhiyun {
237*4882a593Smuzhiyun 	if (likely(tsk->peer_caps & TIPC_BLOCK_FLOWCTL))
238*4882a593Smuzhiyun 		return ((msglen / FLOWCTL_BLK_SZ) + 1);
239*4882a593Smuzhiyun 	return 1;
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun 
242*4882a593Smuzhiyun /* tsk_set_nagle - enable/disable nagle property by manipulating maxnagle
243*4882a593Smuzhiyun  */
tsk_set_nagle(struct tipc_sock * tsk)244*4882a593Smuzhiyun static void tsk_set_nagle(struct tipc_sock *tsk)
245*4882a593Smuzhiyun {
246*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
247*4882a593Smuzhiyun 
248*4882a593Smuzhiyun 	tsk->maxnagle = 0;
249*4882a593Smuzhiyun 	if (sk->sk_type != SOCK_STREAM)
250*4882a593Smuzhiyun 		return;
251*4882a593Smuzhiyun 	if (tsk->nodelay)
252*4882a593Smuzhiyun 		return;
253*4882a593Smuzhiyun 	if (!(tsk->peer_caps & TIPC_NAGLE))
254*4882a593Smuzhiyun 		return;
255*4882a593Smuzhiyun 	/* Limit node local buffer size to avoid receive queue overflow */
256*4882a593Smuzhiyun 	if (tsk->max_pkt == MAX_MSG_SIZE)
257*4882a593Smuzhiyun 		tsk->maxnagle = 1500;
258*4882a593Smuzhiyun 	else
259*4882a593Smuzhiyun 		tsk->maxnagle = tsk->max_pkt;
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun 
262*4882a593Smuzhiyun /**
263*4882a593Smuzhiyun  * tsk_advance_rx_queue - discard first buffer in socket receive queue
264*4882a593Smuzhiyun  *
265*4882a593Smuzhiyun  * Caller must hold socket lock
266*4882a593Smuzhiyun  */
tsk_advance_rx_queue(struct sock * sk)267*4882a593Smuzhiyun static void tsk_advance_rx_queue(struct sock *sk)
268*4882a593Smuzhiyun {
269*4882a593Smuzhiyun 	trace_tipc_sk_advance_rx(sk, NULL, TIPC_DUMP_SK_RCVQ, " ");
270*4882a593Smuzhiyun 	kfree_skb(__skb_dequeue(&sk->sk_receive_queue));
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun /* tipc_sk_respond() : send response message back to sender
274*4882a593Smuzhiyun  */
tipc_sk_respond(struct sock * sk,struct sk_buff * skb,int err)275*4882a593Smuzhiyun static void tipc_sk_respond(struct sock *sk, struct sk_buff *skb, int err)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun 	u32 selector;
278*4882a593Smuzhiyun 	u32 dnode;
279*4882a593Smuzhiyun 	u32 onode = tipc_own_addr(sock_net(sk));
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	if (!tipc_msg_reverse(onode, &skb, err))
282*4882a593Smuzhiyun 		return;
283*4882a593Smuzhiyun 
284*4882a593Smuzhiyun 	trace_tipc_sk_rej_msg(sk, skb, TIPC_DUMP_NONE, "@sk_respond!");
285*4882a593Smuzhiyun 	dnode = msg_destnode(buf_msg(skb));
286*4882a593Smuzhiyun 	selector = msg_origport(buf_msg(skb));
287*4882a593Smuzhiyun 	tipc_node_xmit_skb(sock_net(sk), skb, dnode, selector);
288*4882a593Smuzhiyun }
289*4882a593Smuzhiyun 
290*4882a593Smuzhiyun /**
291*4882a593Smuzhiyun  * tsk_rej_rx_queue - reject all buffers in socket receive queue
292*4882a593Smuzhiyun  *
293*4882a593Smuzhiyun  * Caller must hold socket lock
294*4882a593Smuzhiyun  */
tsk_rej_rx_queue(struct sock * sk,int error)295*4882a593Smuzhiyun static void tsk_rej_rx_queue(struct sock *sk, int error)
296*4882a593Smuzhiyun {
297*4882a593Smuzhiyun 	struct sk_buff *skb;
298*4882a593Smuzhiyun 
299*4882a593Smuzhiyun 	while ((skb = __skb_dequeue(&sk->sk_receive_queue)))
300*4882a593Smuzhiyun 		tipc_sk_respond(sk, skb, error);
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun 
tipc_sk_connected(struct sock * sk)303*4882a593Smuzhiyun static bool tipc_sk_connected(struct sock *sk)
304*4882a593Smuzhiyun {
305*4882a593Smuzhiyun 	return sk->sk_state == TIPC_ESTABLISHED;
306*4882a593Smuzhiyun }
307*4882a593Smuzhiyun 
308*4882a593Smuzhiyun /* tipc_sk_type_connectionless - check if the socket is datagram socket
309*4882a593Smuzhiyun  * @sk: socket
310*4882a593Smuzhiyun  *
311*4882a593Smuzhiyun  * Returns true if connection less, false otherwise
312*4882a593Smuzhiyun  */
tipc_sk_type_connectionless(struct sock * sk)313*4882a593Smuzhiyun static bool tipc_sk_type_connectionless(struct sock *sk)
314*4882a593Smuzhiyun {
315*4882a593Smuzhiyun 	return sk->sk_type == SOCK_RDM || sk->sk_type == SOCK_DGRAM;
316*4882a593Smuzhiyun }
317*4882a593Smuzhiyun 
318*4882a593Smuzhiyun /* tsk_peer_msg - verify if message was sent by connected port's peer
319*4882a593Smuzhiyun  *
320*4882a593Smuzhiyun  * Handles cases where the node's network address has changed from
321*4882a593Smuzhiyun  * the default of <0.0.0> to its configured setting.
322*4882a593Smuzhiyun  */
tsk_peer_msg(struct tipc_sock * tsk,struct tipc_msg * msg)323*4882a593Smuzhiyun static bool tsk_peer_msg(struct tipc_sock *tsk, struct tipc_msg *msg)
324*4882a593Smuzhiyun {
325*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
326*4882a593Smuzhiyun 	u32 self = tipc_own_addr(sock_net(sk));
327*4882a593Smuzhiyun 	u32 peer_port = tsk_peer_port(tsk);
328*4882a593Smuzhiyun 	u32 orig_node, peer_node;
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun 	if (unlikely(!tipc_sk_connected(sk)))
331*4882a593Smuzhiyun 		return false;
332*4882a593Smuzhiyun 
333*4882a593Smuzhiyun 	if (unlikely(msg_origport(msg) != peer_port))
334*4882a593Smuzhiyun 		return false;
335*4882a593Smuzhiyun 
336*4882a593Smuzhiyun 	orig_node = msg_orignode(msg);
337*4882a593Smuzhiyun 	peer_node = tsk_peer_node(tsk);
338*4882a593Smuzhiyun 
339*4882a593Smuzhiyun 	if (likely(orig_node == peer_node))
340*4882a593Smuzhiyun 		return true;
341*4882a593Smuzhiyun 
342*4882a593Smuzhiyun 	if (!orig_node && peer_node == self)
343*4882a593Smuzhiyun 		return true;
344*4882a593Smuzhiyun 
345*4882a593Smuzhiyun 	if (!peer_node && orig_node == self)
346*4882a593Smuzhiyun 		return true;
347*4882a593Smuzhiyun 
348*4882a593Smuzhiyun 	return false;
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun 
351*4882a593Smuzhiyun /* tipc_set_sk_state - set the sk_state of the socket
352*4882a593Smuzhiyun  * @sk: socket
353*4882a593Smuzhiyun  *
354*4882a593Smuzhiyun  * Caller must hold socket lock
355*4882a593Smuzhiyun  *
356*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
357*4882a593Smuzhiyun  */
tipc_set_sk_state(struct sock * sk,int state)358*4882a593Smuzhiyun static int tipc_set_sk_state(struct sock *sk, int state)
359*4882a593Smuzhiyun {
360*4882a593Smuzhiyun 	int oldsk_state = sk->sk_state;
361*4882a593Smuzhiyun 	int res = -EINVAL;
362*4882a593Smuzhiyun 
363*4882a593Smuzhiyun 	switch (state) {
364*4882a593Smuzhiyun 	case TIPC_OPEN:
365*4882a593Smuzhiyun 		res = 0;
366*4882a593Smuzhiyun 		break;
367*4882a593Smuzhiyun 	case TIPC_LISTEN:
368*4882a593Smuzhiyun 	case TIPC_CONNECTING:
369*4882a593Smuzhiyun 		if (oldsk_state == TIPC_OPEN)
370*4882a593Smuzhiyun 			res = 0;
371*4882a593Smuzhiyun 		break;
372*4882a593Smuzhiyun 	case TIPC_ESTABLISHED:
373*4882a593Smuzhiyun 		if (oldsk_state == TIPC_CONNECTING ||
374*4882a593Smuzhiyun 		    oldsk_state == TIPC_OPEN)
375*4882a593Smuzhiyun 			res = 0;
376*4882a593Smuzhiyun 		break;
377*4882a593Smuzhiyun 	case TIPC_DISCONNECTING:
378*4882a593Smuzhiyun 		if (oldsk_state == TIPC_CONNECTING ||
379*4882a593Smuzhiyun 		    oldsk_state == TIPC_ESTABLISHED)
380*4882a593Smuzhiyun 			res = 0;
381*4882a593Smuzhiyun 		break;
382*4882a593Smuzhiyun 	}
383*4882a593Smuzhiyun 
384*4882a593Smuzhiyun 	if (!res)
385*4882a593Smuzhiyun 		sk->sk_state = state;
386*4882a593Smuzhiyun 
387*4882a593Smuzhiyun 	return res;
388*4882a593Smuzhiyun }
389*4882a593Smuzhiyun 
tipc_sk_sock_err(struct socket * sock,long * timeout)390*4882a593Smuzhiyun static int tipc_sk_sock_err(struct socket *sock, long *timeout)
391*4882a593Smuzhiyun {
392*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
393*4882a593Smuzhiyun 	int err = sock_error(sk);
394*4882a593Smuzhiyun 	int typ = sock->type;
395*4882a593Smuzhiyun 
396*4882a593Smuzhiyun 	if (err)
397*4882a593Smuzhiyun 		return err;
398*4882a593Smuzhiyun 	if (typ == SOCK_STREAM || typ == SOCK_SEQPACKET) {
399*4882a593Smuzhiyun 		if (sk->sk_state == TIPC_DISCONNECTING)
400*4882a593Smuzhiyun 			return -EPIPE;
401*4882a593Smuzhiyun 		else if (!tipc_sk_connected(sk))
402*4882a593Smuzhiyun 			return -ENOTCONN;
403*4882a593Smuzhiyun 	}
404*4882a593Smuzhiyun 	if (!*timeout)
405*4882a593Smuzhiyun 		return -EAGAIN;
406*4882a593Smuzhiyun 	if (signal_pending(current))
407*4882a593Smuzhiyun 		return sock_intr_errno(*timeout);
408*4882a593Smuzhiyun 
409*4882a593Smuzhiyun 	return 0;
410*4882a593Smuzhiyun }
411*4882a593Smuzhiyun 
/* tipc_wait_for_cond - sleep until condition_ becomes true
 * @sock_: socket to wait on
 * @timeo_: pointer to the remaining wait time; updated on every wakeup
 * @condition_: expression re-evaluated before each sleep
 *
 * The socket lock is released around each sleep and taken again afterwards,
 * so the caller must hold it on entry.
 *
 * Evaluates to 0 once condition_ holds, otherwise to the error returned by
 * tipc_sk_sock_err().
 */
#define tipc_wait_for_cond(sock_, timeo_, condition_)			       \
({                                                                             \
	DEFINE_WAIT_FUNC(wait_, woken_wake_function);                          \
	struct sock *sk_;						       \
	int rc_;							       \
									       \
	for (;;) {							       \
		rc_ = !(condition_);					       \
		if (!rc_)						       \
			break;						       \
		/* coupled with smp_wmb() in tipc_sk_proto_rcv() */            \
		smp_rmb();                                                     \
		sk_ = (sock_)->sk;					       \
		rc_ = tipc_sk_sock_err((sock_), timeo_);		       \
		if (rc_)						       \
			break;						       \
		add_wait_queue(sk_sleep(sk_), &wait_);                         \
		release_sock(sk_);					       \
		*(timeo_) = wait_woken(&wait_, TASK_INTERRUPTIBLE, *(timeo_)); \
		sched_annotate_sleep();				               \
		lock_sock(sk_);						       \
		remove_wait_queue(sk_sleep(sk_), &wait_);		       \
	}								       \
	rc_;								       \
})
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun /**
436*4882a593Smuzhiyun  * tipc_sk_create - create a TIPC socket
437*4882a593Smuzhiyun  * @net: network namespace (must be default network)
438*4882a593Smuzhiyun  * @sock: pre-allocated socket structure
439*4882a593Smuzhiyun  * @protocol: protocol indicator (must be 0)
440*4882a593Smuzhiyun  * @kern: caused by kernel or by userspace?
441*4882a593Smuzhiyun  *
442*4882a593Smuzhiyun  * This routine creates additional data structures used by the TIPC socket,
443*4882a593Smuzhiyun  * initializes them, and links them together.
444*4882a593Smuzhiyun  *
445*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
446*4882a593Smuzhiyun  */
tipc_sk_create(struct net * net,struct socket * sock,int protocol,int kern)447*4882a593Smuzhiyun static int tipc_sk_create(struct net *net, struct socket *sock,
448*4882a593Smuzhiyun 			  int protocol, int kern)
449*4882a593Smuzhiyun {
450*4882a593Smuzhiyun 	const struct proto_ops *ops;
451*4882a593Smuzhiyun 	struct sock *sk;
452*4882a593Smuzhiyun 	struct tipc_sock *tsk;
453*4882a593Smuzhiyun 	struct tipc_msg *msg;
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun 	/* Validate arguments */
456*4882a593Smuzhiyun 	if (unlikely(protocol != 0))
457*4882a593Smuzhiyun 		return -EPROTONOSUPPORT;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	switch (sock->type) {
460*4882a593Smuzhiyun 	case SOCK_STREAM:
461*4882a593Smuzhiyun 		ops = &stream_ops;
462*4882a593Smuzhiyun 		break;
463*4882a593Smuzhiyun 	case SOCK_SEQPACKET:
464*4882a593Smuzhiyun 		ops = &packet_ops;
465*4882a593Smuzhiyun 		break;
466*4882a593Smuzhiyun 	case SOCK_DGRAM:
467*4882a593Smuzhiyun 	case SOCK_RDM:
468*4882a593Smuzhiyun 		ops = &msg_ops;
469*4882a593Smuzhiyun 		break;
470*4882a593Smuzhiyun 	default:
471*4882a593Smuzhiyun 		return -EPROTOTYPE;
472*4882a593Smuzhiyun 	}
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun 	/* Allocate socket's protocol area */
475*4882a593Smuzhiyun 	sk = sk_alloc(net, AF_TIPC, GFP_KERNEL, &tipc_proto, kern);
476*4882a593Smuzhiyun 	if (sk == NULL)
477*4882a593Smuzhiyun 		return -ENOMEM;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	tsk = tipc_sk(sk);
480*4882a593Smuzhiyun 	tsk->max_pkt = MAX_PKT_DEFAULT;
481*4882a593Smuzhiyun 	tsk->maxnagle = 0;
482*4882a593Smuzhiyun 	tsk->nagle_start = NAGLE_START_INIT;
483*4882a593Smuzhiyun 	INIT_LIST_HEAD(&tsk->publications);
484*4882a593Smuzhiyun 	INIT_LIST_HEAD(&tsk->cong_links);
485*4882a593Smuzhiyun 	msg = &tsk->phdr;
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun 	/* Finish initializing socket data structures */
488*4882a593Smuzhiyun 	sock->ops = ops;
489*4882a593Smuzhiyun 	sock_init_data(sock, sk);
490*4882a593Smuzhiyun 	tipc_set_sk_state(sk, TIPC_OPEN);
491*4882a593Smuzhiyun 	if (tipc_sk_insert(tsk)) {
492*4882a593Smuzhiyun 		sk_free(sk);
493*4882a593Smuzhiyun 		pr_warn("Socket create failed; port number exhausted\n");
494*4882a593Smuzhiyun 		return -EINVAL;
495*4882a593Smuzhiyun 	}
496*4882a593Smuzhiyun 
497*4882a593Smuzhiyun 	/* Ensure tsk is visible before we read own_addr. */
498*4882a593Smuzhiyun 	smp_mb();
499*4882a593Smuzhiyun 
500*4882a593Smuzhiyun 	tipc_msg_init(tipc_own_addr(net), msg, TIPC_LOW_IMPORTANCE,
501*4882a593Smuzhiyun 		      TIPC_NAMED_MSG, NAMED_H_SIZE, 0);
502*4882a593Smuzhiyun 
503*4882a593Smuzhiyun 	msg_set_origport(msg, tsk->portid);
504*4882a593Smuzhiyun 	timer_setup(&sk->sk_timer, tipc_sk_timeout, 0);
505*4882a593Smuzhiyun 	sk->sk_shutdown = 0;
506*4882a593Smuzhiyun 	sk->sk_backlog_rcv = tipc_sk_backlog_rcv;
507*4882a593Smuzhiyun 	sk->sk_rcvbuf = READ_ONCE(sysctl_tipc_rmem[1]);
508*4882a593Smuzhiyun 	sk->sk_data_ready = tipc_data_ready;
509*4882a593Smuzhiyun 	sk->sk_write_space = tipc_write_space;
510*4882a593Smuzhiyun 	sk->sk_destruct = tipc_sock_destruct;
511*4882a593Smuzhiyun 	tsk->conn_timeout = CONN_TIMEOUT_DEFAULT;
512*4882a593Smuzhiyun 	tsk->group_is_open = true;
513*4882a593Smuzhiyun 	atomic_set(&tsk->dupl_rcvcnt, 0);
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 	/* Start out with safe limits until we receive an advertised window */
516*4882a593Smuzhiyun 	tsk->snd_win = tsk_adv_blocks(RCVBUF_MIN);
517*4882a593Smuzhiyun 	tsk->rcv_win = tsk->snd_win;
518*4882a593Smuzhiyun 
519*4882a593Smuzhiyun 	if (tipc_sk_type_connectionless(sk)) {
520*4882a593Smuzhiyun 		tsk_set_unreturnable(tsk, true);
521*4882a593Smuzhiyun 		if (sock->type == SOCK_DGRAM)
522*4882a593Smuzhiyun 			tsk_set_unreliable(tsk, true);
523*4882a593Smuzhiyun 	}
524*4882a593Smuzhiyun 	__skb_queue_head_init(&tsk->mc_method.deferredq);
525*4882a593Smuzhiyun 	trace_tipc_sk_create(sk, NULL, TIPC_DUMP_NONE, " ");
526*4882a593Smuzhiyun 	return 0;
527*4882a593Smuzhiyun }
528*4882a593Smuzhiyun 
tipc_sk_callback(struct rcu_head * head)529*4882a593Smuzhiyun static void tipc_sk_callback(struct rcu_head *head)
530*4882a593Smuzhiyun {
531*4882a593Smuzhiyun 	struct tipc_sock *tsk = container_of(head, struct tipc_sock, rcu);
532*4882a593Smuzhiyun 
533*4882a593Smuzhiyun 	sock_put(&tsk->sk);
534*4882a593Smuzhiyun }
535*4882a593Smuzhiyun 
536*4882a593Smuzhiyun /* Caller should hold socket lock for the socket. */
__tipc_shutdown(struct socket * sock,int error)537*4882a593Smuzhiyun static void __tipc_shutdown(struct socket *sock, int error)
538*4882a593Smuzhiyun {
539*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
540*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
541*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
542*4882a593Smuzhiyun 	long timeout = msecs_to_jiffies(CONN_TIMEOUT_DEFAULT);
543*4882a593Smuzhiyun 	u32 dnode = tsk_peer_node(tsk);
544*4882a593Smuzhiyun 	struct sk_buff *skb;
545*4882a593Smuzhiyun 
546*4882a593Smuzhiyun 	/* Avoid that hi-prio shutdown msgs bypass msgs in link wakeup queue */
547*4882a593Smuzhiyun 	tipc_wait_for_cond(sock, &timeout, (!tsk->cong_link_cnt &&
548*4882a593Smuzhiyun 					    !tsk_conn_cong(tsk)));
549*4882a593Smuzhiyun 
550*4882a593Smuzhiyun 	/* Push out delayed messages if in Nagle mode */
551*4882a593Smuzhiyun 	tipc_sk_push_backlog(tsk, false);
552*4882a593Smuzhiyun 	/* Remove pending SYN */
553*4882a593Smuzhiyun 	__skb_queue_purge(&sk->sk_write_queue);
554*4882a593Smuzhiyun 
555*4882a593Smuzhiyun 	/* Remove partially received buffer if any */
556*4882a593Smuzhiyun 	skb = skb_peek(&sk->sk_receive_queue);
557*4882a593Smuzhiyun 	if (skb && TIPC_SKB_CB(skb)->bytes_read) {
558*4882a593Smuzhiyun 		__skb_unlink(skb, &sk->sk_receive_queue);
559*4882a593Smuzhiyun 		kfree_skb(skb);
560*4882a593Smuzhiyun 	}
561*4882a593Smuzhiyun 
562*4882a593Smuzhiyun 	/* Reject all unreceived messages if connectionless */
563*4882a593Smuzhiyun 	if (tipc_sk_type_connectionless(sk)) {
564*4882a593Smuzhiyun 		tsk_rej_rx_queue(sk, error);
565*4882a593Smuzhiyun 		return;
566*4882a593Smuzhiyun 	}
567*4882a593Smuzhiyun 
568*4882a593Smuzhiyun 	switch (sk->sk_state) {
569*4882a593Smuzhiyun 	case TIPC_CONNECTING:
570*4882a593Smuzhiyun 	case TIPC_ESTABLISHED:
571*4882a593Smuzhiyun 		tipc_set_sk_state(sk, TIPC_DISCONNECTING);
572*4882a593Smuzhiyun 		tipc_node_remove_conn(net, dnode, tsk->portid);
573*4882a593Smuzhiyun 		/* Send a FIN+/- to its peer */
574*4882a593Smuzhiyun 		skb = __skb_dequeue(&sk->sk_receive_queue);
575*4882a593Smuzhiyun 		if (skb) {
576*4882a593Smuzhiyun 			__skb_queue_purge(&sk->sk_receive_queue);
577*4882a593Smuzhiyun 			tipc_sk_respond(sk, skb, error);
578*4882a593Smuzhiyun 			break;
579*4882a593Smuzhiyun 		}
580*4882a593Smuzhiyun 		skb = tipc_msg_create(TIPC_CRITICAL_IMPORTANCE,
581*4882a593Smuzhiyun 				      TIPC_CONN_MSG, SHORT_H_SIZE, 0, dnode,
582*4882a593Smuzhiyun 				      tsk_own_node(tsk), tsk_peer_port(tsk),
583*4882a593Smuzhiyun 				      tsk->portid, error);
584*4882a593Smuzhiyun 		if (skb)
585*4882a593Smuzhiyun 			tipc_node_xmit_skb(net, skb, dnode, tsk->portid);
586*4882a593Smuzhiyun 		break;
587*4882a593Smuzhiyun 	case TIPC_LISTEN:
588*4882a593Smuzhiyun 		/* Reject all SYN messages */
589*4882a593Smuzhiyun 		tsk_rej_rx_queue(sk, error);
590*4882a593Smuzhiyun 		break;
591*4882a593Smuzhiyun 	default:
592*4882a593Smuzhiyun 		__skb_queue_purge(&sk->sk_receive_queue);
593*4882a593Smuzhiyun 		break;
594*4882a593Smuzhiyun 	}
595*4882a593Smuzhiyun }
596*4882a593Smuzhiyun 
597*4882a593Smuzhiyun /**
598*4882a593Smuzhiyun  * tipc_release - destroy a TIPC socket
599*4882a593Smuzhiyun  * @sock: socket to destroy
600*4882a593Smuzhiyun  *
601*4882a593Smuzhiyun  * This routine cleans up any messages that are still queued on the socket.
602*4882a593Smuzhiyun  * For DGRAM and RDM socket types, all queued messages are rejected.
603*4882a593Smuzhiyun  * For SEQPACKET and STREAM socket types, the first message is rejected
604*4882a593Smuzhiyun  * and any others are discarded.  (If the first message on a STREAM socket
605*4882a593Smuzhiyun  * is partially-read, it is discarded and the next one is rejected instead.)
606*4882a593Smuzhiyun  *
607*4882a593Smuzhiyun  * NOTE: Rejected messages are not necessarily returned to the sender!  They
608*4882a593Smuzhiyun  * are returned or discarded according to the "destination droppable" setting
609*4882a593Smuzhiyun  * specified for the message by the sender.
610*4882a593Smuzhiyun  *
611*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
612*4882a593Smuzhiyun  */
tipc_release(struct socket * sock)613*4882a593Smuzhiyun static int tipc_release(struct socket *sock)
614*4882a593Smuzhiyun {
615*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
616*4882a593Smuzhiyun 	struct tipc_sock *tsk;
617*4882a593Smuzhiyun 
618*4882a593Smuzhiyun 	/*
619*4882a593Smuzhiyun 	 * Exit if socket isn't fully initialized (occurs when a failed accept()
620*4882a593Smuzhiyun 	 * releases a pre-allocated child socket that was never used)
621*4882a593Smuzhiyun 	 */
622*4882a593Smuzhiyun 	if (sk == NULL)
623*4882a593Smuzhiyun 		return 0;
624*4882a593Smuzhiyun 
625*4882a593Smuzhiyun 	tsk = tipc_sk(sk);
626*4882a593Smuzhiyun 	lock_sock(sk);
627*4882a593Smuzhiyun 
628*4882a593Smuzhiyun 	trace_tipc_sk_release(sk, NULL, TIPC_DUMP_ALL, " ");
629*4882a593Smuzhiyun 	__tipc_shutdown(sock, TIPC_ERR_NO_PORT);
630*4882a593Smuzhiyun 	sk->sk_shutdown = SHUTDOWN_MASK;
631*4882a593Smuzhiyun 	tipc_sk_leave(tsk);
632*4882a593Smuzhiyun 	tipc_sk_withdraw(tsk, 0, NULL);
633*4882a593Smuzhiyun 	__skb_queue_purge(&tsk->mc_method.deferredq);
634*4882a593Smuzhiyun 	sk_stop_timer(sk, &sk->sk_timer);
635*4882a593Smuzhiyun 	tipc_sk_remove(tsk);
636*4882a593Smuzhiyun 
637*4882a593Smuzhiyun 	sock_orphan(sk);
638*4882a593Smuzhiyun 	/* Reject any messages that accumulated in backlog queue */
639*4882a593Smuzhiyun 	release_sock(sk);
640*4882a593Smuzhiyun 	tipc_dest_list_purge(&tsk->cong_links);
641*4882a593Smuzhiyun 	tsk->cong_link_cnt = 0;
642*4882a593Smuzhiyun 	call_rcu(&tsk->rcu, tipc_sk_callback);
643*4882a593Smuzhiyun 	sock->sk = NULL;
644*4882a593Smuzhiyun 
645*4882a593Smuzhiyun 	return 0;
646*4882a593Smuzhiyun }
647*4882a593Smuzhiyun 
648*4882a593Smuzhiyun /**
649*4882a593Smuzhiyun  * tipc_bind - associate or disassocate TIPC name(s) with a socket
650*4882a593Smuzhiyun  * @sock: socket structure
651*4882a593Smuzhiyun  * @uaddr: socket address describing name(s) and desired operation
652*4882a593Smuzhiyun  * @uaddr_len: size of socket address data structure
653*4882a593Smuzhiyun  *
654*4882a593Smuzhiyun  * Name and name sequence binding is indicated using a positive scope value;
655*4882a593Smuzhiyun  * a negative scope value unbinds the specified name.  Specifying no name
656*4882a593Smuzhiyun  * (i.e. a socket address length of 0) unbinds all names from the socket.
657*4882a593Smuzhiyun  *
658*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
659*4882a593Smuzhiyun  *
660*4882a593Smuzhiyun  * NOTE: This routine doesn't need to take the socket lock since it doesn't
661*4882a593Smuzhiyun  *       access any non-constant socket information.
662*4882a593Smuzhiyun  */
tipc_bind(struct socket * sock,struct sockaddr * uaddr,int uaddr_len)663*4882a593Smuzhiyun static int tipc_bind(struct socket *sock, struct sockaddr *uaddr,
664*4882a593Smuzhiyun 		     int uaddr_len)
665*4882a593Smuzhiyun {
666*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
667*4882a593Smuzhiyun 	struct sockaddr_tipc *addr = (struct sockaddr_tipc *)uaddr;
668*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
669*4882a593Smuzhiyun 	int res = -EINVAL;
670*4882a593Smuzhiyun 
671*4882a593Smuzhiyun 	lock_sock(sk);
672*4882a593Smuzhiyun 	if (unlikely(!uaddr_len)) {
673*4882a593Smuzhiyun 		res = tipc_sk_withdraw(tsk, 0, NULL);
674*4882a593Smuzhiyun 		goto exit;
675*4882a593Smuzhiyun 	}
676*4882a593Smuzhiyun 	if (tsk->group) {
677*4882a593Smuzhiyun 		res = -EACCES;
678*4882a593Smuzhiyun 		goto exit;
679*4882a593Smuzhiyun 	}
680*4882a593Smuzhiyun 	if (uaddr_len < sizeof(struct sockaddr_tipc)) {
681*4882a593Smuzhiyun 		res = -EINVAL;
682*4882a593Smuzhiyun 		goto exit;
683*4882a593Smuzhiyun 	}
684*4882a593Smuzhiyun 	if (addr->family != AF_TIPC) {
685*4882a593Smuzhiyun 		res = -EAFNOSUPPORT;
686*4882a593Smuzhiyun 		goto exit;
687*4882a593Smuzhiyun 	}
688*4882a593Smuzhiyun 
689*4882a593Smuzhiyun 	if (addr->addrtype == TIPC_ADDR_NAME)
690*4882a593Smuzhiyun 		addr->addr.nameseq.upper = addr->addr.nameseq.lower;
691*4882a593Smuzhiyun 	else if (addr->addrtype != TIPC_ADDR_NAMESEQ) {
692*4882a593Smuzhiyun 		res = -EAFNOSUPPORT;
693*4882a593Smuzhiyun 		goto exit;
694*4882a593Smuzhiyun 	}
695*4882a593Smuzhiyun 
696*4882a593Smuzhiyun 	if ((addr->addr.nameseq.type < TIPC_RESERVED_TYPES) &&
697*4882a593Smuzhiyun 	    (addr->addr.nameseq.type != TIPC_TOP_SRV) &&
698*4882a593Smuzhiyun 	    (addr->addr.nameseq.type != TIPC_CFG_SRV)) {
699*4882a593Smuzhiyun 		res = -EACCES;
700*4882a593Smuzhiyun 		goto exit;
701*4882a593Smuzhiyun 	}
702*4882a593Smuzhiyun 
703*4882a593Smuzhiyun 	res = (addr->scope >= 0) ?
704*4882a593Smuzhiyun 		tipc_sk_publish(tsk, addr->scope, &addr->addr.nameseq) :
705*4882a593Smuzhiyun 		tipc_sk_withdraw(tsk, -addr->scope, &addr->addr.nameseq);
706*4882a593Smuzhiyun exit:
707*4882a593Smuzhiyun 	release_sock(sk);
708*4882a593Smuzhiyun 	return res;
709*4882a593Smuzhiyun }
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun /**
712*4882a593Smuzhiyun  * tipc_getname - get port ID of socket or peer socket
713*4882a593Smuzhiyun  * @sock: socket structure
714*4882a593Smuzhiyun  * @uaddr: area for returned socket address
715*4882a593Smuzhiyun  * @peer: 0 = own ID, 1 = current peer ID, 2 = current/former peer ID
716*4882a593Smuzhiyun  *
717*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
718*4882a593Smuzhiyun  *
719*4882a593Smuzhiyun  * NOTE: This routine doesn't need to take the socket lock since it only
720*4882a593Smuzhiyun  *       accesses socket information that is unchanging (or which changes in
721*4882a593Smuzhiyun  *       a completely predictable manner).
722*4882a593Smuzhiyun  */
tipc_getname(struct socket * sock,struct sockaddr * uaddr,int peer)723*4882a593Smuzhiyun static int tipc_getname(struct socket *sock, struct sockaddr *uaddr,
724*4882a593Smuzhiyun 			int peer)
725*4882a593Smuzhiyun {
726*4882a593Smuzhiyun 	struct sockaddr_tipc *addr = (struct sockaddr_tipc *)uaddr;
727*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
728*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 	memset(addr, 0, sizeof(*addr));
731*4882a593Smuzhiyun 	if (peer) {
732*4882a593Smuzhiyun 		if ((!tipc_sk_connected(sk)) &&
733*4882a593Smuzhiyun 		    ((peer != 2) || (sk->sk_state != TIPC_DISCONNECTING)))
734*4882a593Smuzhiyun 			return -ENOTCONN;
735*4882a593Smuzhiyun 		addr->addr.id.ref = tsk_peer_port(tsk);
736*4882a593Smuzhiyun 		addr->addr.id.node = tsk_peer_node(tsk);
737*4882a593Smuzhiyun 	} else {
738*4882a593Smuzhiyun 		addr->addr.id.ref = tsk->portid;
739*4882a593Smuzhiyun 		addr->addr.id.node = tipc_own_addr(sock_net(sk));
740*4882a593Smuzhiyun 	}
741*4882a593Smuzhiyun 
742*4882a593Smuzhiyun 	addr->addrtype = TIPC_ADDR_ID;
743*4882a593Smuzhiyun 	addr->family = AF_TIPC;
744*4882a593Smuzhiyun 	addr->scope = 0;
745*4882a593Smuzhiyun 	addr->addr.name.domain = 0;
746*4882a593Smuzhiyun 
747*4882a593Smuzhiyun 	return sizeof(*addr);
748*4882a593Smuzhiyun }
749*4882a593Smuzhiyun 
750*4882a593Smuzhiyun /**
751*4882a593Smuzhiyun  * tipc_poll - read and possibly block on pollmask
752*4882a593Smuzhiyun  * @file: file structure associated with the socket
753*4882a593Smuzhiyun  * @sock: socket for which to calculate the poll bits
754*4882a593Smuzhiyun  * @wait: ???
755*4882a593Smuzhiyun  *
756*4882a593Smuzhiyun  * Returns pollmask value
757*4882a593Smuzhiyun  *
758*4882a593Smuzhiyun  * COMMENTARY:
759*4882a593Smuzhiyun  * It appears that the usual socket locking mechanisms are not useful here
760*4882a593Smuzhiyun  * since the pollmask info is potentially out-of-date the moment this routine
761*4882a593Smuzhiyun  * exits.  TCP and other protocols seem to rely on higher level poll routines
762*4882a593Smuzhiyun  * to handle any preventable race conditions, so TIPC will do the same ...
763*4882a593Smuzhiyun  *
764*4882a593Smuzhiyun  * IMPORTANT: The fact that a read or write operation is indicated does NOT
765*4882a593Smuzhiyun  * imply that the operation will succeed, merely that it should be performed
766*4882a593Smuzhiyun  * and will not block.
767*4882a593Smuzhiyun  */
tipc_poll(struct file * file,struct socket * sock,poll_table * wait)768*4882a593Smuzhiyun static __poll_t tipc_poll(struct file *file, struct socket *sock,
769*4882a593Smuzhiyun 			      poll_table *wait)
770*4882a593Smuzhiyun {
771*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
772*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
773*4882a593Smuzhiyun 	__poll_t revents = 0;
774*4882a593Smuzhiyun 
775*4882a593Smuzhiyun 	sock_poll_wait(file, sock, wait);
776*4882a593Smuzhiyun 	trace_tipc_sk_poll(sk, NULL, TIPC_DUMP_ALL, " ");
777*4882a593Smuzhiyun 
778*4882a593Smuzhiyun 	if (sk->sk_shutdown & RCV_SHUTDOWN)
779*4882a593Smuzhiyun 		revents |= EPOLLRDHUP | EPOLLIN | EPOLLRDNORM;
780*4882a593Smuzhiyun 	if (sk->sk_shutdown == SHUTDOWN_MASK)
781*4882a593Smuzhiyun 		revents |= EPOLLHUP;
782*4882a593Smuzhiyun 
783*4882a593Smuzhiyun 	switch (sk->sk_state) {
784*4882a593Smuzhiyun 	case TIPC_ESTABLISHED:
785*4882a593Smuzhiyun 		if (!tsk->cong_link_cnt && !tsk_conn_cong(tsk))
786*4882a593Smuzhiyun 			revents |= EPOLLOUT;
787*4882a593Smuzhiyun 		fallthrough;
788*4882a593Smuzhiyun 	case TIPC_LISTEN:
789*4882a593Smuzhiyun 	case TIPC_CONNECTING:
790*4882a593Smuzhiyun 		if (!skb_queue_empty_lockless(&sk->sk_receive_queue))
791*4882a593Smuzhiyun 			revents |= EPOLLIN | EPOLLRDNORM;
792*4882a593Smuzhiyun 		break;
793*4882a593Smuzhiyun 	case TIPC_OPEN:
794*4882a593Smuzhiyun 		if (tsk->group_is_open && !tsk->cong_link_cnt)
795*4882a593Smuzhiyun 			revents |= EPOLLOUT;
796*4882a593Smuzhiyun 		if (!tipc_sk_type_connectionless(sk))
797*4882a593Smuzhiyun 			break;
798*4882a593Smuzhiyun 		if (skb_queue_empty_lockless(&sk->sk_receive_queue))
799*4882a593Smuzhiyun 			break;
800*4882a593Smuzhiyun 		revents |= EPOLLIN | EPOLLRDNORM;
801*4882a593Smuzhiyun 		break;
802*4882a593Smuzhiyun 	case TIPC_DISCONNECTING:
803*4882a593Smuzhiyun 		revents = EPOLLIN | EPOLLRDNORM | EPOLLHUP;
804*4882a593Smuzhiyun 		break;
805*4882a593Smuzhiyun 	}
806*4882a593Smuzhiyun 	return revents;
807*4882a593Smuzhiyun }
808*4882a593Smuzhiyun 
809*4882a593Smuzhiyun /**
810*4882a593Smuzhiyun  * tipc_sendmcast - send multicast message
811*4882a593Smuzhiyun  * @sock: socket structure
812*4882a593Smuzhiyun  * @seq: destination address
813*4882a593Smuzhiyun  * @msg: message to send
814*4882a593Smuzhiyun  * @dlen: length of data to send
815*4882a593Smuzhiyun  * @timeout: timeout to wait for wakeup
816*4882a593Smuzhiyun  *
817*4882a593Smuzhiyun  * Called from function tipc_sendmsg(), which has done all sanity checks
818*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno
819*4882a593Smuzhiyun  */
tipc_sendmcast(struct socket * sock,struct tipc_name_seq * seq,struct msghdr * msg,size_t dlen,long timeout)820*4882a593Smuzhiyun static int tipc_sendmcast(struct  socket *sock, struct tipc_name_seq *seq,
821*4882a593Smuzhiyun 			  struct msghdr *msg, size_t dlen, long timeout)
822*4882a593Smuzhiyun {
823*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
824*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
825*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
826*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
827*4882a593Smuzhiyun 	int mtu = tipc_bcast_get_mtu(net);
828*4882a593Smuzhiyun 	struct tipc_mc_method *method = &tsk->mc_method;
829*4882a593Smuzhiyun 	struct sk_buff_head pkts;
830*4882a593Smuzhiyun 	struct tipc_nlist dsts;
831*4882a593Smuzhiyun 	int rc;
832*4882a593Smuzhiyun 
833*4882a593Smuzhiyun 	if (tsk->group)
834*4882a593Smuzhiyun 		return -EACCES;
835*4882a593Smuzhiyun 
836*4882a593Smuzhiyun 	/* Block or return if any destination link is congested */
837*4882a593Smuzhiyun 	rc = tipc_wait_for_cond(sock, &timeout, !tsk->cong_link_cnt);
838*4882a593Smuzhiyun 	if (unlikely(rc))
839*4882a593Smuzhiyun 		return rc;
840*4882a593Smuzhiyun 
841*4882a593Smuzhiyun 	/* Lookup destination nodes */
842*4882a593Smuzhiyun 	tipc_nlist_init(&dsts, tipc_own_addr(net));
843*4882a593Smuzhiyun 	tipc_nametbl_lookup_dst_nodes(net, seq->type, seq->lower,
844*4882a593Smuzhiyun 				      seq->upper, &dsts);
845*4882a593Smuzhiyun 	if (!dsts.local && !dsts.remote)
846*4882a593Smuzhiyun 		return -EHOSTUNREACH;
847*4882a593Smuzhiyun 
848*4882a593Smuzhiyun 	/* Build message header */
849*4882a593Smuzhiyun 	msg_set_type(hdr, TIPC_MCAST_MSG);
850*4882a593Smuzhiyun 	msg_set_hdr_sz(hdr, MCAST_H_SIZE);
851*4882a593Smuzhiyun 	msg_set_lookup_scope(hdr, TIPC_CLUSTER_SCOPE);
852*4882a593Smuzhiyun 	msg_set_destport(hdr, 0);
853*4882a593Smuzhiyun 	msg_set_destnode(hdr, 0);
854*4882a593Smuzhiyun 	msg_set_nametype(hdr, seq->type);
855*4882a593Smuzhiyun 	msg_set_namelower(hdr, seq->lower);
856*4882a593Smuzhiyun 	msg_set_nameupper(hdr, seq->upper);
857*4882a593Smuzhiyun 
858*4882a593Smuzhiyun 	/* Build message as chain of buffers */
859*4882a593Smuzhiyun 	__skb_queue_head_init(&pkts);
860*4882a593Smuzhiyun 	rc = tipc_msg_build(hdr, msg, 0, dlen, mtu, &pkts);
861*4882a593Smuzhiyun 
862*4882a593Smuzhiyun 	/* Send message if build was successful */
863*4882a593Smuzhiyun 	if (unlikely(rc == dlen)) {
864*4882a593Smuzhiyun 		trace_tipc_sk_sendmcast(sk, skb_peek(&pkts),
865*4882a593Smuzhiyun 					TIPC_DUMP_SK_SNDQ, " ");
866*4882a593Smuzhiyun 		rc = tipc_mcast_xmit(net, &pkts, method, &dsts,
867*4882a593Smuzhiyun 				     &tsk->cong_link_cnt);
868*4882a593Smuzhiyun 	}
869*4882a593Smuzhiyun 
870*4882a593Smuzhiyun 	tipc_nlist_purge(&dsts);
871*4882a593Smuzhiyun 
872*4882a593Smuzhiyun 	return rc ? rc : dlen;
873*4882a593Smuzhiyun }
874*4882a593Smuzhiyun 
875*4882a593Smuzhiyun /**
876*4882a593Smuzhiyun  * tipc_send_group_msg - send a message to a member in the group
877*4882a593Smuzhiyun  * @net: network namespace
878*4882a593Smuzhiyun  * @m: message to send
879*4882a593Smuzhiyun  * @mb: group member
880*4882a593Smuzhiyun  * @dnode: destination node
881*4882a593Smuzhiyun  * @dport: destination port
882*4882a593Smuzhiyun  * @dlen: total length of message data
883*4882a593Smuzhiyun  */
tipc_send_group_msg(struct net * net,struct tipc_sock * tsk,struct msghdr * m,struct tipc_member * mb,u32 dnode,u32 dport,int dlen)884*4882a593Smuzhiyun static int tipc_send_group_msg(struct net *net, struct tipc_sock *tsk,
885*4882a593Smuzhiyun 			       struct msghdr *m, struct tipc_member *mb,
886*4882a593Smuzhiyun 			       u32 dnode, u32 dport, int dlen)
887*4882a593Smuzhiyun {
888*4882a593Smuzhiyun 	u16 bc_snd_nxt = tipc_group_bc_snd_nxt(tsk->group);
889*4882a593Smuzhiyun 	struct tipc_mc_method *method = &tsk->mc_method;
890*4882a593Smuzhiyun 	int blks = tsk_blocks(GROUP_H_SIZE + dlen);
891*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
892*4882a593Smuzhiyun 	struct sk_buff_head pkts;
893*4882a593Smuzhiyun 	int mtu, rc;
894*4882a593Smuzhiyun 
895*4882a593Smuzhiyun 	/* Complete message header */
896*4882a593Smuzhiyun 	msg_set_type(hdr, TIPC_GRP_UCAST_MSG);
897*4882a593Smuzhiyun 	msg_set_hdr_sz(hdr, GROUP_H_SIZE);
898*4882a593Smuzhiyun 	msg_set_destport(hdr, dport);
899*4882a593Smuzhiyun 	msg_set_destnode(hdr, dnode);
900*4882a593Smuzhiyun 	msg_set_grp_bc_seqno(hdr, bc_snd_nxt);
901*4882a593Smuzhiyun 
902*4882a593Smuzhiyun 	/* Build message as chain of buffers */
903*4882a593Smuzhiyun 	__skb_queue_head_init(&pkts);
904*4882a593Smuzhiyun 	mtu = tipc_node_get_mtu(net, dnode, tsk->portid, false);
905*4882a593Smuzhiyun 	rc = tipc_msg_build(hdr, m, 0, dlen, mtu, &pkts);
906*4882a593Smuzhiyun 	if (unlikely(rc != dlen))
907*4882a593Smuzhiyun 		return rc;
908*4882a593Smuzhiyun 
909*4882a593Smuzhiyun 	/* Send message */
910*4882a593Smuzhiyun 	rc = tipc_node_xmit(net, &pkts, dnode, tsk->portid);
911*4882a593Smuzhiyun 	if (unlikely(rc == -ELINKCONG)) {
912*4882a593Smuzhiyun 		tipc_dest_push(&tsk->cong_links, dnode, 0);
913*4882a593Smuzhiyun 		tsk->cong_link_cnt++;
914*4882a593Smuzhiyun 	}
915*4882a593Smuzhiyun 
916*4882a593Smuzhiyun 	/* Update send window */
917*4882a593Smuzhiyun 	tipc_group_update_member(mb, blks);
918*4882a593Smuzhiyun 
919*4882a593Smuzhiyun 	/* A broadcast sent within next EXPIRE period must follow same path */
920*4882a593Smuzhiyun 	method->rcast = true;
921*4882a593Smuzhiyun 	method->mandatory = true;
922*4882a593Smuzhiyun 	return dlen;
923*4882a593Smuzhiyun }
924*4882a593Smuzhiyun 
925*4882a593Smuzhiyun /**
926*4882a593Smuzhiyun  * tipc_send_group_unicast - send message to a member in the group
927*4882a593Smuzhiyun  * @sock: socket structure
928*4882a593Smuzhiyun  * @m: message to send
929*4882a593Smuzhiyun  * @dlen: total length of message data
930*4882a593Smuzhiyun  * @timeout: timeout to wait for wakeup
931*4882a593Smuzhiyun  *
932*4882a593Smuzhiyun  * Called from function tipc_sendmsg(), which has done all sanity checks
933*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno
934*4882a593Smuzhiyun  */
tipc_send_group_unicast(struct socket * sock,struct msghdr * m,int dlen,long timeout)935*4882a593Smuzhiyun static int tipc_send_group_unicast(struct socket *sock, struct msghdr *m,
936*4882a593Smuzhiyun 				   int dlen, long timeout)
937*4882a593Smuzhiyun {
938*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
939*4882a593Smuzhiyun 	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
940*4882a593Smuzhiyun 	int blks = tsk_blocks(GROUP_H_SIZE + dlen);
941*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
942*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
943*4882a593Smuzhiyun 	struct tipc_member *mb = NULL;
944*4882a593Smuzhiyun 	u32 node, port;
945*4882a593Smuzhiyun 	int rc;
946*4882a593Smuzhiyun 
947*4882a593Smuzhiyun 	node = dest->addr.id.node;
948*4882a593Smuzhiyun 	port = dest->addr.id.ref;
949*4882a593Smuzhiyun 	if (!port && !node)
950*4882a593Smuzhiyun 		return -EHOSTUNREACH;
951*4882a593Smuzhiyun 
952*4882a593Smuzhiyun 	/* Block or return if destination link or member is congested */
953*4882a593Smuzhiyun 	rc = tipc_wait_for_cond(sock, &timeout,
954*4882a593Smuzhiyun 				!tipc_dest_find(&tsk->cong_links, node, 0) &&
955*4882a593Smuzhiyun 				tsk->group &&
956*4882a593Smuzhiyun 				!tipc_group_cong(tsk->group, node, port, blks,
957*4882a593Smuzhiyun 						 &mb));
958*4882a593Smuzhiyun 	if (unlikely(rc))
959*4882a593Smuzhiyun 		return rc;
960*4882a593Smuzhiyun 
961*4882a593Smuzhiyun 	if (unlikely(!mb))
962*4882a593Smuzhiyun 		return -EHOSTUNREACH;
963*4882a593Smuzhiyun 
964*4882a593Smuzhiyun 	rc = tipc_send_group_msg(net, tsk, m, mb, node, port, dlen);
965*4882a593Smuzhiyun 
966*4882a593Smuzhiyun 	return rc ? rc : dlen;
967*4882a593Smuzhiyun }
968*4882a593Smuzhiyun 
969*4882a593Smuzhiyun /**
970*4882a593Smuzhiyun  * tipc_send_group_anycast - send message to any member with given identity
971*4882a593Smuzhiyun  * @sock: socket structure
972*4882a593Smuzhiyun  * @m: message to send
973*4882a593Smuzhiyun  * @dlen: total length of message data
974*4882a593Smuzhiyun  * @timeout: timeout to wait for wakeup
975*4882a593Smuzhiyun  *
976*4882a593Smuzhiyun  * Called from function tipc_sendmsg(), which has done all sanity checks
977*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno
978*4882a593Smuzhiyun  */
tipc_send_group_anycast(struct socket * sock,struct msghdr * m,int dlen,long timeout)979*4882a593Smuzhiyun static int tipc_send_group_anycast(struct socket *sock, struct msghdr *m,
980*4882a593Smuzhiyun 				   int dlen, long timeout)
981*4882a593Smuzhiyun {
982*4882a593Smuzhiyun 	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
983*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
984*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
985*4882a593Smuzhiyun 	struct list_head *cong_links = &tsk->cong_links;
986*4882a593Smuzhiyun 	int blks = tsk_blocks(GROUP_H_SIZE + dlen);
987*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
988*4882a593Smuzhiyun 	struct tipc_member *first = NULL;
989*4882a593Smuzhiyun 	struct tipc_member *mbr = NULL;
990*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
991*4882a593Smuzhiyun 	u32 node, port, exclude;
992*4882a593Smuzhiyun 	struct list_head dsts;
993*4882a593Smuzhiyun 	u32 type, inst, scope;
994*4882a593Smuzhiyun 	int lookups = 0;
995*4882a593Smuzhiyun 	int dstcnt, rc;
996*4882a593Smuzhiyun 	bool cong;
997*4882a593Smuzhiyun 
998*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dsts);
999*4882a593Smuzhiyun 
1000*4882a593Smuzhiyun 	type = msg_nametype(hdr);
1001*4882a593Smuzhiyun 	inst = dest->addr.name.name.instance;
1002*4882a593Smuzhiyun 	scope = msg_lookup_scope(hdr);
1003*4882a593Smuzhiyun 
1004*4882a593Smuzhiyun 	while (++lookups < 4) {
1005*4882a593Smuzhiyun 		exclude = tipc_group_exclude(tsk->group);
1006*4882a593Smuzhiyun 
1007*4882a593Smuzhiyun 		first = NULL;
1008*4882a593Smuzhiyun 
1009*4882a593Smuzhiyun 		/* Look for a non-congested destination member, if any */
1010*4882a593Smuzhiyun 		while (1) {
1011*4882a593Smuzhiyun 			if (!tipc_nametbl_lookup(net, type, inst, scope, &dsts,
1012*4882a593Smuzhiyun 						 &dstcnt, exclude, false))
1013*4882a593Smuzhiyun 				return -EHOSTUNREACH;
1014*4882a593Smuzhiyun 			tipc_dest_pop(&dsts, &node, &port);
1015*4882a593Smuzhiyun 			cong = tipc_group_cong(tsk->group, node, port, blks,
1016*4882a593Smuzhiyun 					       &mbr);
1017*4882a593Smuzhiyun 			if (!cong)
1018*4882a593Smuzhiyun 				break;
1019*4882a593Smuzhiyun 			if (mbr == first)
1020*4882a593Smuzhiyun 				break;
1021*4882a593Smuzhiyun 			if (!first)
1022*4882a593Smuzhiyun 				first = mbr;
1023*4882a593Smuzhiyun 		}
1024*4882a593Smuzhiyun 
1025*4882a593Smuzhiyun 		/* Start over if destination was not in member list */
1026*4882a593Smuzhiyun 		if (unlikely(!mbr))
1027*4882a593Smuzhiyun 			continue;
1028*4882a593Smuzhiyun 
1029*4882a593Smuzhiyun 		if (likely(!cong && !tipc_dest_find(cong_links, node, 0)))
1030*4882a593Smuzhiyun 			break;
1031*4882a593Smuzhiyun 
1032*4882a593Smuzhiyun 		/* Block or return if destination link or member is congested */
1033*4882a593Smuzhiyun 		rc = tipc_wait_for_cond(sock, &timeout,
1034*4882a593Smuzhiyun 					!tipc_dest_find(cong_links, node, 0) &&
1035*4882a593Smuzhiyun 					tsk->group &&
1036*4882a593Smuzhiyun 					!tipc_group_cong(tsk->group, node, port,
1037*4882a593Smuzhiyun 							 blks, &mbr));
1038*4882a593Smuzhiyun 		if (unlikely(rc))
1039*4882a593Smuzhiyun 			return rc;
1040*4882a593Smuzhiyun 
1041*4882a593Smuzhiyun 		/* Send, unless destination disappeared while waiting */
1042*4882a593Smuzhiyun 		if (likely(mbr))
1043*4882a593Smuzhiyun 			break;
1044*4882a593Smuzhiyun 	}
1045*4882a593Smuzhiyun 
1046*4882a593Smuzhiyun 	if (unlikely(lookups >= 4))
1047*4882a593Smuzhiyun 		return -EHOSTUNREACH;
1048*4882a593Smuzhiyun 
1049*4882a593Smuzhiyun 	rc = tipc_send_group_msg(net, tsk, m, mbr, node, port, dlen);
1050*4882a593Smuzhiyun 
1051*4882a593Smuzhiyun 	return rc ? rc : dlen;
1052*4882a593Smuzhiyun }
1053*4882a593Smuzhiyun 
1054*4882a593Smuzhiyun /**
1055*4882a593Smuzhiyun  * tipc_send_group_bcast - send message to all members in communication group
1056*4882a593Smuzhiyun  * @sock: socket structure
1057*4882a593Smuzhiyun  * @m: message to send
1058*4882a593Smuzhiyun  * @dlen: total length of message data
1059*4882a593Smuzhiyun  * @timeout: timeout to wait for wakeup
1060*4882a593Smuzhiyun  *
1061*4882a593Smuzhiyun  * Called from function tipc_sendmsg(), which has done all sanity checks
1062*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno
1063*4882a593Smuzhiyun  */
tipc_send_group_bcast(struct socket * sock,struct msghdr * m,int dlen,long timeout)1064*4882a593Smuzhiyun static int tipc_send_group_bcast(struct socket *sock, struct msghdr *m,
1065*4882a593Smuzhiyun 				 int dlen, long timeout)
1066*4882a593Smuzhiyun {
1067*4882a593Smuzhiyun 	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
1068*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1069*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
1070*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
1071*4882a593Smuzhiyun 	struct tipc_nlist *dsts;
1072*4882a593Smuzhiyun 	struct tipc_mc_method *method = &tsk->mc_method;
1073*4882a593Smuzhiyun 	bool ack = method->mandatory && method->rcast;
1074*4882a593Smuzhiyun 	int blks = tsk_blocks(MCAST_H_SIZE + dlen);
1075*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
1076*4882a593Smuzhiyun 	int mtu = tipc_bcast_get_mtu(net);
1077*4882a593Smuzhiyun 	struct sk_buff_head pkts;
1078*4882a593Smuzhiyun 	int rc = -EHOSTUNREACH;
1079*4882a593Smuzhiyun 
1080*4882a593Smuzhiyun 	/* Block or return if any destination link or member is congested */
1081*4882a593Smuzhiyun 	rc = tipc_wait_for_cond(sock, &timeout,
1082*4882a593Smuzhiyun 				!tsk->cong_link_cnt && tsk->group &&
1083*4882a593Smuzhiyun 				!tipc_group_bc_cong(tsk->group, blks));
1084*4882a593Smuzhiyun 	if (unlikely(rc))
1085*4882a593Smuzhiyun 		return rc;
1086*4882a593Smuzhiyun 
1087*4882a593Smuzhiyun 	dsts = tipc_group_dests(tsk->group);
1088*4882a593Smuzhiyun 	if (!dsts->local && !dsts->remote)
1089*4882a593Smuzhiyun 		return -EHOSTUNREACH;
1090*4882a593Smuzhiyun 
1091*4882a593Smuzhiyun 	/* Complete message header */
1092*4882a593Smuzhiyun 	if (dest) {
1093*4882a593Smuzhiyun 		msg_set_type(hdr, TIPC_GRP_MCAST_MSG);
1094*4882a593Smuzhiyun 		msg_set_nameinst(hdr, dest->addr.name.name.instance);
1095*4882a593Smuzhiyun 	} else {
1096*4882a593Smuzhiyun 		msg_set_type(hdr, TIPC_GRP_BCAST_MSG);
1097*4882a593Smuzhiyun 		msg_set_nameinst(hdr, 0);
1098*4882a593Smuzhiyun 	}
1099*4882a593Smuzhiyun 	msg_set_hdr_sz(hdr, GROUP_H_SIZE);
1100*4882a593Smuzhiyun 	msg_set_destport(hdr, 0);
1101*4882a593Smuzhiyun 	msg_set_destnode(hdr, 0);
1102*4882a593Smuzhiyun 	msg_set_grp_bc_seqno(hdr, tipc_group_bc_snd_nxt(tsk->group));
1103*4882a593Smuzhiyun 
1104*4882a593Smuzhiyun 	/* Avoid getting stuck with repeated forced replicasts */
1105*4882a593Smuzhiyun 	msg_set_grp_bc_ack_req(hdr, ack);
1106*4882a593Smuzhiyun 
1107*4882a593Smuzhiyun 	/* Build message as chain of buffers */
1108*4882a593Smuzhiyun 	__skb_queue_head_init(&pkts);
1109*4882a593Smuzhiyun 	rc = tipc_msg_build(hdr, m, 0, dlen, mtu, &pkts);
1110*4882a593Smuzhiyun 	if (unlikely(rc != dlen))
1111*4882a593Smuzhiyun 		return rc;
1112*4882a593Smuzhiyun 
1113*4882a593Smuzhiyun 	/* Send message */
1114*4882a593Smuzhiyun 	rc = tipc_mcast_xmit(net, &pkts, method, dsts, &tsk->cong_link_cnt);
1115*4882a593Smuzhiyun 	if (unlikely(rc))
1116*4882a593Smuzhiyun 		return rc;
1117*4882a593Smuzhiyun 
1118*4882a593Smuzhiyun 	/* Update broadcast sequence number and send windows */
1119*4882a593Smuzhiyun 	tipc_group_update_bc_members(tsk->group, blks, ack);
1120*4882a593Smuzhiyun 
1121*4882a593Smuzhiyun 	/* Broadcast link is now free to choose method for next broadcast */
1122*4882a593Smuzhiyun 	method->mandatory = false;
1123*4882a593Smuzhiyun 	method->expires = jiffies;
1124*4882a593Smuzhiyun 
1125*4882a593Smuzhiyun 	return dlen;
1126*4882a593Smuzhiyun }
1127*4882a593Smuzhiyun 
1128*4882a593Smuzhiyun /**
1129*4882a593Smuzhiyun  * tipc_send_group_mcast - send message to all members with given identity
1130*4882a593Smuzhiyun  * @sock: socket structure
1131*4882a593Smuzhiyun  * @m: message to send
1132*4882a593Smuzhiyun  * @dlen: total length of message data
1133*4882a593Smuzhiyun  * @timeout: timeout to wait for wakeup
1134*4882a593Smuzhiyun  *
1135*4882a593Smuzhiyun  * Called from function tipc_sendmsg(), which has done all sanity checks
1136*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno
1137*4882a593Smuzhiyun  */
tipc_send_group_mcast(struct socket * sock,struct msghdr * m,int dlen,long timeout)1138*4882a593Smuzhiyun static int tipc_send_group_mcast(struct socket *sock, struct msghdr *m,
1139*4882a593Smuzhiyun 				 int dlen, long timeout)
1140*4882a593Smuzhiyun {
1141*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1142*4882a593Smuzhiyun 	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
1143*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
1144*4882a593Smuzhiyun 	struct tipc_group *grp = tsk->group;
1145*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
1146*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
1147*4882a593Smuzhiyun 	u32 type, inst, scope, exclude;
1148*4882a593Smuzhiyun 	struct list_head dsts;
1149*4882a593Smuzhiyun 	u32 dstcnt;
1150*4882a593Smuzhiyun 
1151*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dsts);
1152*4882a593Smuzhiyun 
1153*4882a593Smuzhiyun 	type = msg_nametype(hdr);
1154*4882a593Smuzhiyun 	inst = dest->addr.name.name.instance;
1155*4882a593Smuzhiyun 	scope = msg_lookup_scope(hdr);
1156*4882a593Smuzhiyun 	exclude = tipc_group_exclude(grp);
1157*4882a593Smuzhiyun 
1158*4882a593Smuzhiyun 	if (!tipc_nametbl_lookup(net, type, inst, scope, &dsts,
1159*4882a593Smuzhiyun 				 &dstcnt, exclude, true))
1160*4882a593Smuzhiyun 		return -EHOSTUNREACH;
1161*4882a593Smuzhiyun 
1162*4882a593Smuzhiyun 	if (dstcnt == 1) {
1163*4882a593Smuzhiyun 		tipc_dest_pop(&dsts, &dest->addr.id.node, &dest->addr.id.ref);
1164*4882a593Smuzhiyun 		return tipc_send_group_unicast(sock, m, dlen, timeout);
1165*4882a593Smuzhiyun 	}
1166*4882a593Smuzhiyun 
1167*4882a593Smuzhiyun 	tipc_dest_list_purge(&dsts);
1168*4882a593Smuzhiyun 	return tipc_send_group_bcast(sock, m, dlen, timeout);
1169*4882a593Smuzhiyun }
1170*4882a593Smuzhiyun 
1171*4882a593Smuzhiyun /**
1172*4882a593Smuzhiyun  * tipc_sk_mcast_rcv - Deliver multicast messages to all destination sockets
1173*4882a593Smuzhiyun  * @arrvq: queue with arriving messages, to be cloned after destination lookup
1174*4882a593Smuzhiyun  * @inputq: queue with cloned messages, delivered to socket after dest lookup
1175*4882a593Smuzhiyun  *
1176*4882a593Smuzhiyun  * Multi-threaded: parallel calls with reference to same queues may occur
1177*4882a593Smuzhiyun  */
tipc_sk_mcast_rcv(struct net * net,struct sk_buff_head * arrvq,struct sk_buff_head * inputq)1178*4882a593Smuzhiyun void tipc_sk_mcast_rcv(struct net *net, struct sk_buff_head *arrvq,
1179*4882a593Smuzhiyun 		       struct sk_buff_head *inputq)
1180*4882a593Smuzhiyun {
1181*4882a593Smuzhiyun 	u32 self = tipc_own_addr(net);
1182*4882a593Smuzhiyun 	u32 type, lower, upper, scope;
1183*4882a593Smuzhiyun 	struct sk_buff *skb, *_skb;
1184*4882a593Smuzhiyun 	u32 portid, onode;
1185*4882a593Smuzhiyun 	struct sk_buff_head tmpq;
1186*4882a593Smuzhiyun 	struct list_head dports;
1187*4882a593Smuzhiyun 	struct tipc_msg *hdr;
1188*4882a593Smuzhiyun 	int user, mtyp, hlen;
1189*4882a593Smuzhiyun 	bool exact;
1190*4882a593Smuzhiyun 
1191*4882a593Smuzhiyun 	__skb_queue_head_init(&tmpq);
1192*4882a593Smuzhiyun 	INIT_LIST_HEAD(&dports);
1193*4882a593Smuzhiyun 
1194*4882a593Smuzhiyun 	skb = tipc_skb_peek(arrvq, &inputq->lock);
1195*4882a593Smuzhiyun 	for (; skb; skb = tipc_skb_peek(arrvq, &inputq->lock)) {
1196*4882a593Smuzhiyun 		hdr = buf_msg(skb);
1197*4882a593Smuzhiyun 		user = msg_user(hdr);
1198*4882a593Smuzhiyun 		mtyp = msg_type(hdr);
1199*4882a593Smuzhiyun 		hlen = skb_headroom(skb) + msg_hdr_sz(hdr);
1200*4882a593Smuzhiyun 		onode = msg_orignode(hdr);
1201*4882a593Smuzhiyun 		type = msg_nametype(hdr);
1202*4882a593Smuzhiyun 
1203*4882a593Smuzhiyun 		if (mtyp == TIPC_GRP_UCAST_MSG || user == GROUP_PROTOCOL) {
1204*4882a593Smuzhiyun 			spin_lock_bh(&inputq->lock);
1205*4882a593Smuzhiyun 			if (skb_peek(arrvq) == skb) {
1206*4882a593Smuzhiyun 				__skb_dequeue(arrvq);
1207*4882a593Smuzhiyun 				__skb_queue_tail(inputq, skb);
1208*4882a593Smuzhiyun 			}
1209*4882a593Smuzhiyun 			kfree_skb(skb);
1210*4882a593Smuzhiyun 			spin_unlock_bh(&inputq->lock);
1211*4882a593Smuzhiyun 			continue;
1212*4882a593Smuzhiyun 		}
1213*4882a593Smuzhiyun 
1214*4882a593Smuzhiyun 		/* Group messages require exact scope match */
1215*4882a593Smuzhiyun 		if (msg_in_group(hdr)) {
1216*4882a593Smuzhiyun 			lower = 0;
1217*4882a593Smuzhiyun 			upper = ~0;
1218*4882a593Smuzhiyun 			scope = msg_lookup_scope(hdr);
1219*4882a593Smuzhiyun 			exact = true;
1220*4882a593Smuzhiyun 		} else {
1221*4882a593Smuzhiyun 			/* TIPC_NODE_SCOPE means "any scope" in this context */
1222*4882a593Smuzhiyun 			if (onode == self)
1223*4882a593Smuzhiyun 				scope = TIPC_NODE_SCOPE;
1224*4882a593Smuzhiyun 			else
1225*4882a593Smuzhiyun 				scope = TIPC_CLUSTER_SCOPE;
1226*4882a593Smuzhiyun 			exact = false;
1227*4882a593Smuzhiyun 			lower = msg_namelower(hdr);
1228*4882a593Smuzhiyun 			upper = msg_nameupper(hdr);
1229*4882a593Smuzhiyun 		}
1230*4882a593Smuzhiyun 
1231*4882a593Smuzhiyun 		/* Create destination port list: */
1232*4882a593Smuzhiyun 		tipc_nametbl_mc_lookup(net, type, lower, upper,
1233*4882a593Smuzhiyun 				       scope, exact, &dports);
1234*4882a593Smuzhiyun 
1235*4882a593Smuzhiyun 		/* Clone message per destination */
1236*4882a593Smuzhiyun 		while (tipc_dest_pop(&dports, NULL, &portid)) {
1237*4882a593Smuzhiyun 			_skb = __pskb_copy(skb, hlen, GFP_ATOMIC);
1238*4882a593Smuzhiyun 			if (_skb) {
1239*4882a593Smuzhiyun 				msg_set_destport(buf_msg(_skb), portid);
1240*4882a593Smuzhiyun 				__skb_queue_tail(&tmpq, _skb);
1241*4882a593Smuzhiyun 				continue;
1242*4882a593Smuzhiyun 			}
1243*4882a593Smuzhiyun 			pr_warn("Failed to clone mcast rcv buffer\n");
1244*4882a593Smuzhiyun 		}
1245*4882a593Smuzhiyun 		/* Append to inputq if not already done by other thread */
1246*4882a593Smuzhiyun 		spin_lock_bh(&inputq->lock);
1247*4882a593Smuzhiyun 		if (skb_peek(arrvq) == skb) {
1248*4882a593Smuzhiyun 			skb_queue_splice_tail_init(&tmpq, inputq);
1249*4882a593Smuzhiyun 			/* Decrease the skb's refcnt as increasing in the
1250*4882a593Smuzhiyun 			 * function tipc_skb_peek
1251*4882a593Smuzhiyun 			 */
1252*4882a593Smuzhiyun 			kfree_skb(__skb_dequeue(arrvq));
1253*4882a593Smuzhiyun 		}
1254*4882a593Smuzhiyun 		spin_unlock_bh(&inputq->lock);
1255*4882a593Smuzhiyun 		__skb_queue_purge(&tmpq);
1256*4882a593Smuzhiyun 		kfree_skb(skb);
1257*4882a593Smuzhiyun 	}
1258*4882a593Smuzhiyun 	tipc_sk_rcv(net, inputq);
1259*4882a593Smuzhiyun }
1260*4882a593Smuzhiyun 
1261*4882a593Smuzhiyun /* tipc_sk_push_backlog(): send accumulated buffers in socket write queue
1262*4882a593Smuzhiyun  *                         when socket is in Nagle mode
1263*4882a593Smuzhiyun  */
tipc_sk_push_backlog(struct tipc_sock * tsk,bool nagle_ack)1264*4882a593Smuzhiyun static void tipc_sk_push_backlog(struct tipc_sock *tsk, bool nagle_ack)
1265*4882a593Smuzhiyun {
1266*4882a593Smuzhiyun 	struct sk_buff_head *txq = &tsk->sk.sk_write_queue;
1267*4882a593Smuzhiyun 	struct sk_buff *skb = skb_peek_tail(txq);
1268*4882a593Smuzhiyun 	struct net *net = sock_net(&tsk->sk);
1269*4882a593Smuzhiyun 	u32 dnode = tsk_peer_node(tsk);
1270*4882a593Smuzhiyun 	int rc;
1271*4882a593Smuzhiyun 
1272*4882a593Smuzhiyun 	if (nagle_ack) {
1273*4882a593Smuzhiyun 		tsk->pkt_cnt += skb_queue_len(txq);
1274*4882a593Smuzhiyun 		if (!tsk->pkt_cnt || tsk->msg_acc / tsk->pkt_cnt < 2) {
1275*4882a593Smuzhiyun 			tsk->oneway = 0;
1276*4882a593Smuzhiyun 			if (tsk->nagle_start < NAGLE_START_MAX)
1277*4882a593Smuzhiyun 				tsk->nagle_start *= 2;
1278*4882a593Smuzhiyun 			tsk->expect_ack = false;
1279*4882a593Smuzhiyun 			pr_debug("tsk %10u: bad nagle %u -> %u, next start %u!\n",
1280*4882a593Smuzhiyun 				 tsk->portid, tsk->msg_acc, tsk->pkt_cnt,
1281*4882a593Smuzhiyun 				 tsk->nagle_start);
1282*4882a593Smuzhiyun 		} else {
1283*4882a593Smuzhiyun 			tsk->nagle_start = NAGLE_START_INIT;
1284*4882a593Smuzhiyun 			if (skb) {
1285*4882a593Smuzhiyun 				msg_set_ack_required(buf_msg(skb));
1286*4882a593Smuzhiyun 				tsk->expect_ack = true;
1287*4882a593Smuzhiyun 			} else {
1288*4882a593Smuzhiyun 				tsk->expect_ack = false;
1289*4882a593Smuzhiyun 			}
1290*4882a593Smuzhiyun 		}
1291*4882a593Smuzhiyun 		tsk->msg_acc = 0;
1292*4882a593Smuzhiyun 		tsk->pkt_cnt = 0;
1293*4882a593Smuzhiyun 	}
1294*4882a593Smuzhiyun 
1295*4882a593Smuzhiyun 	if (!skb || tsk->cong_link_cnt)
1296*4882a593Smuzhiyun 		return;
1297*4882a593Smuzhiyun 
1298*4882a593Smuzhiyun 	/* Do not send SYN again after congestion */
1299*4882a593Smuzhiyun 	if (msg_is_syn(buf_msg(skb)))
1300*4882a593Smuzhiyun 		return;
1301*4882a593Smuzhiyun 
1302*4882a593Smuzhiyun 	if (tsk->msg_acc)
1303*4882a593Smuzhiyun 		tsk->pkt_cnt += skb_queue_len(txq);
1304*4882a593Smuzhiyun 	tsk->snt_unacked += tsk->snd_backlog;
1305*4882a593Smuzhiyun 	tsk->snd_backlog = 0;
1306*4882a593Smuzhiyun 	rc = tipc_node_xmit(net, txq, dnode, tsk->portid);
1307*4882a593Smuzhiyun 	if (rc == -ELINKCONG)
1308*4882a593Smuzhiyun 		tsk->cong_link_cnt = 1;
1309*4882a593Smuzhiyun }
1310*4882a593Smuzhiyun 
1311*4882a593Smuzhiyun /**
1312*4882a593Smuzhiyun  * tipc_sk_conn_proto_rcv - receive a connection mng protocol message
1313*4882a593Smuzhiyun  * @tsk: receiving socket
1314*4882a593Smuzhiyun  * @skb: pointer to message buffer.
1315*4882a593Smuzhiyun  */
tipc_sk_conn_proto_rcv(struct tipc_sock * tsk,struct sk_buff * skb,struct sk_buff_head * inputq,struct sk_buff_head * xmitq)1316*4882a593Smuzhiyun static void tipc_sk_conn_proto_rcv(struct tipc_sock *tsk, struct sk_buff *skb,
1317*4882a593Smuzhiyun 				   struct sk_buff_head *inputq,
1318*4882a593Smuzhiyun 				   struct sk_buff_head *xmitq)
1319*4882a593Smuzhiyun {
1320*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
1321*4882a593Smuzhiyun 	u32 onode = tsk_own_node(tsk);
1322*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
1323*4882a593Smuzhiyun 	int mtyp = msg_type(hdr);
1324*4882a593Smuzhiyun 	bool was_cong;
1325*4882a593Smuzhiyun 
1326*4882a593Smuzhiyun 	/* Ignore if connection cannot be validated: */
1327*4882a593Smuzhiyun 	if (!tsk_peer_msg(tsk, hdr)) {
1328*4882a593Smuzhiyun 		trace_tipc_sk_drop_msg(sk, skb, TIPC_DUMP_NONE, "@proto_rcv!");
1329*4882a593Smuzhiyun 		goto exit;
1330*4882a593Smuzhiyun 	}
1331*4882a593Smuzhiyun 
1332*4882a593Smuzhiyun 	if (unlikely(msg_errcode(hdr))) {
1333*4882a593Smuzhiyun 		tipc_set_sk_state(sk, TIPC_DISCONNECTING);
1334*4882a593Smuzhiyun 		tipc_node_remove_conn(sock_net(sk), tsk_peer_node(tsk),
1335*4882a593Smuzhiyun 				      tsk_peer_port(tsk));
1336*4882a593Smuzhiyun 		sk->sk_state_change(sk);
1337*4882a593Smuzhiyun 
1338*4882a593Smuzhiyun 		/* State change is ignored if socket already awake,
1339*4882a593Smuzhiyun 		 * - convert msg to abort msg and add to inqueue
1340*4882a593Smuzhiyun 		 */
1341*4882a593Smuzhiyun 		msg_set_user(hdr, TIPC_CRITICAL_IMPORTANCE);
1342*4882a593Smuzhiyun 		msg_set_type(hdr, TIPC_CONN_MSG);
1343*4882a593Smuzhiyun 		msg_set_size(hdr, BASIC_H_SIZE);
1344*4882a593Smuzhiyun 		msg_set_hdr_sz(hdr, BASIC_H_SIZE);
1345*4882a593Smuzhiyun 		__skb_queue_tail(inputq, skb);
1346*4882a593Smuzhiyun 		return;
1347*4882a593Smuzhiyun 	}
1348*4882a593Smuzhiyun 
1349*4882a593Smuzhiyun 	tsk->probe_unacked = false;
1350*4882a593Smuzhiyun 
1351*4882a593Smuzhiyun 	if (mtyp == CONN_PROBE) {
1352*4882a593Smuzhiyun 		msg_set_type(hdr, CONN_PROBE_REPLY);
1353*4882a593Smuzhiyun 		if (tipc_msg_reverse(onode, &skb, TIPC_OK))
1354*4882a593Smuzhiyun 			__skb_queue_tail(xmitq, skb);
1355*4882a593Smuzhiyun 		return;
1356*4882a593Smuzhiyun 	} else if (mtyp == CONN_ACK) {
1357*4882a593Smuzhiyun 		was_cong = tsk_conn_cong(tsk);
1358*4882a593Smuzhiyun 		tipc_sk_push_backlog(tsk, msg_nagle_ack(hdr));
1359*4882a593Smuzhiyun 		tsk->snt_unacked -= msg_conn_ack(hdr);
1360*4882a593Smuzhiyun 		if (tsk->peer_caps & TIPC_BLOCK_FLOWCTL)
1361*4882a593Smuzhiyun 			tsk->snd_win = msg_adv_win(hdr);
1362*4882a593Smuzhiyun 		if (was_cong && !tsk_conn_cong(tsk))
1363*4882a593Smuzhiyun 			sk->sk_write_space(sk);
1364*4882a593Smuzhiyun 	} else if (mtyp != CONN_PROBE_REPLY) {
1365*4882a593Smuzhiyun 		pr_warn("Received unknown CONN_PROTO msg\n");
1366*4882a593Smuzhiyun 	}
1367*4882a593Smuzhiyun exit:
1368*4882a593Smuzhiyun 	kfree_skb(skb);
1369*4882a593Smuzhiyun }
1370*4882a593Smuzhiyun 
1371*4882a593Smuzhiyun /**
1372*4882a593Smuzhiyun  * tipc_sendmsg - send message in connectionless manner
1373*4882a593Smuzhiyun  * @sock: socket structure
1374*4882a593Smuzhiyun  * @m: message to send
1375*4882a593Smuzhiyun  * @dsz: amount of user data to be sent
1376*4882a593Smuzhiyun  *
1377*4882a593Smuzhiyun  * Message must have an destination specified explicitly.
1378*4882a593Smuzhiyun  * Used for SOCK_RDM and SOCK_DGRAM messages,
1379*4882a593Smuzhiyun  * and for 'SYN' messages on SOCK_SEQPACKET and SOCK_STREAM connections.
1380*4882a593Smuzhiyun  * (Note: 'SYN+' is prohibited on SOCK_STREAM.)
1381*4882a593Smuzhiyun  *
1382*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno otherwise
1383*4882a593Smuzhiyun  */
tipc_sendmsg(struct socket * sock,struct msghdr * m,size_t dsz)1384*4882a593Smuzhiyun static int tipc_sendmsg(struct socket *sock,
1385*4882a593Smuzhiyun 			struct msghdr *m, size_t dsz)
1386*4882a593Smuzhiyun {
1387*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1388*4882a593Smuzhiyun 	int ret;
1389*4882a593Smuzhiyun 
1390*4882a593Smuzhiyun 	lock_sock(sk);
1391*4882a593Smuzhiyun 	ret = __tipc_sendmsg(sock, m, dsz);
1392*4882a593Smuzhiyun 	release_sock(sk);
1393*4882a593Smuzhiyun 
1394*4882a593Smuzhiyun 	return ret;
1395*4882a593Smuzhiyun }
1396*4882a593Smuzhiyun 
/* __tipc_sendmsg(): body of tipc_sendmsg()
 * @sock: socket structure
 * @m: message to send; m->msg_name optionally holds the destination
 * @dlen: amount of user data to be sent
 *
 * tipc_sendmsg() calls this between lock_sock() and release_sock().
 * Group sockets and multicast destinations are delegated to their own
 * send routines; name and id destinations are built and transmitted here.
 *
 * Returns @dlen on success, or a negative errno.
 */
static int __tipc_sendmsg(struct socket *sock, struct msghdr *m, size_t dlen)
{
	struct sock *sk = sock->sk;
	struct net *net = sock_net(sk);
	struct tipc_sock *tsk = tipc_sk(sk);
	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
	long timeout = sock_sndtimeo(sk, m->msg_flags & MSG_DONTWAIT);
	struct list_head *cong_dests = &tsk->cong_links;
	bool syn = !tipc_sk_type_connectionless(sk);
	struct tipc_group *grp = tsk->group;
	struct tipc_msg *hdr = &tsk->phdr;
	struct sk_buff_head xmitq;
	u32 dport = 0, dnode = 0;
	u32 type = 0, inst = 0;
	int mtu, rc;

	if (unlikely(dlen > TIPC_MAX_USER_MSG_SIZE))
		return -EMSGSIZE;

	/* A supplied address must be complete and of the TIPC family */
	if (likely(dest)) {
		bool too_short = m->msg_namelen < sizeof(*dest);

		if (unlikely(too_short || dest->family != AF_TIPC))
			return -EINVAL;
	}

	/* Group members: the address type selects the group send routine */
	if (grp) {
		if (!dest)
			return tipc_send_group_bcast(sock, m, dlen, timeout);
		if (dest->addrtype == TIPC_ADDR_NAME)
			return tipc_send_group_anycast(sock, m, dlen, timeout);
		if (dest->addrtype == TIPC_ADDR_ID)
			return tipc_send_group_unicast(sock, m, dlen, timeout);
		if (dest->addrtype == TIPC_ADDR_MCAST)
			return tipc_send_group_mcast(sock, m, dlen, timeout);
		return -EINVAL;
	}

	/* No explicit destination: fall back to the stored peer address */
	if (unlikely(!dest)) {
		dest = &tsk->peer;
		if (!syn && dest->family != AF_TIPC)
			return -EDESTADDRREQ;
	}

	/* Connection oriented socket: this message is a connection request */
	if (unlikely(syn)) {
		if (sk->sk_state == TIPC_LISTEN)
			return -EPIPE;
		if (sk->sk_state != TIPC_OPEN)
			return -EISCONN;
		if (tsk->published)
			return -EOPNOTSUPP;
		if (dest->addrtype == TIPC_ADDR_NAME) {
			tsk->conn_type = dest->addr.name.name.type;
			tsk->conn_instance = dest->addr.name.name.instance;
		}
		msg_set_syn(hdr, 1);
	}

	if (dest->addrtype == TIPC_ADDR_MCAST)
		return tipc_sendmcast(sock, &dest->addr.nameseq, m, dlen,
				      timeout);

	/* Resolve the destination node (and port, for a name address) */
	if (dest->addrtype == TIPC_ADDR_NAME) {
		type = dest->addr.name.name.type;
		inst = dest->addr.name.name.instance;
		dnode = dest->addr.name.domain;
		dport = tipc_nametbl_translate(net, type, inst, &dnode);
		if (unlikely(!dport && !dnode))
			return -EHOSTUNREACH;
	} else if (dest->addrtype == TIPC_ADDR_ID) {
		dnode = dest->addr.id.node;
	} else {
		return -EINVAL;
	}

	/* Block or return if destination link is congested */
	rc = tipc_wait_for_cond(sock, &timeout,
				!tipc_dest_find(cong_dests, dnode, 0));
	if (unlikely(rc))
		return rc;

	/* The address type is deliberately read again after the wait */
	if (dest->addrtype == TIPC_ADDR_NAME) {
		msg_set_type(hdr, TIPC_NAMED_MSG);
		msg_set_hdr_sz(hdr, NAMED_H_SIZE);
		msg_set_nametype(hdr, type);
		msg_set_nameinst(hdr, inst);
		msg_set_lookup_scope(hdr, tipc_node2scope(dnode));
		msg_set_destnode(hdr, dnode);
		msg_set_destport(hdr, dport);
	} else { /* TIPC_ADDR_ID */
		msg_set_type(hdr, TIPC_DIRECT_MSG);
		msg_set_lookup_scope(hdr, 0);
		msg_set_destnode(hdr, dnode);
		msg_set_destport(hdr, dest->addr.id.ref);
		msg_set_hdr_sz(hdr, BASIC_H_SIZE);
	}

	__skb_queue_head_init(&xmitq);
	mtu = tipc_node_get_mtu(net, dnode, tsk->portid, true);
	rc = tipc_msg_build(hdr, m, 0, dlen, mtu, &xmitq);
	if (unlikely(rc != dlen))
		return rc;

	/* For a SYN, also put a clone of the packets on the write queue */
	if (unlikely(syn && !tipc_msg_skb_clone(&xmitq, &sk->sk_write_queue))) {
		__skb_queue_purge(&xmitq);
		return -ENOMEM;
	}

	trace_tipc_sk_sendmsg(sk, skb_peek(&xmitq), TIPC_DUMP_SK_SNDQ, " ");
	rc = tipc_node_xmit(net, &xmitq, dnode, tsk->portid);
	if (unlikely(rc == -ELINKCONG)) {
		/* Remember the congested node; not reported as an error */
		tipc_dest_push(cong_dests, dnode, 0);
		tsk->cong_link_cnt++;
		rc = 0;
	}

	if (unlikely(syn && !rc)) {
		tipc_set_sk_state(sk, TIPC_CONNECTING);
		if (dlen && timeout) {
			/* NOTE(review): timeout was obtained from
			 * sock_sndtimeo() above; confirm that it really is
			 * in milliseconds at this point before it is
			 * converted with msecs_to_jiffies().
			 */
			timeout = msecs_to_jiffies(timeout);
			tipc_wait_for_connect(sock, &timeout);
		}
	}

	if (rc)
		return rc;
	return dlen;
}
1523*4882a593Smuzhiyun 
1524*4882a593Smuzhiyun /**
1525*4882a593Smuzhiyun  * tipc_sendstream - send stream-oriented data
1526*4882a593Smuzhiyun  * @sock: socket structure
1527*4882a593Smuzhiyun  * @m: data to send
1528*4882a593Smuzhiyun  * @dsz: total length of data to be transmitted
1529*4882a593Smuzhiyun  *
1530*4882a593Smuzhiyun  * Used for SOCK_STREAM data.
1531*4882a593Smuzhiyun  *
1532*4882a593Smuzhiyun  * Returns the number of bytes sent on success (or partial success),
1533*4882a593Smuzhiyun  * or errno if no data sent
1534*4882a593Smuzhiyun  */
tipc_sendstream(struct socket * sock,struct msghdr * m,size_t dsz)1535*4882a593Smuzhiyun static int tipc_sendstream(struct socket *sock, struct msghdr *m, size_t dsz)
1536*4882a593Smuzhiyun {
1537*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1538*4882a593Smuzhiyun 	int ret;
1539*4882a593Smuzhiyun 
1540*4882a593Smuzhiyun 	lock_sock(sk);
1541*4882a593Smuzhiyun 	ret = __tipc_sendstream(sock, m, dsz);
1542*4882a593Smuzhiyun 	release_sock(sk);
1543*4882a593Smuzhiyun 
1544*4882a593Smuzhiyun 	return ret;
1545*4882a593Smuzhiyun }
1546*4882a593Smuzhiyun 
/* __tipc_sendstream(): body of tipc_sendstream()
 * @sock: socket structure
 * @m: data to send
 * @dlen: total length of data to be transmitted
 *
 * tipc_sendstream() calls this between lock_sock() and release_sock().
 * The data is sent in chunks of at most TIPC_MAX_USER_MSG_SIZE bytes; a
 * chunk is either appended to the write queue via tipc_msg_append() (the
 * Nagle path) or built as a message of its own.
 *
 * Returns the number of bytes accepted if that is non-zero, otherwise the
 * last result code.
 */
static int __tipc_sendstream(struct socket *sock, struct msghdr *m, size_t dlen)
{
	struct sock *sk = sock->sk;
	DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
	long timeout = sock_sndtimeo(sk, m->msg_flags & MSG_DONTWAIT);
	struct sk_buff_head *txq = &sk->sk_write_queue;
	struct tipc_sock *tsk = tipc_sk(sk);
	struct tipc_msg *hdr = &tsk->phdr;
	struct net *net = sock_net(sk);
	struct sk_buff *tail;
	u32 dnode = tsk_peer_node(tsk);
	int maxnagle = tsk->maxnagle;
	int maxpkt = tsk->max_pkt;
	int send, sent = 0;
	int blocks, rc = 0;

	if (unlikely(dlen > INT_MAX))
		return -EMSGSIZE;

	/* Handle implicit connection setup */
	if (unlikely(dest && sk->sk_state == TIPC_OPEN)) {
		rc = __tipc_sendmsg(sock, m, dlen);
		if (dlen && dlen == rc) {
			tsk->peer_caps = tipc_node_get_capabilities(net, dnode);
			tsk->snt_unacked = tsk_inc(tsk, dlen + msg_hdr_sz(hdr));
		}
		return rc;
	}

	do {
		/* Wait until connected and neither link nor peer congested */
		rc = tipc_wait_for_cond(sock, &timeout,
					(!tsk->cong_link_cnt &&
					 !tsk_conn_cong(tsk) &&
					 tipc_sk_connected(sk)));
		if (unlikely(rc))
			break;

		send = min_t(size_t, dlen - sent, TIPC_MAX_USER_MSG_SIZE);
		blocks = tsk->snd_backlog;

		if (tsk->oneway++ >= tsk->nagle_start && maxnagle &&
		    send <= maxnagle) {
			/* Nagle path: add the chunk to the write queue */
			rc = tipc_msg_append(hdr, m, send, maxnagle, txq);
			if (unlikely(rc < 0))
				break;
			blocks += rc;
			tsk->msg_acc++;

			if (blocks > 64) {
				/* Backlog too large: send it now */
				tsk->pkt_cnt += skb_queue_len(txq);
			} else if (tsk->expect_ack) {
				/* An ack is outstanding: hold the data back */
				tsk->snd_backlog = blocks;
				sent += send;
				break;
			} else {
				/* Send now and request an ack on the tail */
				tail = skb_peek_tail(txq);
				if (tail)
					msg_set_ack_required(buf_msg(tail));
				tsk->expect_ack = !!tail;
				tsk->msg_acc = 0;
				tsk->pkt_cnt = 0;
			}
		} else {
			/* Regular path: one message per chunk */
			rc = tipc_msg_build(hdr, m, sent, send, maxpkt, txq);
			if (unlikely(rc != send))
				break;
			blocks += tsk_inc(tsk, send + MIN_H_SIZE);
		}

		trace_tipc_sk_sendstream(sk, skb_peek(txq),
					 TIPC_DUMP_SK_SNDQ, " ");
		rc = tipc_node_xmit(net, txq, dnode, tsk->portid);
		if (unlikely(rc == -ELINKCONG)) {
			/* Flag the congestion; not reported as an error */
			tsk->cong_link_cnt = 1;
			rc = 0;
		}
		if (likely(!rc)) {
			tsk->snt_unacked += blocks;
			tsk->snd_backlog = 0;
			sent += send;
		}
	} while (sent < dlen && !rc);

	if (sent)
		return sent;
	return rc;
}
1631*4882a593Smuzhiyun 
1632*4882a593Smuzhiyun /**
1633*4882a593Smuzhiyun  * tipc_send_packet - send a connection-oriented message
1634*4882a593Smuzhiyun  * @sock: socket structure
1635*4882a593Smuzhiyun  * @m: message to send
1636*4882a593Smuzhiyun  * @dsz: length of data to be transmitted
1637*4882a593Smuzhiyun  *
1638*4882a593Smuzhiyun  * Used for SOCK_SEQPACKET messages.
1639*4882a593Smuzhiyun  *
1640*4882a593Smuzhiyun  * Returns the number of bytes sent on success, or errno otherwise
1641*4882a593Smuzhiyun  */
tipc_send_packet(struct socket * sock,struct msghdr * m,size_t dsz)1642*4882a593Smuzhiyun static int tipc_send_packet(struct socket *sock, struct msghdr *m, size_t dsz)
1643*4882a593Smuzhiyun {
1644*4882a593Smuzhiyun 	if (dsz > TIPC_MAX_USER_MSG_SIZE)
1645*4882a593Smuzhiyun 		return -EMSGSIZE;
1646*4882a593Smuzhiyun 
1647*4882a593Smuzhiyun 	return tipc_sendstream(sock, m, dsz);
1648*4882a593Smuzhiyun }
1649*4882a593Smuzhiyun 
1650*4882a593Smuzhiyun /* tipc_sk_finish_conn - complete the setup of a connection
1651*4882a593Smuzhiyun  */
tipc_sk_finish_conn(struct tipc_sock * tsk,u32 peer_port,u32 peer_node)1652*4882a593Smuzhiyun static void tipc_sk_finish_conn(struct tipc_sock *tsk, u32 peer_port,
1653*4882a593Smuzhiyun 				u32 peer_node)
1654*4882a593Smuzhiyun {
1655*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
1656*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
1657*4882a593Smuzhiyun 	struct tipc_msg *msg = &tsk->phdr;
1658*4882a593Smuzhiyun 
1659*4882a593Smuzhiyun 	msg_set_syn(msg, 0);
1660*4882a593Smuzhiyun 	msg_set_destnode(msg, peer_node);
1661*4882a593Smuzhiyun 	msg_set_destport(msg, peer_port);
1662*4882a593Smuzhiyun 	msg_set_type(msg, TIPC_CONN_MSG);
1663*4882a593Smuzhiyun 	msg_set_lookup_scope(msg, 0);
1664*4882a593Smuzhiyun 	msg_set_hdr_sz(msg, SHORT_H_SIZE);
1665*4882a593Smuzhiyun 
1666*4882a593Smuzhiyun 	sk_reset_timer(sk, &sk->sk_timer, jiffies + CONN_PROBING_INTV);
1667*4882a593Smuzhiyun 	tipc_set_sk_state(sk, TIPC_ESTABLISHED);
1668*4882a593Smuzhiyun 	tipc_node_add_conn(net, peer_node, tsk->portid, peer_port);
1669*4882a593Smuzhiyun 	tsk->max_pkt = tipc_node_get_mtu(net, peer_node, tsk->portid, true);
1670*4882a593Smuzhiyun 	tsk->peer_caps = tipc_node_get_capabilities(net, peer_node);
1671*4882a593Smuzhiyun 	tsk_set_nagle(tsk);
1672*4882a593Smuzhiyun 	__skb_queue_purge(&sk->sk_write_queue);
1673*4882a593Smuzhiyun 	if (tsk->peer_caps & TIPC_BLOCK_FLOWCTL)
1674*4882a593Smuzhiyun 		return;
1675*4882a593Smuzhiyun 
1676*4882a593Smuzhiyun 	/* Fall back to message based flow control */
1677*4882a593Smuzhiyun 	tsk->rcv_win = FLOWCTL_MSG_WIN;
1678*4882a593Smuzhiyun 	tsk->snd_win = FLOWCTL_MSG_WIN;
1679*4882a593Smuzhiyun }
1680*4882a593Smuzhiyun 
1681*4882a593Smuzhiyun /**
1682*4882a593Smuzhiyun  * tipc_sk_set_orig_addr - capture sender's address for received message
1683*4882a593Smuzhiyun  * @m: descriptor for message info
1684*4882a593Smuzhiyun  * @skb: received message
1685*4882a593Smuzhiyun  *
1686*4882a593Smuzhiyun  * Note: Address is not captured if not requested by receiver.
1687*4882a593Smuzhiyun  */
tipc_sk_set_orig_addr(struct msghdr * m,struct sk_buff * skb)1688*4882a593Smuzhiyun static void tipc_sk_set_orig_addr(struct msghdr *m, struct sk_buff *skb)
1689*4882a593Smuzhiyun {
1690*4882a593Smuzhiyun 	DECLARE_SOCKADDR(struct sockaddr_pair *, srcaddr, m->msg_name);
1691*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
1692*4882a593Smuzhiyun 
1693*4882a593Smuzhiyun 	if (!srcaddr)
1694*4882a593Smuzhiyun 		return;
1695*4882a593Smuzhiyun 
1696*4882a593Smuzhiyun 	srcaddr->sock.family = AF_TIPC;
1697*4882a593Smuzhiyun 	srcaddr->sock.addrtype = TIPC_ADDR_ID;
1698*4882a593Smuzhiyun 	srcaddr->sock.scope = 0;
1699*4882a593Smuzhiyun 	srcaddr->sock.addr.id.ref = msg_origport(hdr);
1700*4882a593Smuzhiyun 	srcaddr->sock.addr.id.node = msg_orignode(hdr);
1701*4882a593Smuzhiyun 	srcaddr->sock.addr.name.domain = 0;
1702*4882a593Smuzhiyun 	m->msg_namelen = sizeof(struct sockaddr_tipc);
1703*4882a593Smuzhiyun 
1704*4882a593Smuzhiyun 	if (!msg_in_group(hdr))
1705*4882a593Smuzhiyun 		return;
1706*4882a593Smuzhiyun 
1707*4882a593Smuzhiyun 	/* Group message users may also want to know sending member's id */
1708*4882a593Smuzhiyun 	srcaddr->member.family = AF_TIPC;
1709*4882a593Smuzhiyun 	srcaddr->member.addrtype = TIPC_ADDR_NAME;
1710*4882a593Smuzhiyun 	srcaddr->member.scope = 0;
1711*4882a593Smuzhiyun 	srcaddr->member.addr.name.name.type = msg_nametype(hdr);
1712*4882a593Smuzhiyun 	srcaddr->member.addr.name.name.instance = TIPC_SKB_CB(skb)->orig_member;
1713*4882a593Smuzhiyun 	srcaddr->member.addr.name.domain = 0;
1714*4882a593Smuzhiyun 	m->msg_namelen = sizeof(*srcaddr);
1715*4882a593Smuzhiyun }
1716*4882a593Smuzhiyun 
1717*4882a593Smuzhiyun /**
1718*4882a593Smuzhiyun  * tipc_sk_anc_data_recv - optionally capture ancillary data for received message
1719*4882a593Smuzhiyun  * @m: descriptor for message info
1720*4882a593Smuzhiyun  * @skb: received message buffer
1721*4882a593Smuzhiyun  * @tsk: TIPC port associated with message
1722*4882a593Smuzhiyun  *
1723*4882a593Smuzhiyun  * Note: Ancillary data is not captured if not requested by receiver.
1724*4882a593Smuzhiyun  *
1725*4882a593Smuzhiyun  * Returns 0 if successful, otherwise errno
1726*4882a593Smuzhiyun  */
tipc_sk_anc_data_recv(struct msghdr * m,struct sk_buff * skb,struct tipc_sock * tsk)1727*4882a593Smuzhiyun static int tipc_sk_anc_data_recv(struct msghdr *m, struct sk_buff *skb,
1728*4882a593Smuzhiyun 				 struct tipc_sock *tsk)
1729*4882a593Smuzhiyun {
1730*4882a593Smuzhiyun 	struct tipc_msg *msg;
1731*4882a593Smuzhiyun 	u32 anc_data[3];
1732*4882a593Smuzhiyun 	u32 err;
1733*4882a593Smuzhiyun 	u32 dest_type;
1734*4882a593Smuzhiyun 	int has_name;
1735*4882a593Smuzhiyun 	int res;
1736*4882a593Smuzhiyun 
1737*4882a593Smuzhiyun 	if (likely(m->msg_controllen == 0))
1738*4882a593Smuzhiyun 		return 0;
1739*4882a593Smuzhiyun 	msg = buf_msg(skb);
1740*4882a593Smuzhiyun 
1741*4882a593Smuzhiyun 	/* Optionally capture errored message object(s) */
1742*4882a593Smuzhiyun 	err = msg ? msg_errcode(msg) : 0;
1743*4882a593Smuzhiyun 	if (unlikely(err)) {
1744*4882a593Smuzhiyun 		anc_data[0] = err;
1745*4882a593Smuzhiyun 		anc_data[1] = msg_data_sz(msg);
1746*4882a593Smuzhiyun 		res = put_cmsg(m, SOL_TIPC, TIPC_ERRINFO, 8, anc_data);
1747*4882a593Smuzhiyun 		if (res)
1748*4882a593Smuzhiyun 			return res;
1749*4882a593Smuzhiyun 		if (anc_data[1]) {
1750*4882a593Smuzhiyun 			if (skb_linearize(skb))
1751*4882a593Smuzhiyun 				return -ENOMEM;
1752*4882a593Smuzhiyun 			msg = buf_msg(skb);
1753*4882a593Smuzhiyun 			res = put_cmsg(m, SOL_TIPC, TIPC_RETDATA, anc_data[1],
1754*4882a593Smuzhiyun 				       msg_data(msg));
1755*4882a593Smuzhiyun 			if (res)
1756*4882a593Smuzhiyun 				return res;
1757*4882a593Smuzhiyun 		}
1758*4882a593Smuzhiyun 	}
1759*4882a593Smuzhiyun 
1760*4882a593Smuzhiyun 	/* Optionally capture message destination object */
1761*4882a593Smuzhiyun 	dest_type = msg ? msg_type(msg) : TIPC_DIRECT_MSG;
1762*4882a593Smuzhiyun 	switch (dest_type) {
1763*4882a593Smuzhiyun 	case TIPC_NAMED_MSG:
1764*4882a593Smuzhiyun 		has_name = 1;
1765*4882a593Smuzhiyun 		anc_data[0] = msg_nametype(msg);
1766*4882a593Smuzhiyun 		anc_data[1] = msg_namelower(msg);
1767*4882a593Smuzhiyun 		anc_data[2] = msg_namelower(msg);
1768*4882a593Smuzhiyun 		break;
1769*4882a593Smuzhiyun 	case TIPC_MCAST_MSG:
1770*4882a593Smuzhiyun 		has_name = 1;
1771*4882a593Smuzhiyun 		anc_data[0] = msg_nametype(msg);
1772*4882a593Smuzhiyun 		anc_data[1] = msg_namelower(msg);
1773*4882a593Smuzhiyun 		anc_data[2] = msg_nameupper(msg);
1774*4882a593Smuzhiyun 		break;
1775*4882a593Smuzhiyun 	case TIPC_CONN_MSG:
1776*4882a593Smuzhiyun 		has_name = (tsk->conn_type != 0);
1777*4882a593Smuzhiyun 		anc_data[0] = tsk->conn_type;
1778*4882a593Smuzhiyun 		anc_data[1] = tsk->conn_instance;
1779*4882a593Smuzhiyun 		anc_data[2] = tsk->conn_instance;
1780*4882a593Smuzhiyun 		break;
1781*4882a593Smuzhiyun 	default:
1782*4882a593Smuzhiyun 		has_name = 0;
1783*4882a593Smuzhiyun 	}
1784*4882a593Smuzhiyun 	if (has_name) {
1785*4882a593Smuzhiyun 		res = put_cmsg(m, SOL_TIPC, TIPC_DESTNAME, 12, anc_data);
1786*4882a593Smuzhiyun 		if (res)
1787*4882a593Smuzhiyun 			return res;
1788*4882a593Smuzhiyun 	}
1789*4882a593Smuzhiyun 
1790*4882a593Smuzhiyun 	return 0;
1791*4882a593Smuzhiyun }
1792*4882a593Smuzhiyun 
tipc_sk_build_ack(struct tipc_sock * tsk)1793*4882a593Smuzhiyun static struct sk_buff *tipc_sk_build_ack(struct tipc_sock *tsk)
1794*4882a593Smuzhiyun {
1795*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
1796*4882a593Smuzhiyun 	struct sk_buff *skb = NULL;
1797*4882a593Smuzhiyun 	struct tipc_msg *msg;
1798*4882a593Smuzhiyun 	u32 peer_port = tsk_peer_port(tsk);
1799*4882a593Smuzhiyun 	u32 dnode = tsk_peer_node(tsk);
1800*4882a593Smuzhiyun 
1801*4882a593Smuzhiyun 	if (!tipc_sk_connected(sk))
1802*4882a593Smuzhiyun 		return NULL;
1803*4882a593Smuzhiyun 	skb = tipc_msg_create(CONN_MANAGER, CONN_ACK, INT_H_SIZE, 0,
1804*4882a593Smuzhiyun 			      dnode, tsk_own_node(tsk), peer_port,
1805*4882a593Smuzhiyun 			      tsk->portid, TIPC_OK);
1806*4882a593Smuzhiyun 	if (!skb)
1807*4882a593Smuzhiyun 		return NULL;
1808*4882a593Smuzhiyun 	msg = buf_msg(skb);
1809*4882a593Smuzhiyun 	msg_set_conn_ack(msg, tsk->rcv_unacked);
1810*4882a593Smuzhiyun 	tsk->rcv_unacked = 0;
1811*4882a593Smuzhiyun 
1812*4882a593Smuzhiyun 	/* Adjust to and advertize the correct window limit */
1813*4882a593Smuzhiyun 	if (tsk->peer_caps & TIPC_BLOCK_FLOWCTL) {
1814*4882a593Smuzhiyun 		tsk->rcv_win = tsk_adv_blocks(tsk->sk.sk_rcvbuf);
1815*4882a593Smuzhiyun 		msg_set_adv_win(msg, tsk->rcv_win);
1816*4882a593Smuzhiyun 	}
1817*4882a593Smuzhiyun 	return skb;
1818*4882a593Smuzhiyun }
1819*4882a593Smuzhiyun 
tipc_sk_send_ack(struct tipc_sock * tsk)1820*4882a593Smuzhiyun static void tipc_sk_send_ack(struct tipc_sock *tsk)
1821*4882a593Smuzhiyun {
1822*4882a593Smuzhiyun 	struct sk_buff *skb;
1823*4882a593Smuzhiyun 
1824*4882a593Smuzhiyun 	skb = tipc_sk_build_ack(tsk);
1825*4882a593Smuzhiyun 	if (!skb)
1826*4882a593Smuzhiyun 		return;
1827*4882a593Smuzhiyun 
1828*4882a593Smuzhiyun 	tipc_node_xmit_skb(sock_net(&tsk->sk), skb, tsk_peer_node(tsk),
1829*4882a593Smuzhiyun 			   msg_link_selector(buf_msg(skb)));
1830*4882a593Smuzhiyun }
1831*4882a593Smuzhiyun 
tipc_wait_for_rcvmsg(struct socket * sock,long * timeop)1832*4882a593Smuzhiyun static int tipc_wait_for_rcvmsg(struct socket *sock, long *timeop)
1833*4882a593Smuzhiyun {
1834*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1835*4882a593Smuzhiyun 	DEFINE_WAIT_FUNC(wait, woken_wake_function);
1836*4882a593Smuzhiyun 	long timeo = *timeop;
1837*4882a593Smuzhiyun 	int err = sock_error(sk);
1838*4882a593Smuzhiyun 
1839*4882a593Smuzhiyun 	if (err)
1840*4882a593Smuzhiyun 		return err;
1841*4882a593Smuzhiyun 
1842*4882a593Smuzhiyun 	for (;;) {
1843*4882a593Smuzhiyun 		if (timeo && skb_queue_empty(&sk->sk_receive_queue)) {
1844*4882a593Smuzhiyun 			if (sk->sk_shutdown & RCV_SHUTDOWN) {
1845*4882a593Smuzhiyun 				err = -ENOTCONN;
1846*4882a593Smuzhiyun 				break;
1847*4882a593Smuzhiyun 			}
1848*4882a593Smuzhiyun 			add_wait_queue(sk_sleep(sk), &wait);
1849*4882a593Smuzhiyun 			release_sock(sk);
1850*4882a593Smuzhiyun 			timeo = wait_woken(&wait, TASK_INTERRUPTIBLE, timeo);
1851*4882a593Smuzhiyun 			sched_annotate_sleep();
1852*4882a593Smuzhiyun 			lock_sock(sk);
1853*4882a593Smuzhiyun 			remove_wait_queue(sk_sleep(sk), &wait);
1854*4882a593Smuzhiyun 		}
1855*4882a593Smuzhiyun 		err = 0;
1856*4882a593Smuzhiyun 		if (!skb_queue_empty(&sk->sk_receive_queue))
1857*4882a593Smuzhiyun 			break;
1858*4882a593Smuzhiyun 		err = -EAGAIN;
1859*4882a593Smuzhiyun 		if (!timeo)
1860*4882a593Smuzhiyun 			break;
1861*4882a593Smuzhiyun 		err = sock_intr_errno(timeo);
1862*4882a593Smuzhiyun 		if (signal_pending(current))
1863*4882a593Smuzhiyun 			break;
1864*4882a593Smuzhiyun 
1865*4882a593Smuzhiyun 		err = sock_error(sk);
1866*4882a593Smuzhiyun 		if (err)
1867*4882a593Smuzhiyun 			break;
1868*4882a593Smuzhiyun 	}
1869*4882a593Smuzhiyun 	*timeop = timeo;
1870*4882a593Smuzhiyun 	return err;
1871*4882a593Smuzhiyun }
1872*4882a593Smuzhiyun 
1873*4882a593Smuzhiyun /**
1874*4882a593Smuzhiyun  * tipc_recvmsg - receive packet-oriented message
1875*4882a593Smuzhiyun  * @m: descriptor for message info
1876*4882a593Smuzhiyun  * @buflen: length of user buffer area
1877*4882a593Smuzhiyun  * @flags: receive flags
1878*4882a593Smuzhiyun  *
1879*4882a593Smuzhiyun  * Used for SOCK_DGRAM, SOCK_RDM, and SOCK_SEQPACKET messages.
1880*4882a593Smuzhiyun  * If the complete message doesn't fit in user area, truncate it.
1881*4882a593Smuzhiyun  *
1882*4882a593Smuzhiyun  * Returns size of returned message data, errno otherwise
1883*4882a593Smuzhiyun  */
tipc_recvmsg(struct socket * sock,struct msghdr * m,size_t buflen,int flags)1884*4882a593Smuzhiyun static int tipc_recvmsg(struct socket *sock, struct msghdr *m,
1885*4882a593Smuzhiyun 			size_t buflen,	int flags)
1886*4882a593Smuzhiyun {
1887*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
1888*4882a593Smuzhiyun 	bool connected = !tipc_sk_type_connectionless(sk);
1889*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
1890*4882a593Smuzhiyun 	int rc, err, hlen, dlen, copy;
1891*4882a593Smuzhiyun 	struct tipc_skb_cb *skb_cb;
1892*4882a593Smuzhiyun 	struct sk_buff_head xmitq;
1893*4882a593Smuzhiyun 	struct tipc_msg *hdr;
1894*4882a593Smuzhiyun 	struct sk_buff *skb;
1895*4882a593Smuzhiyun 	bool grp_evt;
1896*4882a593Smuzhiyun 	long timeout;
1897*4882a593Smuzhiyun 
1898*4882a593Smuzhiyun 	/* Catch invalid receive requests */
1899*4882a593Smuzhiyun 	if (unlikely(!buflen))
1900*4882a593Smuzhiyun 		return -EINVAL;
1901*4882a593Smuzhiyun 
1902*4882a593Smuzhiyun 	lock_sock(sk);
1903*4882a593Smuzhiyun 	if (unlikely(connected && sk->sk_state == TIPC_OPEN)) {
1904*4882a593Smuzhiyun 		rc = -ENOTCONN;
1905*4882a593Smuzhiyun 		goto exit;
1906*4882a593Smuzhiyun 	}
1907*4882a593Smuzhiyun 	timeout = sock_rcvtimeo(sk, flags & MSG_DONTWAIT);
1908*4882a593Smuzhiyun 
1909*4882a593Smuzhiyun 	/* Step rcv queue to first msg with data or error; wait if necessary */
1910*4882a593Smuzhiyun 	do {
1911*4882a593Smuzhiyun 		rc = tipc_wait_for_rcvmsg(sock, &timeout);
1912*4882a593Smuzhiyun 		if (unlikely(rc))
1913*4882a593Smuzhiyun 			goto exit;
1914*4882a593Smuzhiyun 		skb = skb_peek(&sk->sk_receive_queue);
1915*4882a593Smuzhiyun 		skb_cb = TIPC_SKB_CB(skb);
1916*4882a593Smuzhiyun 		hdr = buf_msg(skb);
1917*4882a593Smuzhiyun 		dlen = msg_data_sz(hdr);
1918*4882a593Smuzhiyun 		hlen = msg_hdr_sz(hdr);
1919*4882a593Smuzhiyun 		err = msg_errcode(hdr);
1920*4882a593Smuzhiyun 		grp_evt = msg_is_grp_evt(hdr);
1921*4882a593Smuzhiyun 		if (likely(dlen || err))
1922*4882a593Smuzhiyun 			break;
1923*4882a593Smuzhiyun 		tsk_advance_rx_queue(sk);
1924*4882a593Smuzhiyun 	} while (1);
1925*4882a593Smuzhiyun 
1926*4882a593Smuzhiyun 	/* Collect msg meta data, including error code and rejected data */
1927*4882a593Smuzhiyun 	tipc_sk_set_orig_addr(m, skb);
1928*4882a593Smuzhiyun 	rc = tipc_sk_anc_data_recv(m, skb, tsk);
1929*4882a593Smuzhiyun 	if (unlikely(rc))
1930*4882a593Smuzhiyun 		goto exit;
1931*4882a593Smuzhiyun 	hdr = buf_msg(skb);
1932*4882a593Smuzhiyun 
1933*4882a593Smuzhiyun 	/* Capture data if non-error msg, otherwise just set return value */
1934*4882a593Smuzhiyun 	if (likely(!err)) {
1935*4882a593Smuzhiyun 		int offset = skb_cb->bytes_read;
1936*4882a593Smuzhiyun 
1937*4882a593Smuzhiyun 		copy = min_t(int, dlen - offset, buflen);
1938*4882a593Smuzhiyun 		rc = skb_copy_datagram_msg(skb, hlen + offset, m, copy);
1939*4882a593Smuzhiyun 		if (unlikely(rc))
1940*4882a593Smuzhiyun 			goto exit;
1941*4882a593Smuzhiyun 		if (unlikely(offset + copy < dlen)) {
1942*4882a593Smuzhiyun 			if (flags & MSG_EOR) {
1943*4882a593Smuzhiyun 				if (!(flags & MSG_PEEK))
1944*4882a593Smuzhiyun 					skb_cb->bytes_read = offset + copy;
1945*4882a593Smuzhiyun 			} else {
1946*4882a593Smuzhiyun 				m->msg_flags |= MSG_TRUNC;
1947*4882a593Smuzhiyun 				skb_cb->bytes_read = 0;
1948*4882a593Smuzhiyun 			}
1949*4882a593Smuzhiyun 		} else {
1950*4882a593Smuzhiyun 			if (flags & MSG_EOR)
1951*4882a593Smuzhiyun 				m->msg_flags |= MSG_EOR;
1952*4882a593Smuzhiyun 			skb_cb->bytes_read = 0;
1953*4882a593Smuzhiyun 		}
1954*4882a593Smuzhiyun 	} else {
1955*4882a593Smuzhiyun 		copy = 0;
1956*4882a593Smuzhiyun 		rc = 0;
1957*4882a593Smuzhiyun 		if (err != TIPC_CONN_SHUTDOWN && connected && !m->msg_control) {
1958*4882a593Smuzhiyun 			rc = -ECONNRESET;
1959*4882a593Smuzhiyun 			goto exit;
1960*4882a593Smuzhiyun 		}
1961*4882a593Smuzhiyun 	}
1962*4882a593Smuzhiyun 
1963*4882a593Smuzhiyun 	/* Mark message as group event if applicable */
1964*4882a593Smuzhiyun 	if (unlikely(grp_evt)) {
1965*4882a593Smuzhiyun 		if (msg_grp_evt(hdr) == TIPC_WITHDRAWN)
1966*4882a593Smuzhiyun 			m->msg_flags |= MSG_EOR;
1967*4882a593Smuzhiyun 		m->msg_flags |= MSG_OOB;
1968*4882a593Smuzhiyun 		copy = 0;
1969*4882a593Smuzhiyun 	}
1970*4882a593Smuzhiyun 
1971*4882a593Smuzhiyun 	/* Caption of data or error code/rejected data was successful */
1972*4882a593Smuzhiyun 	if (unlikely(flags & MSG_PEEK))
1973*4882a593Smuzhiyun 		goto exit;
1974*4882a593Smuzhiyun 
1975*4882a593Smuzhiyun 	/* Send group flow control advertisement when applicable */
1976*4882a593Smuzhiyun 	if (tsk->group && msg_in_group(hdr) && !grp_evt) {
1977*4882a593Smuzhiyun 		__skb_queue_head_init(&xmitq);
1978*4882a593Smuzhiyun 		tipc_group_update_rcv_win(tsk->group, tsk_blocks(hlen + dlen),
1979*4882a593Smuzhiyun 					  msg_orignode(hdr), msg_origport(hdr),
1980*4882a593Smuzhiyun 					  &xmitq);
1981*4882a593Smuzhiyun 		tipc_node_distr_xmit(sock_net(sk), &xmitq);
1982*4882a593Smuzhiyun 	}
1983*4882a593Smuzhiyun 
1984*4882a593Smuzhiyun 	if (skb_cb->bytes_read)
1985*4882a593Smuzhiyun 		goto exit;
1986*4882a593Smuzhiyun 
1987*4882a593Smuzhiyun 	tsk_advance_rx_queue(sk);
1988*4882a593Smuzhiyun 
1989*4882a593Smuzhiyun 	if (likely(!connected))
1990*4882a593Smuzhiyun 		goto exit;
1991*4882a593Smuzhiyun 
1992*4882a593Smuzhiyun 	/* Send connection flow control advertisement when applicable */
1993*4882a593Smuzhiyun 	tsk->rcv_unacked += tsk_inc(tsk, hlen + dlen);
1994*4882a593Smuzhiyun 	if (tsk->rcv_unacked >= tsk->rcv_win / TIPC_ACK_RATE)
1995*4882a593Smuzhiyun 		tipc_sk_send_ack(tsk);
1996*4882a593Smuzhiyun exit:
1997*4882a593Smuzhiyun 	release_sock(sk);
1998*4882a593Smuzhiyun 	return rc ? rc : copy;
1999*4882a593Smuzhiyun }
2000*4882a593Smuzhiyun 
2001*4882a593Smuzhiyun /**
2002*4882a593Smuzhiyun  * tipc_recvstream - receive stream-oriented data
2003*4882a593Smuzhiyun  * @m: descriptor for message info
2004*4882a593Smuzhiyun  * @buflen: total size of user buffer area
2005*4882a593Smuzhiyun  * @flags: receive flags
2006*4882a593Smuzhiyun  *
2007*4882a593Smuzhiyun  * Used for SOCK_STREAM messages only.  If not enough data is available
2008*4882a593Smuzhiyun  * will optionally wait for more; never truncates data.
2009*4882a593Smuzhiyun  *
2010*4882a593Smuzhiyun  * Returns size of returned message data, errno otherwise
2011*4882a593Smuzhiyun  */
tipc_recvstream(struct socket * sock,struct msghdr * m,size_t buflen,int flags)2012*4882a593Smuzhiyun static int tipc_recvstream(struct socket *sock, struct msghdr *m,
2013*4882a593Smuzhiyun 			   size_t buflen, int flags)
2014*4882a593Smuzhiyun {
2015*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2016*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2017*4882a593Smuzhiyun 	struct sk_buff *skb;
2018*4882a593Smuzhiyun 	struct tipc_msg *hdr;
2019*4882a593Smuzhiyun 	struct tipc_skb_cb *skb_cb;
2020*4882a593Smuzhiyun 	bool peek = flags & MSG_PEEK;
2021*4882a593Smuzhiyun 	int offset, required, copy, copied = 0;
2022*4882a593Smuzhiyun 	int hlen, dlen, err, rc;
2023*4882a593Smuzhiyun 	long timeout;
2024*4882a593Smuzhiyun 
2025*4882a593Smuzhiyun 	/* Catch invalid receive attempts */
2026*4882a593Smuzhiyun 	if (unlikely(!buflen))
2027*4882a593Smuzhiyun 		return -EINVAL;
2028*4882a593Smuzhiyun 
2029*4882a593Smuzhiyun 	lock_sock(sk);
2030*4882a593Smuzhiyun 
2031*4882a593Smuzhiyun 	if (unlikely(sk->sk_state == TIPC_OPEN)) {
2032*4882a593Smuzhiyun 		rc = -ENOTCONN;
2033*4882a593Smuzhiyun 		goto exit;
2034*4882a593Smuzhiyun 	}
2035*4882a593Smuzhiyun 	required = sock_rcvlowat(sk, flags & MSG_WAITALL, buflen);
2036*4882a593Smuzhiyun 	timeout = sock_rcvtimeo(sk, flags & MSG_DONTWAIT);
2037*4882a593Smuzhiyun 
2038*4882a593Smuzhiyun 	do {
2039*4882a593Smuzhiyun 		/* Look at first msg in receive queue; wait if necessary */
2040*4882a593Smuzhiyun 		rc = tipc_wait_for_rcvmsg(sock, &timeout);
2041*4882a593Smuzhiyun 		if (unlikely(rc))
2042*4882a593Smuzhiyun 			break;
2043*4882a593Smuzhiyun 		skb = skb_peek(&sk->sk_receive_queue);
2044*4882a593Smuzhiyun 		skb_cb = TIPC_SKB_CB(skb);
2045*4882a593Smuzhiyun 		hdr = buf_msg(skb);
2046*4882a593Smuzhiyun 		dlen = msg_data_sz(hdr);
2047*4882a593Smuzhiyun 		hlen = msg_hdr_sz(hdr);
2048*4882a593Smuzhiyun 		err = msg_errcode(hdr);
2049*4882a593Smuzhiyun 
2050*4882a593Smuzhiyun 		/* Discard any empty non-errored (SYN-) message */
2051*4882a593Smuzhiyun 		if (unlikely(!dlen && !err)) {
2052*4882a593Smuzhiyun 			tsk_advance_rx_queue(sk);
2053*4882a593Smuzhiyun 			continue;
2054*4882a593Smuzhiyun 		}
2055*4882a593Smuzhiyun 
2056*4882a593Smuzhiyun 		/* Collect msg meta data, incl. error code and rejected data */
2057*4882a593Smuzhiyun 		if (!copied) {
2058*4882a593Smuzhiyun 			tipc_sk_set_orig_addr(m, skb);
2059*4882a593Smuzhiyun 			rc = tipc_sk_anc_data_recv(m, skb, tsk);
2060*4882a593Smuzhiyun 			if (rc)
2061*4882a593Smuzhiyun 				break;
2062*4882a593Smuzhiyun 			hdr = buf_msg(skb);
2063*4882a593Smuzhiyun 		}
2064*4882a593Smuzhiyun 
2065*4882a593Smuzhiyun 		/* Copy data if msg ok, otherwise return error/partial data */
2066*4882a593Smuzhiyun 		if (likely(!err)) {
2067*4882a593Smuzhiyun 			offset = skb_cb->bytes_read;
2068*4882a593Smuzhiyun 			copy = min_t(int, dlen - offset, buflen - copied);
2069*4882a593Smuzhiyun 			rc = skb_copy_datagram_msg(skb, hlen + offset, m, copy);
2070*4882a593Smuzhiyun 			if (unlikely(rc))
2071*4882a593Smuzhiyun 				break;
2072*4882a593Smuzhiyun 			copied += copy;
2073*4882a593Smuzhiyun 			offset += copy;
2074*4882a593Smuzhiyun 			if (unlikely(offset < dlen)) {
2075*4882a593Smuzhiyun 				if (!peek)
2076*4882a593Smuzhiyun 					skb_cb->bytes_read = offset;
2077*4882a593Smuzhiyun 				break;
2078*4882a593Smuzhiyun 			}
2079*4882a593Smuzhiyun 		} else {
2080*4882a593Smuzhiyun 			rc = 0;
2081*4882a593Smuzhiyun 			if ((err != TIPC_CONN_SHUTDOWN) && !m->msg_control)
2082*4882a593Smuzhiyun 				rc = -ECONNRESET;
2083*4882a593Smuzhiyun 			if (copied || rc)
2084*4882a593Smuzhiyun 				break;
2085*4882a593Smuzhiyun 		}
2086*4882a593Smuzhiyun 
2087*4882a593Smuzhiyun 		if (unlikely(peek))
2088*4882a593Smuzhiyun 			break;
2089*4882a593Smuzhiyun 
2090*4882a593Smuzhiyun 		tsk_advance_rx_queue(sk);
2091*4882a593Smuzhiyun 
2092*4882a593Smuzhiyun 		/* Send connection flow control advertisement when applicable */
2093*4882a593Smuzhiyun 		tsk->rcv_unacked += tsk_inc(tsk, hlen + dlen);
2094*4882a593Smuzhiyun 		if (tsk->rcv_unacked >= tsk->rcv_win / TIPC_ACK_RATE)
2095*4882a593Smuzhiyun 			tipc_sk_send_ack(tsk);
2096*4882a593Smuzhiyun 
2097*4882a593Smuzhiyun 		/* Exit if all requested data or FIN/error received */
2098*4882a593Smuzhiyun 		if (copied == buflen || err)
2099*4882a593Smuzhiyun 			break;
2100*4882a593Smuzhiyun 
2101*4882a593Smuzhiyun 	} while (!skb_queue_empty(&sk->sk_receive_queue) || copied < required);
2102*4882a593Smuzhiyun exit:
2103*4882a593Smuzhiyun 	release_sock(sk);
2104*4882a593Smuzhiyun 	return copied ? copied : rc;
2105*4882a593Smuzhiyun }
2106*4882a593Smuzhiyun 
2107*4882a593Smuzhiyun /**
2108*4882a593Smuzhiyun  * tipc_write_space - wake up thread if port congestion is released
2109*4882a593Smuzhiyun  * @sk: socket
2110*4882a593Smuzhiyun  */
tipc_write_space(struct sock * sk)2111*4882a593Smuzhiyun static void tipc_write_space(struct sock *sk)
2112*4882a593Smuzhiyun {
2113*4882a593Smuzhiyun 	struct socket_wq *wq;
2114*4882a593Smuzhiyun 
2115*4882a593Smuzhiyun 	rcu_read_lock();
2116*4882a593Smuzhiyun 	wq = rcu_dereference(sk->sk_wq);
2117*4882a593Smuzhiyun 	if (skwq_has_sleeper(wq))
2118*4882a593Smuzhiyun 		wake_up_interruptible_sync_poll(&wq->wait, EPOLLOUT |
2119*4882a593Smuzhiyun 						EPOLLWRNORM | EPOLLWRBAND);
2120*4882a593Smuzhiyun 	rcu_read_unlock();
2121*4882a593Smuzhiyun }
2122*4882a593Smuzhiyun 
2123*4882a593Smuzhiyun /**
2124*4882a593Smuzhiyun  * tipc_data_ready - wake up threads to indicate messages have been received
2125*4882a593Smuzhiyun  * @sk: socket
2126*4882a593Smuzhiyun  */
tipc_data_ready(struct sock * sk)2127*4882a593Smuzhiyun static void tipc_data_ready(struct sock *sk)
2128*4882a593Smuzhiyun {
2129*4882a593Smuzhiyun 	struct socket_wq *wq;
2130*4882a593Smuzhiyun 
2131*4882a593Smuzhiyun 	rcu_read_lock();
2132*4882a593Smuzhiyun 	wq = rcu_dereference(sk->sk_wq);
2133*4882a593Smuzhiyun 	if (skwq_has_sleeper(wq))
2134*4882a593Smuzhiyun 		wake_up_interruptible_sync_poll(&wq->wait, EPOLLIN |
2135*4882a593Smuzhiyun 						EPOLLRDNORM | EPOLLRDBAND);
2136*4882a593Smuzhiyun 	rcu_read_unlock();
2137*4882a593Smuzhiyun }
2138*4882a593Smuzhiyun 
tipc_sock_destruct(struct sock * sk)2139*4882a593Smuzhiyun static void tipc_sock_destruct(struct sock *sk)
2140*4882a593Smuzhiyun {
2141*4882a593Smuzhiyun 	__skb_queue_purge(&sk->sk_receive_queue);
2142*4882a593Smuzhiyun }
2143*4882a593Smuzhiyun 
tipc_sk_proto_rcv(struct sock * sk,struct sk_buff_head * inputq,struct sk_buff_head * xmitq)2144*4882a593Smuzhiyun static void tipc_sk_proto_rcv(struct sock *sk,
2145*4882a593Smuzhiyun 			      struct sk_buff_head *inputq,
2146*4882a593Smuzhiyun 			      struct sk_buff_head *xmitq)
2147*4882a593Smuzhiyun {
2148*4882a593Smuzhiyun 	struct sk_buff *skb = __skb_dequeue(inputq);
2149*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2150*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
2151*4882a593Smuzhiyun 	struct tipc_group *grp = tsk->group;
2152*4882a593Smuzhiyun 	bool wakeup = false;
2153*4882a593Smuzhiyun 
2154*4882a593Smuzhiyun 	switch (msg_user(hdr)) {
2155*4882a593Smuzhiyun 	case CONN_MANAGER:
2156*4882a593Smuzhiyun 		tipc_sk_conn_proto_rcv(tsk, skb, inputq, xmitq);
2157*4882a593Smuzhiyun 		return;
2158*4882a593Smuzhiyun 	case SOCK_WAKEUP:
2159*4882a593Smuzhiyun 		tipc_dest_del(&tsk->cong_links, msg_orignode(hdr), 0);
2160*4882a593Smuzhiyun 		/* coupled with smp_rmb() in tipc_wait_for_cond() */
2161*4882a593Smuzhiyun 		smp_wmb();
2162*4882a593Smuzhiyun 		tsk->cong_link_cnt--;
2163*4882a593Smuzhiyun 		wakeup = true;
2164*4882a593Smuzhiyun 		tipc_sk_push_backlog(tsk, false);
2165*4882a593Smuzhiyun 		break;
2166*4882a593Smuzhiyun 	case GROUP_PROTOCOL:
2167*4882a593Smuzhiyun 		tipc_group_proto_rcv(grp, &wakeup, hdr, inputq, xmitq);
2168*4882a593Smuzhiyun 		break;
2169*4882a593Smuzhiyun 	case TOP_SRV:
2170*4882a593Smuzhiyun 		tipc_group_member_evt(tsk->group, &wakeup, &sk->sk_rcvbuf,
2171*4882a593Smuzhiyun 				      hdr, inputq, xmitq);
2172*4882a593Smuzhiyun 		break;
2173*4882a593Smuzhiyun 	default:
2174*4882a593Smuzhiyun 		break;
2175*4882a593Smuzhiyun 	}
2176*4882a593Smuzhiyun 
2177*4882a593Smuzhiyun 	if (wakeup)
2178*4882a593Smuzhiyun 		sk->sk_write_space(sk);
2179*4882a593Smuzhiyun 
2180*4882a593Smuzhiyun 	kfree_skb(skb);
2181*4882a593Smuzhiyun }
2182*4882a593Smuzhiyun 
2183*4882a593Smuzhiyun /**
2184*4882a593Smuzhiyun  * tipc_sk_filter_connect - check incoming message for a connection-based socket
2185*4882a593Smuzhiyun  * @tsk: TIPC socket
2186*4882a593Smuzhiyun  * @skb: pointer to message buffer.
2187*4882a593Smuzhiyun  * @xmitq: for Nagle ACK if any
2188*4882a593Smuzhiyun  * Returns true if message should be added to receive queue, false otherwise
2189*4882a593Smuzhiyun  */
tipc_sk_filter_connect(struct tipc_sock * tsk,struct sk_buff * skb,struct sk_buff_head * xmitq)2190*4882a593Smuzhiyun static bool tipc_sk_filter_connect(struct tipc_sock *tsk, struct sk_buff *skb,
2191*4882a593Smuzhiyun 				   struct sk_buff_head *xmitq)
2192*4882a593Smuzhiyun {
2193*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
2194*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
2195*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
2196*4882a593Smuzhiyun 	bool con_msg = msg_connected(hdr);
2197*4882a593Smuzhiyun 	u32 pport = tsk_peer_port(tsk);
2198*4882a593Smuzhiyun 	u32 pnode = tsk_peer_node(tsk);
2199*4882a593Smuzhiyun 	u32 oport = msg_origport(hdr);
2200*4882a593Smuzhiyun 	u32 onode = msg_orignode(hdr);
2201*4882a593Smuzhiyun 	int err = msg_errcode(hdr);
2202*4882a593Smuzhiyun 	unsigned long delay;
2203*4882a593Smuzhiyun 
2204*4882a593Smuzhiyun 	if (unlikely(msg_mcast(hdr)))
2205*4882a593Smuzhiyun 		return false;
2206*4882a593Smuzhiyun 	tsk->oneway = 0;
2207*4882a593Smuzhiyun 
2208*4882a593Smuzhiyun 	switch (sk->sk_state) {
2209*4882a593Smuzhiyun 	case TIPC_CONNECTING:
2210*4882a593Smuzhiyun 		/* Setup ACK */
2211*4882a593Smuzhiyun 		if (likely(con_msg)) {
2212*4882a593Smuzhiyun 			if (err)
2213*4882a593Smuzhiyun 				break;
2214*4882a593Smuzhiyun 			tipc_sk_finish_conn(tsk, oport, onode);
2215*4882a593Smuzhiyun 			msg_set_importance(&tsk->phdr, msg_importance(hdr));
2216*4882a593Smuzhiyun 			/* ACK+ message with data is added to receive queue */
2217*4882a593Smuzhiyun 			if (msg_data_sz(hdr))
2218*4882a593Smuzhiyun 				return true;
2219*4882a593Smuzhiyun 			/* Empty ACK-, - wake up sleeping connect() and drop */
2220*4882a593Smuzhiyun 			sk->sk_state_change(sk);
2221*4882a593Smuzhiyun 			msg_set_dest_droppable(hdr, 1);
2222*4882a593Smuzhiyun 			return false;
2223*4882a593Smuzhiyun 		}
2224*4882a593Smuzhiyun 		/* Ignore connectionless message if not from listening socket */
2225*4882a593Smuzhiyun 		if (oport != pport || onode != pnode)
2226*4882a593Smuzhiyun 			return false;
2227*4882a593Smuzhiyun 
2228*4882a593Smuzhiyun 		/* Rejected SYN */
2229*4882a593Smuzhiyun 		if (err != TIPC_ERR_OVERLOAD)
2230*4882a593Smuzhiyun 			break;
2231*4882a593Smuzhiyun 
2232*4882a593Smuzhiyun 		/* Prepare for new setup attempt if we have a SYN clone */
2233*4882a593Smuzhiyun 		if (skb_queue_empty(&sk->sk_write_queue))
2234*4882a593Smuzhiyun 			break;
2235*4882a593Smuzhiyun 		get_random_bytes(&delay, 2);
2236*4882a593Smuzhiyun 		delay %= (tsk->conn_timeout / 4);
2237*4882a593Smuzhiyun 		delay = msecs_to_jiffies(delay + 100);
2238*4882a593Smuzhiyun 		sk_reset_timer(sk, &sk->sk_timer, jiffies + delay);
2239*4882a593Smuzhiyun 		return false;
2240*4882a593Smuzhiyun 	case TIPC_OPEN:
2241*4882a593Smuzhiyun 	case TIPC_DISCONNECTING:
2242*4882a593Smuzhiyun 		return false;
2243*4882a593Smuzhiyun 	case TIPC_LISTEN:
2244*4882a593Smuzhiyun 		/* Accept only SYN message */
2245*4882a593Smuzhiyun 		if (!msg_is_syn(hdr) &&
2246*4882a593Smuzhiyun 		    tipc_node_get_capabilities(net, onode) & TIPC_SYN_BIT)
2247*4882a593Smuzhiyun 			return false;
2248*4882a593Smuzhiyun 		if (!con_msg && !err)
2249*4882a593Smuzhiyun 			return true;
2250*4882a593Smuzhiyun 		return false;
2251*4882a593Smuzhiyun 	case TIPC_ESTABLISHED:
2252*4882a593Smuzhiyun 		if (!skb_queue_empty(&sk->sk_write_queue))
2253*4882a593Smuzhiyun 			tipc_sk_push_backlog(tsk, false);
2254*4882a593Smuzhiyun 		/* Accept only connection-based messages sent by peer */
2255*4882a593Smuzhiyun 		if (likely(con_msg && !err && pport == oport &&
2256*4882a593Smuzhiyun 			   pnode == onode)) {
2257*4882a593Smuzhiyun 			if (msg_ack_required(hdr)) {
2258*4882a593Smuzhiyun 				struct sk_buff *skb;
2259*4882a593Smuzhiyun 
2260*4882a593Smuzhiyun 				skb = tipc_sk_build_ack(tsk);
2261*4882a593Smuzhiyun 				if (skb) {
2262*4882a593Smuzhiyun 					msg_set_nagle_ack(buf_msg(skb));
2263*4882a593Smuzhiyun 					__skb_queue_tail(xmitq, skb);
2264*4882a593Smuzhiyun 				}
2265*4882a593Smuzhiyun 			}
2266*4882a593Smuzhiyun 			return true;
2267*4882a593Smuzhiyun 		}
2268*4882a593Smuzhiyun 		if (!tsk_peer_msg(tsk, hdr))
2269*4882a593Smuzhiyun 			return false;
2270*4882a593Smuzhiyun 		if (!err)
2271*4882a593Smuzhiyun 			return true;
2272*4882a593Smuzhiyun 		tipc_set_sk_state(sk, TIPC_DISCONNECTING);
2273*4882a593Smuzhiyun 		tipc_node_remove_conn(net, pnode, tsk->portid);
2274*4882a593Smuzhiyun 		sk->sk_state_change(sk);
2275*4882a593Smuzhiyun 		return true;
2276*4882a593Smuzhiyun 	default:
2277*4882a593Smuzhiyun 		pr_err("Unknown sk_state %u\n", sk->sk_state);
2278*4882a593Smuzhiyun 	}
2279*4882a593Smuzhiyun 	/* Abort connection setup attempt */
2280*4882a593Smuzhiyun 	tipc_set_sk_state(sk, TIPC_DISCONNECTING);
2281*4882a593Smuzhiyun 	sk->sk_err = ECONNREFUSED;
2282*4882a593Smuzhiyun 	sk->sk_state_change(sk);
2283*4882a593Smuzhiyun 	return true;
2284*4882a593Smuzhiyun }
2285*4882a593Smuzhiyun 
2286*4882a593Smuzhiyun /**
2287*4882a593Smuzhiyun  * rcvbuf_limit - get proper overload limit of socket receive queue
2288*4882a593Smuzhiyun  * @sk: socket
2289*4882a593Smuzhiyun  * @skb: message
2290*4882a593Smuzhiyun  *
2291*4882a593Smuzhiyun  * For connection oriented messages, irrespective of importance,
2292*4882a593Smuzhiyun  * default queue limit is 2 MB.
2293*4882a593Smuzhiyun  *
2294*4882a593Smuzhiyun  * For connectionless messages, queue limits are based on message
2295*4882a593Smuzhiyun  * importance as follows:
2296*4882a593Smuzhiyun  *
2297*4882a593Smuzhiyun  * TIPC_LOW_IMPORTANCE       (2 MB)
2298*4882a593Smuzhiyun  * TIPC_MEDIUM_IMPORTANCE    (4 MB)
2299*4882a593Smuzhiyun  * TIPC_HIGH_IMPORTANCE      (8 MB)
2300*4882a593Smuzhiyun  * TIPC_CRITICAL_IMPORTANCE  (16 MB)
2301*4882a593Smuzhiyun  *
2302*4882a593Smuzhiyun  * Returns overload limit according to corresponding message importance
2303*4882a593Smuzhiyun  */
rcvbuf_limit(struct sock * sk,struct sk_buff * skb)2304*4882a593Smuzhiyun static unsigned int rcvbuf_limit(struct sock *sk, struct sk_buff *skb)
2305*4882a593Smuzhiyun {
2306*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2307*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
2308*4882a593Smuzhiyun 
2309*4882a593Smuzhiyun 	if (unlikely(msg_in_group(hdr)))
2310*4882a593Smuzhiyun 		return READ_ONCE(sk->sk_rcvbuf);
2311*4882a593Smuzhiyun 
2312*4882a593Smuzhiyun 	if (unlikely(!msg_connected(hdr)))
2313*4882a593Smuzhiyun 		return READ_ONCE(sk->sk_rcvbuf) << msg_importance(hdr);
2314*4882a593Smuzhiyun 
2315*4882a593Smuzhiyun 	if (likely(tsk->peer_caps & TIPC_BLOCK_FLOWCTL))
2316*4882a593Smuzhiyun 		return READ_ONCE(sk->sk_rcvbuf);
2317*4882a593Smuzhiyun 
2318*4882a593Smuzhiyun 	return FLOWCTL_MSG_LIM;
2319*4882a593Smuzhiyun }
2320*4882a593Smuzhiyun 
2321*4882a593Smuzhiyun /**
2322*4882a593Smuzhiyun  * tipc_sk_filter_rcv - validate incoming message
2323*4882a593Smuzhiyun  * @sk: socket
2324*4882a593Smuzhiyun  * @skb: pointer to message.
2325*4882a593Smuzhiyun  *
2326*4882a593Smuzhiyun  * Enqueues message on receive queue if acceptable; optionally handles
2327*4882a593Smuzhiyun  * disconnect indication for a connected socket.
2328*4882a593Smuzhiyun  *
2329*4882a593Smuzhiyun  * Called with socket lock already taken
2330*4882a593Smuzhiyun  *
2331*4882a593Smuzhiyun  */
tipc_sk_filter_rcv(struct sock * sk,struct sk_buff * skb,struct sk_buff_head * xmitq)2332*4882a593Smuzhiyun static void tipc_sk_filter_rcv(struct sock *sk, struct sk_buff *skb,
2333*4882a593Smuzhiyun 			       struct sk_buff_head *xmitq)
2334*4882a593Smuzhiyun {
2335*4882a593Smuzhiyun 	bool sk_conn = !tipc_sk_type_connectionless(sk);
2336*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2337*4882a593Smuzhiyun 	struct tipc_group *grp = tsk->group;
2338*4882a593Smuzhiyun 	struct tipc_msg *hdr = buf_msg(skb);
2339*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
2340*4882a593Smuzhiyun 	struct sk_buff_head inputq;
2341*4882a593Smuzhiyun 	int mtyp = msg_type(hdr);
2342*4882a593Smuzhiyun 	int limit, err = TIPC_OK;
2343*4882a593Smuzhiyun 
2344*4882a593Smuzhiyun 	trace_tipc_sk_filter_rcv(sk, skb, TIPC_DUMP_ALL, " ");
2345*4882a593Smuzhiyun 	TIPC_SKB_CB(skb)->bytes_read = 0;
2346*4882a593Smuzhiyun 	__skb_queue_head_init(&inputq);
2347*4882a593Smuzhiyun 	__skb_queue_tail(&inputq, skb);
2348*4882a593Smuzhiyun 
2349*4882a593Smuzhiyun 	if (unlikely(!msg_isdata(hdr)))
2350*4882a593Smuzhiyun 		tipc_sk_proto_rcv(sk, &inputq, xmitq);
2351*4882a593Smuzhiyun 
2352*4882a593Smuzhiyun 	if (unlikely(grp))
2353*4882a593Smuzhiyun 		tipc_group_filter_msg(grp, &inputq, xmitq);
2354*4882a593Smuzhiyun 
2355*4882a593Smuzhiyun 	if (unlikely(!grp) && mtyp == TIPC_MCAST_MSG)
2356*4882a593Smuzhiyun 		tipc_mcast_filter_msg(net, &tsk->mc_method.deferredq, &inputq);
2357*4882a593Smuzhiyun 
2358*4882a593Smuzhiyun 	/* Validate and add to receive buffer if there is space */
2359*4882a593Smuzhiyun 	while ((skb = __skb_dequeue(&inputq))) {
2360*4882a593Smuzhiyun 		hdr = buf_msg(skb);
2361*4882a593Smuzhiyun 		limit = rcvbuf_limit(sk, skb);
2362*4882a593Smuzhiyun 		if ((sk_conn && !tipc_sk_filter_connect(tsk, skb, xmitq)) ||
2363*4882a593Smuzhiyun 		    (!sk_conn && msg_connected(hdr)) ||
2364*4882a593Smuzhiyun 		    (!grp && msg_in_group(hdr)))
2365*4882a593Smuzhiyun 			err = TIPC_ERR_NO_PORT;
2366*4882a593Smuzhiyun 		else if (sk_rmem_alloc_get(sk) + skb->truesize >= limit) {
2367*4882a593Smuzhiyun 			trace_tipc_sk_dump(sk, skb, TIPC_DUMP_ALL,
2368*4882a593Smuzhiyun 					   "err_overload2!");
2369*4882a593Smuzhiyun 			atomic_inc(&sk->sk_drops);
2370*4882a593Smuzhiyun 			err = TIPC_ERR_OVERLOAD;
2371*4882a593Smuzhiyun 		}
2372*4882a593Smuzhiyun 
2373*4882a593Smuzhiyun 		if (unlikely(err)) {
2374*4882a593Smuzhiyun 			if (tipc_msg_reverse(tipc_own_addr(net), &skb, err)) {
2375*4882a593Smuzhiyun 				trace_tipc_sk_rej_msg(sk, skb, TIPC_DUMP_NONE,
2376*4882a593Smuzhiyun 						      "@filter_rcv!");
2377*4882a593Smuzhiyun 				__skb_queue_tail(xmitq, skb);
2378*4882a593Smuzhiyun 			}
2379*4882a593Smuzhiyun 			err = TIPC_OK;
2380*4882a593Smuzhiyun 			continue;
2381*4882a593Smuzhiyun 		}
2382*4882a593Smuzhiyun 		__skb_queue_tail(&sk->sk_receive_queue, skb);
2383*4882a593Smuzhiyun 		skb_set_owner_r(skb, sk);
2384*4882a593Smuzhiyun 		trace_tipc_sk_overlimit2(sk, skb, TIPC_DUMP_ALL,
2385*4882a593Smuzhiyun 					 "rcvq >90% allocated!");
2386*4882a593Smuzhiyun 		sk->sk_data_ready(sk);
2387*4882a593Smuzhiyun 	}
2388*4882a593Smuzhiyun }
2389*4882a593Smuzhiyun 
2390*4882a593Smuzhiyun /**
2391*4882a593Smuzhiyun  * tipc_sk_backlog_rcv - handle incoming message from backlog queue
2392*4882a593Smuzhiyun  * @sk: socket
2393*4882a593Smuzhiyun  * @skb: message
2394*4882a593Smuzhiyun  *
2395*4882a593Smuzhiyun  * Caller must hold socket lock
2396*4882a593Smuzhiyun  */
tipc_sk_backlog_rcv(struct sock * sk,struct sk_buff * skb)2397*4882a593Smuzhiyun static int tipc_sk_backlog_rcv(struct sock *sk, struct sk_buff *skb)
2398*4882a593Smuzhiyun {
2399*4882a593Smuzhiyun 	unsigned int before = sk_rmem_alloc_get(sk);
2400*4882a593Smuzhiyun 	struct sk_buff_head xmitq;
2401*4882a593Smuzhiyun 	unsigned int added;
2402*4882a593Smuzhiyun 
2403*4882a593Smuzhiyun 	__skb_queue_head_init(&xmitq);
2404*4882a593Smuzhiyun 
2405*4882a593Smuzhiyun 	tipc_sk_filter_rcv(sk, skb, &xmitq);
2406*4882a593Smuzhiyun 	added = sk_rmem_alloc_get(sk) - before;
2407*4882a593Smuzhiyun 	atomic_add(added, &tipc_sk(sk)->dupl_rcvcnt);
2408*4882a593Smuzhiyun 
2409*4882a593Smuzhiyun 	/* Send pending response/rejected messages, if any */
2410*4882a593Smuzhiyun 	tipc_node_distr_xmit(sock_net(sk), &xmitq);
2411*4882a593Smuzhiyun 	return 0;
2412*4882a593Smuzhiyun }
2413*4882a593Smuzhiyun 
2414*4882a593Smuzhiyun /**
2415*4882a593Smuzhiyun  * tipc_sk_enqueue - extract all buffers with destination 'dport' from
2416*4882a593Smuzhiyun  *                   inputq and try adding them to socket or backlog queue
2417*4882a593Smuzhiyun  * @inputq: list of incoming buffers with potentially different destinations
2418*4882a593Smuzhiyun  * @sk: socket where the buffers should be enqueued
2419*4882a593Smuzhiyun  * @dport: port number for the socket
2420*4882a593Smuzhiyun  *
2421*4882a593Smuzhiyun  * Caller must hold socket lock
2422*4882a593Smuzhiyun  */
tipc_sk_enqueue(struct sk_buff_head * inputq,struct sock * sk,u32 dport,struct sk_buff_head * xmitq)2423*4882a593Smuzhiyun static void tipc_sk_enqueue(struct sk_buff_head *inputq, struct sock *sk,
2424*4882a593Smuzhiyun 			    u32 dport, struct sk_buff_head *xmitq)
2425*4882a593Smuzhiyun {
2426*4882a593Smuzhiyun 	unsigned long time_limit = jiffies + usecs_to_jiffies(20000);
2427*4882a593Smuzhiyun 	struct sk_buff *skb;
2428*4882a593Smuzhiyun 	unsigned int lim;
2429*4882a593Smuzhiyun 	atomic_t *dcnt;
2430*4882a593Smuzhiyun 	u32 onode;
2431*4882a593Smuzhiyun 
2432*4882a593Smuzhiyun 	while (skb_queue_len(inputq)) {
2433*4882a593Smuzhiyun 		if (unlikely(time_after_eq(jiffies, time_limit)))
2434*4882a593Smuzhiyun 			return;
2435*4882a593Smuzhiyun 
2436*4882a593Smuzhiyun 		skb = tipc_skb_dequeue(inputq, dport);
2437*4882a593Smuzhiyun 		if (unlikely(!skb))
2438*4882a593Smuzhiyun 			return;
2439*4882a593Smuzhiyun 
2440*4882a593Smuzhiyun 		/* Add message directly to receive queue if possible */
2441*4882a593Smuzhiyun 		if (!sock_owned_by_user(sk)) {
2442*4882a593Smuzhiyun 			tipc_sk_filter_rcv(sk, skb, xmitq);
2443*4882a593Smuzhiyun 			continue;
2444*4882a593Smuzhiyun 		}
2445*4882a593Smuzhiyun 
2446*4882a593Smuzhiyun 		/* Try backlog, compensating for double-counted bytes */
2447*4882a593Smuzhiyun 		dcnt = &tipc_sk(sk)->dupl_rcvcnt;
2448*4882a593Smuzhiyun 		if (!sk->sk_backlog.len)
2449*4882a593Smuzhiyun 			atomic_set(dcnt, 0);
2450*4882a593Smuzhiyun 		lim = rcvbuf_limit(sk, skb) + atomic_read(dcnt);
2451*4882a593Smuzhiyun 		if (likely(!sk_add_backlog(sk, skb, lim))) {
2452*4882a593Smuzhiyun 			trace_tipc_sk_overlimit1(sk, skb, TIPC_DUMP_ALL,
2453*4882a593Smuzhiyun 						 "bklg & rcvq >90% allocated!");
2454*4882a593Smuzhiyun 			continue;
2455*4882a593Smuzhiyun 		}
2456*4882a593Smuzhiyun 
2457*4882a593Smuzhiyun 		trace_tipc_sk_dump(sk, skb, TIPC_DUMP_ALL, "err_overload!");
2458*4882a593Smuzhiyun 		/* Overload => reject message back to sender */
2459*4882a593Smuzhiyun 		onode = tipc_own_addr(sock_net(sk));
2460*4882a593Smuzhiyun 		atomic_inc(&sk->sk_drops);
2461*4882a593Smuzhiyun 		if (tipc_msg_reverse(onode, &skb, TIPC_ERR_OVERLOAD)) {
2462*4882a593Smuzhiyun 			trace_tipc_sk_rej_msg(sk, skb, TIPC_DUMP_ALL,
2463*4882a593Smuzhiyun 					      "@sk_enqueue!");
2464*4882a593Smuzhiyun 			__skb_queue_tail(xmitq, skb);
2465*4882a593Smuzhiyun 		}
2466*4882a593Smuzhiyun 		break;
2467*4882a593Smuzhiyun 	}
2468*4882a593Smuzhiyun }
2469*4882a593Smuzhiyun 
2470*4882a593Smuzhiyun /**
2471*4882a593Smuzhiyun  * tipc_sk_rcv - handle a chain of incoming buffers
2472*4882a593Smuzhiyun  * @inputq: buffer list containing the buffers
2473*4882a593Smuzhiyun  * Consumes all buffers in list until inputq is empty
2474*4882a593Smuzhiyun  * Note: may be called in multiple threads referring to the same queue
2475*4882a593Smuzhiyun  */
tipc_sk_rcv(struct net * net,struct sk_buff_head * inputq)2476*4882a593Smuzhiyun void tipc_sk_rcv(struct net *net, struct sk_buff_head *inputq)
2477*4882a593Smuzhiyun {
2478*4882a593Smuzhiyun 	struct sk_buff_head xmitq;
2479*4882a593Smuzhiyun 	u32 dnode, dport = 0;
2480*4882a593Smuzhiyun 	int err;
2481*4882a593Smuzhiyun 	struct tipc_sock *tsk;
2482*4882a593Smuzhiyun 	struct sock *sk;
2483*4882a593Smuzhiyun 	struct sk_buff *skb;
2484*4882a593Smuzhiyun 
2485*4882a593Smuzhiyun 	__skb_queue_head_init(&xmitq);
2486*4882a593Smuzhiyun 	while (skb_queue_len(inputq)) {
2487*4882a593Smuzhiyun 		dport = tipc_skb_peek_port(inputq, dport);
2488*4882a593Smuzhiyun 		tsk = tipc_sk_lookup(net, dport);
2489*4882a593Smuzhiyun 
2490*4882a593Smuzhiyun 		if (likely(tsk)) {
2491*4882a593Smuzhiyun 			sk = &tsk->sk;
2492*4882a593Smuzhiyun 			if (likely(spin_trylock_bh(&sk->sk_lock.slock))) {
2493*4882a593Smuzhiyun 				tipc_sk_enqueue(inputq, sk, dport, &xmitq);
2494*4882a593Smuzhiyun 				spin_unlock_bh(&sk->sk_lock.slock);
2495*4882a593Smuzhiyun 			}
2496*4882a593Smuzhiyun 			/* Send pending response/rejected messages, if any */
2497*4882a593Smuzhiyun 			tipc_node_distr_xmit(sock_net(sk), &xmitq);
2498*4882a593Smuzhiyun 			sock_put(sk);
2499*4882a593Smuzhiyun 			continue;
2500*4882a593Smuzhiyun 		}
2501*4882a593Smuzhiyun 		/* No destination socket => dequeue skb if still there */
2502*4882a593Smuzhiyun 		skb = tipc_skb_dequeue(inputq, dport);
2503*4882a593Smuzhiyun 		if (!skb)
2504*4882a593Smuzhiyun 			return;
2505*4882a593Smuzhiyun 
2506*4882a593Smuzhiyun 		/* Try secondary lookup if unresolved named message */
2507*4882a593Smuzhiyun 		err = TIPC_ERR_NO_PORT;
2508*4882a593Smuzhiyun 		if (tipc_msg_lookup_dest(net, skb, &err))
2509*4882a593Smuzhiyun 			goto xmit;
2510*4882a593Smuzhiyun 
2511*4882a593Smuzhiyun 		/* Prepare for message rejection */
2512*4882a593Smuzhiyun 		if (!tipc_msg_reverse(tipc_own_addr(net), &skb, err))
2513*4882a593Smuzhiyun 			continue;
2514*4882a593Smuzhiyun 
2515*4882a593Smuzhiyun 		trace_tipc_sk_rej_msg(NULL, skb, TIPC_DUMP_NONE, "@sk_rcv!");
2516*4882a593Smuzhiyun xmit:
2517*4882a593Smuzhiyun 		dnode = msg_destnode(buf_msg(skb));
2518*4882a593Smuzhiyun 		tipc_node_xmit_skb(net, skb, dnode, dport);
2519*4882a593Smuzhiyun 	}
2520*4882a593Smuzhiyun }
2521*4882a593Smuzhiyun 
tipc_wait_for_connect(struct socket * sock,long * timeo_p)2522*4882a593Smuzhiyun static int tipc_wait_for_connect(struct socket *sock, long *timeo_p)
2523*4882a593Smuzhiyun {
2524*4882a593Smuzhiyun 	DEFINE_WAIT_FUNC(wait, woken_wake_function);
2525*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2526*4882a593Smuzhiyun 	int done;
2527*4882a593Smuzhiyun 
2528*4882a593Smuzhiyun 	do {
2529*4882a593Smuzhiyun 		int err = sock_error(sk);
2530*4882a593Smuzhiyun 		if (err)
2531*4882a593Smuzhiyun 			return err;
2532*4882a593Smuzhiyun 		if (!*timeo_p)
2533*4882a593Smuzhiyun 			return -ETIMEDOUT;
2534*4882a593Smuzhiyun 		if (signal_pending(current))
2535*4882a593Smuzhiyun 			return sock_intr_errno(*timeo_p);
2536*4882a593Smuzhiyun 		if (sk->sk_state == TIPC_DISCONNECTING)
2537*4882a593Smuzhiyun 			break;
2538*4882a593Smuzhiyun 
2539*4882a593Smuzhiyun 		add_wait_queue(sk_sleep(sk), &wait);
2540*4882a593Smuzhiyun 		done = sk_wait_event(sk, timeo_p, tipc_sk_connected(sk),
2541*4882a593Smuzhiyun 				     &wait);
2542*4882a593Smuzhiyun 		remove_wait_queue(sk_sleep(sk), &wait);
2543*4882a593Smuzhiyun 	} while (!done);
2544*4882a593Smuzhiyun 	return 0;
2545*4882a593Smuzhiyun }
2546*4882a593Smuzhiyun 
tipc_sockaddr_is_sane(struct sockaddr_tipc * addr)2547*4882a593Smuzhiyun static bool tipc_sockaddr_is_sane(struct sockaddr_tipc *addr)
2548*4882a593Smuzhiyun {
2549*4882a593Smuzhiyun 	if (addr->family != AF_TIPC)
2550*4882a593Smuzhiyun 		return false;
2551*4882a593Smuzhiyun 	if (addr->addrtype == TIPC_SERVICE_RANGE)
2552*4882a593Smuzhiyun 		return (addr->addr.nameseq.lower <= addr->addr.nameseq.upper);
2553*4882a593Smuzhiyun 	return (addr->addrtype == TIPC_SERVICE_ADDR ||
2554*4882a593Smuzhiyun 		addr->addrtype == TIPC_SOCKET_ADDR);
2555*4882a593Smuzhiyun }
2556*4882a593Smuzhiyun 
2557*4882a593Smuzhiyun /**
2558*4882a593Smuzhiyun  * tipc_connect - establish a connection to another TIPC port
2559*4882a593Smuzhiyun  * @sock: socket structure
2560*4882a593Smuzhiyun  * @dest: socket address for destination port
2561*4882a593Smuzhiyun  * @destlen: size of socket address data structure
2562*4882a593Smuzhiyun  * @flags: file-related flags associated with socket
2563*4882a593Smuzhiyun  *
2564*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
2565*4882a593Smuzhiyun  */
tipc_connect(struct socket * sock,struct sockaddr * dest,int destlen,int flags)2566*4882a593Smuzhiyun static int tipc_connect(struct socket *sock, struct sockaddr *dest,
2567*4882a593Smuzhiyun 			int destlen, int flags)
2568*4882a593Smuzhiyun {
2569*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2570*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2571*4882a593Smuzhiyun 	struct sockaddr_tipc *dst = (struct sockaddr_tipc *)dest;
2572*4882a593Smuzhiyun 	struct msghdr m = {NULL,};
2573*4882a593Smuzhiyun 	long timeout = (flags & O_NONBLOCK) ? 0 : tsk->conn_timeout;
2574*4882a593Smuzhiyun 	int previous;
2575*4882a593Smuzhiyun 	int res = 0;
2576*4882a593Smuzhiyun 
2577*4882a593Smuzhiyun 	if (destlen != sizeof(struct sockaddr_tipc))
2578*4882a593Smuzhiyun 		return -EINVAL;
2579*4882a593Smuzhiyun 
2580*4882a593Smuzhiyun 	lock_sock(sk);
2581*4882a593Smuzhiyun 
2582*4882a593Smuzhiyun 	if (tsk->group) {
2583*4882a593Smuzhiyun 		res = -EINVAL;
2584*4882a593Smuzhiyun 		goto exit;
2585*4882a593Smuzhiyun 	}
2586*4882a593Smuzhiyun 
2587*4882a593Smuzhiyun 	if (dst->family == AF_UNSPEC) {
2588*4882a593Smuzhiyun 		memset(&tsk->peer, 0, sizeof(struct sockaddr_tipc));
2589*4882a593Smuzhiyun 		if (!tipc_sk_type_connectionless(sk))
2590*4882a593Smuzhiyun 			res = -EINVAL;
2591*4882a593Smuzhiyun 		goto exit;
2592*4882a593Smuzhiyun 	}
2593*4882a593Smuzhiyun 	if (!tipc_sockaddr_is_sane(dst)) {
2594*4882a593Smuzhiyun 		res = -EINVAL;
2595*4882a593Smuzhiyun 		goto exit;
2596*4882a593Smuzhiyun 	}
2597*4882a593Smuzhiyun 	/* DGRAM/RDM connect(), just save the destaddr */
2598*4882a593Smuzhiyun 	if (tipc_sk_type_connectionless(sk)) {
2599*4882a593Smuzhiyun 		memcpy(&tsk->peer, dest, destlen);
2600*4882a593Smuzhiyun 		goto exit;
2601*4882a593Smuzhiyun 	} else if (dst->addrtype == TIPC_SERVICE_RANGE) {
2602*4882a593Smuzhiyun 		res = -EINVAL;
2603*4882a593Smuzhiyun 		goto exit;
2604*4882a593Smuzhiyun 	}
2605*4882a593Smuzhiyun 
2606*4882a593Smuzhiyun 	previous = sk->sk_state;
2607*4882a593Smuzhiyun 
2608*4882a593Smuzhiyun 	switch (sk->sk_state) {
2609*4882a593Smuzhiyun 	case TIPC_OPEN:
2610*4882a593Smuzhiyun 		/* Send a 'SYN-' to destination */
2611*4882a593Smuzhiyun 		m.msg_name = dest;
2612*4882a593Smuzhiyun 		m.msg_namelen = destlen;
2613*4882a593Smuzhiyun 
2614*4882a593Smuzhiyun 		/* If connect is in non-blocking case, set MSG_DONTWAIT to
2615*4882a593Smuzhiyun 		 * indicate send_msg() is never blocked.
2616*4882a593Smuzhiyun 		 */
2617*4882a593Smuzhiyun 		if (!timeout)
2618*4882a593Smuzhiyun 			m.msg_flags = MSG_DONTWAIT;
2619*4882a593Smuzhiyun 
2620*4882a593Smuzhiyun 		res = __tipc_sendmsg(sock, &m, 0);
2621*4882a593Smuzhiyun 		if ((res < 0) && (res != -EWOULDBLOCK))
2622*4882a593Smuzhiyun 			goto exit;
2623*4882a593Smuzhiyun 
2624*4882a593Smuzhiyun 		/* Just entered TIPC_CONNECTING state; the only
2625*4882a593Smuzhiyun 		 * difference is that return value in non-blocking
2626*4882a593Smuzhiyun 		 * case is EINPROGRESS, rather than EALREADY.
2627*4882a593Smuzhiyun 		 */
2628*4882a593Smuzhiyun 		res = -EINPROGRESS;
2629*4882a593Smuzhiyun 		fallthrough;
2630*4882a593Smuzhiyun 	case TIPC_CONNECTING:
2631*4882a593Smuzhiyun 		if (!timeout) {
2632*4882a593Smuzhiyun 			if (previous == TIPC_CONNECTING)
2633*4882a593Smuzhiyun 				res = -EALREADY;
2634*4882a593Smuzhiyun 			goto exit;
2635*4882a593Smuzhiyun 		}
2636*4882a593Smuzhiyun 		timeout = msecs_to_jiffies(timeout);
2637*4882a593Smuzhiyun 		/* Wait until an 'ACK' or 'RST' arrives, or a timeout occurs */
2638*4882a593Smuzhiyun 		res = tipc_wait_for_connect(sock, &timeout);
2639*4882a593Smuzhiyun 		break;
2640*4882a593Smuzhiyun 	case TIPC_ESTABLISHED:
2641*4882a593Smuzhiyun 		res = -EISCONN;
2642*4882a593Smuzhiyun 		break;
2643*4882a593Smuzhiyun 	default:
2644*4882a593Smuzhiyun 		res = -EINVAL;
2645*4882a593Smuzhiyun 	}
2646*4882a593Smuzhiyun 
2647*4882a593Smuzhiyun exit:
2648*4882a593Smuzhiyun 	release_sock(sk);
2649*4882a593Smuzhiyun 	return res;
2650*4882a593Smuzhiyun }
2651*4882a593Smuzhiyun 
2652*4882a593Smuzhiyun /**
2653*4882a593Smuzhiyun  * tipc_listen - allow socket to listen for incoming connections
2654*4882a593Smuzhiyun  * @sock: socket structure
2655*4882a593Smuzhiyun  * @len: (unused)
2656*4882a593Smuzhiyun  *
2657*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
2658*4882a593Smuzhiyun  */
tipc_listen(struct socket * sock,int len)2659*4882a593Smuzhiyun static int tipc_listen(struct socket *sock, int len)
2660*4882a593Smuzhiyun {
2661*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2662*4882a593Smuzhiyun 	int res;
2663*4882a593Smuzhiyun 
2664*4882a593Smuzhiyun 	lock_sock(sk);
2665*4882a593Smuzhiyun 	res = tipc_set_sk_state(sk, TIPC_LISTEN);
2666*4882a593Smuzhiyun 	release_sock(sk);
2667*4882a593Smuzhiyun 
2668*4882a593Smuzhiyun 	return res;
2669*4882a593Smuzhiyun }
2670*4882a593Smuzhiyun 
tipc_wait_for_accept(struct socket * sock,long timeo)2671*4882a593Smuzhiyun static int tipc_wait_for_accept(struct socket *sock, long timeo)
2672*4882a593Smuzhiyun {
2673*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2674*4882a593Smuzhiyun 	DEFINE_WAIT_FUNC(wait, woken_wake_function);
2675*4882a593Smuzhiyun 	int err;
2676*4882a593Smuzhiyun 
2677*4882a593Smuzhiyun 	/* True wake-one mechanism for incoming connections: only
2678*4882a593Smuzhiyun 	 * one process gets woken up, not the 'whole herd'.
2679*4882a593Smuzhiyun 	 * Since we do not 'race & poll' for established sockets
2680*4882a593Smuzhiyun 	 * anymore, the common case will execute the loop only once.
2681*4882a593Smuzhiyun 	*/
2682*4882a593Smuzhiyun 	for (;;) {
2683*4882a593Smuzhiyun 		if (timeo && skb_queue_empty(&sk->sk_receive_queue)) {
2684*4882a593Smuzhiyun 			add_wait_queue(sk_sleep(sk), &wait);
2685*4882a593Smuzhiyun 			release_sock(sk);
2686*4882a593Smuzhiyun 			timeo = wait_woken(&wait, TASK_INTERRUPTIBLE, timeo);
2687*4882a593Smuzhiyun 			lock_sock(sk);
2688*4882a593Smuzhiyun 			remove_wait_queue(sk_sleep(sk), &wait);
2689*4882a593Smuzhiyun 		}
2690*4882a593Smuzhiyun 		err = 0;
2691*4882a593Smuzhiyun 		if (!skb_queue_empty(&sk->sk_receive_queue))
2692*4882a593Smuzhiyun 			break;
2693*4882a593Smuzhiyun 		err = -EAGAIN;
2694*4882a593Smuzhiyun 		if (!timeo)
2695*4882a593Smuzhiyun 			break;
2696*4882a593Smuzhiyun 		err = sock_intr_errno(timeo);
2697*4882a593Smuzhiyun 		if (signal_pending(current))
2698*4882a593Smuzhiyun 			break;
2699*4882a593Smuzhiyun 	}
2700*4882a593Smuzhiyun 	return err;
2701*4882a593Smuzhiyun }
2702*4882a593Smuzhiyun 
2703*4882a593Smuzhiyun /**
2704*4882a593Smuzhiyun  * tipc_accept - wait for connection request
2705*4882a593Smuzhiyun  * @sock: listening socket
2706*4882a593Smuzhiyun  * @new_sock: new socket that is to be connected
2707*4882a593Smuzhiyun  * @flags: file-related flags associated with socket
2708*4882a593Smuzhiyun  *
2709*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
2710*4882a593Smuzhiyun  */
tipc_accept(struct socket * sock,struct socket * new_sock,int flags,bool kern)2711*4882a593Smuzhiyun static int tipc_accept(struct socket *sock, struct socket *new_sock, int flags,
2712*4882a593Smuzhiyun 		       bool kern)
2713*4882a593Smuzhiyun {
2714*4882a593Smuzhiyun 	struct sock *new_sk, *sk = sock->sk;
2715*4882a593Smuzhiyun 	struct tipc_sock *new_tsock;
2716*4882a593Smuzhiyun 	struct msghdr m = {NULL,};
2717*4882a593Smuzhiyun 	struct tipc_msg *msg;
2718*4882a593Smuzhiyun 	struct sk_buff *buf;
2719*4882a593Smuzhiyun 	long timeo;
2720*4882a593Smuzhiyun 	int res;
2721*4882a593Smuzhiyun 
2722*4882a593Smuzhiyun 	lock_sock(sk);
2723*4882a593Smuzhiyun 
2724*4882a593Smuzhiyun 	if (sk->sk_state != TIPC_LISTEN) {
2725*4882a593Smuzhiyun 		res = -EINVAL;
2726*4882a593Smuzhiyun 		goto exit;
2727*4882a593Smuzhiyun 	}
2728*4882a593Smuzhiyun 	timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);
2729*4882a593Smuzhiyun 	res = tipc_wait_for_accept(sock, timeo);
2730*4882a593Smuzhiyun 	if (res)
2731*4882a593Smuzhiyun 		goto exit;
2732*4882a593Smuzhiyun 
2733*4882a593Smuzhiyun 	buf = skb_peek(&sk->sk_receive_queue);
2734*4882a593Smuzhiyun 
2735*4882a593Smuzhiyun 	res = tipc_sk_create(sock_net(sock->sk), new_sock, 0, kern);
2736*4882a593Smuzhiyun 	if (res)
2737*4882a593Smuzhiyun 		goto exit;
2738*4882a593Smuzhiyun 	security_sk_clone(sock->sk, new_sock->sk);
2739*4882a593Smuzhiyun 
2740*4882a593Smuzhiyun 	new_sk = new_sock->sk;
2741*4882a593Smuzhiyun 	new_tsock = tipc_sk(new_sk);
2742*4882a593Smuzhiyun 	msg = buf_msg(buf);
2743*4882a593Smuzhiyun 
2744*4882a593Smuzhiyun 	/* we lock on new_sk; but lockdep sees the lock on sk */
2745*4882a593Smuzhiyun 	lock_sock_nested(new_sk, SINGLE_DEPTH_NESTING);
2746*4882a593Smuzhiyun 
2747*4882a593Smuzhiyun 	/*
2748*4882a593Smuzhiyun 	 * Reject any stray messages received by new socket
2749*4882a593Smuzhiyun 	 * before the socket lock was taken (very, very unlikely)
2750*4882a593Smuzhiyun 	 */
2751*4882a593Smuzhiyun 	tsk_rej_rx_queue(new_sk, TIPC_ERR_NO_PORT);
2752*4882a593Smuzhiyun 
2753*4882a593Smuzhiyun 	/* Connect new socket to it's peer */
2754*4882a593Smuzhiyun 	tipc_sk_finish_conn(new_tsock, msg_origport(msg), msg_orignode(msg));
2755*4882a593Smuzhiyun 
2756*4882a593Smuzhiyun 	tsk_set_importance(new_sk, msg_importance(msg));
2757*4882a593Smuzhiyun 	if (msg_named(msg)) {
2758*4882a593Smuzhiyun 		new_tsock->conn_type = msg_nametype(msg);
2759*4882a593Smuzhiyun 		new_tsock->conn_instance = msg_nameinst(msg);
2760*4882a593Smuzhiyun 	}
2761*4882a593Smuzhiyun 
2762*4882a593Smuzhiyun 	/*
2763*4882a593Smuzhiyun 	 * Respond to 'SYN-' by discarding it & returning 'ACK'.
2764*4882a593Smuzhiyun 	 * Respond to 'SYN+' by queuing it on new socket & returning 'ACK'.
2765*4882a593Smuzhiyun 	 */
2766*4882a593Smuzhiyun 	if (!msg_data_sz(msg)) {
2767*4882a593Smuzhiyun 		tsk_advance_rx_queue(sk);
2768*4882a593Smuzhiyun 	} else {
2769*4882a593Smuzhiyun 		__skb_dequeue(&sk->sk_receive_queue);
2770*4882a593Smuzhiyun 		__skb_queue_head(&new_sk->sk_receive_queue, buf);
2771*4882a593Smuzhiyun 		skb_set_owner_r(buf, new_sk);
2772*4882a593Smuzhiyun 	}
2773*4882a593Smuzhiyun 	__tipc_sendstream(new_sock, &m, 0);
2774*4882a593Smuzhiyun 	release_sock(new_sk);
2775*4882a593Smuzhiyun exit:
2776*4882a593Smuzhiyun 	release_sock(sk);
2777*4882a593Smuzhiyun 	return res;
2778*4882a593Smuzhiyun }
2779*4882a593Smuzhiyun 
2780*4882a593Smuzhiyun /**
2781*4882a593Smuzhiyun  * tipc_shutdown - shutdown socket connection
2782*4882a593Smuzhiyun  * @sock: socket structure
2783*4882a593Smuzhiyun  * @how: direction to close (must be SHUT_RDWR)
2784*4882a593Smuzhiyun  *
2785*4882a593Smuzhiyun  * Terminates connection (if necessary), then purges socket's receive queue.
2786*4882a593Smuzhiyun  *
2787*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
2788*4882a593Smuzhiyun  */
tipc_shutdown(struct socket * sock,int how)2789*4882a593Smuzhiyun static int tipc_shutdown(struct socket *sock, int how)
2790*4882a593Smuzhiyun {
2791*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
2792*4882a593Smuzhiyun 	int res;
2793*4882a593Smuzhiyun 
2794*4882a593Smuzhiyun 	if (how != SHUT_RDWR)
2795*4882a593Smuzhiyun 		return -EINVAL;
2796*4882a593Smuzhiyun 
2797*4882a593Smuzhiyun 	lock_sock(sk);
2798*4882a593Smuzhiyun 
2799*4882a593Smuzhiyun 	trace_tipc_sk_shutdown(sk, NULL, TIPC_DUMP_ALL, " ");
2800*4882a593Smuzhiyun 	__tipc_shutdown(sock, TIPC_CONN_SHUTDOWN);
2801*4882a593Smuzhiyun 	sk->sk_shutdown = SHUTDOWN_MASK;
2802*4882a593Smuzhiyun 
2803*4882a593Smuzhiyun 	if (sk->sk_state == TIPC_DISCONNECTING) {
2804*4882a593Smuzhiyun 		/* Discard any unreceived messages */
2805*4882a593Smuzhiyun 		__skb_queue_purge(&sk->sk_receive_queue);
2806*4882a593Smuzhiyun 
2807*4882a593Smuzhiyun 		res = 0;
2808*4882a593Smuzhiyun 	} else {
2809*4882a593Smuzhiyun 		res = -ENOTCONN;
2810*4882a593Smuzhiyun 	}
2811*4882a593Smuzhiyun 	/* Wake up anyone sleeping in poll. */
2812*4882a593Smuzhiyun 	sk->sk_state_change(sk);
2813*4882a593Smuzhiyun 
2814*4882a593Smuzhiyun 	release_sock(sk);
2815*4882a593Smuzhiyun 	return res;
2816*4882a593Smuzhiyun }
2817*4882a593Smuzhiyun 
tipc_sk_check_probing_state(struct sock * sk,struct sk_buff_head * list)2818*4882a593Smuzhiyun static void tipc_sk_check_probing_state(struct sock *sk,
2819*4882a593Smuzhiyun 					struct sk_buff_head *list)
2820*4882a593Smuzhiyun {
2821*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2822*4882a593Smuzhiyun 	u32 pnode = tsk_peer_node(tsk);
2823*4882a593Smuzhiyun 	u32 pport = tsk_peer_port(tsk);
2824*4882a593Smuzhiyun 	u32 self = tsk_own_node(tsk);
2825*4882a593Smuzhiyun 	u32 oport = tsk->portid;
2826*4882a593Smuzhiyun 	struct sk_buff *skb;
2827*4882a593Smuzhiyun 
2828*4882a593Smuzhiyun 	if (tsk->probe_unacked) {
2829*4882a593Smuzhiyun 		tipc_set_sk_state(sk, TIPC_DISCONNECTING);
2830*4882a593Smuzhiyun 		sk->sk_err = ECONNABORTED;
2831*4882a593Smuzhiyun 		tipc_node_remove_conn(sock_net(sk), pnode, pport);
2832*4882a593Smuzhiyun 		sk->sk_state_change(sk);
2833*4882a593Smuzhiyun 		return;
2834*4882a593Smuzhiyun 	}
2835*4882a593Smuzhiyun 	/* Prepare new probe */
2836*4882a593Smuzhiyun 	skb = tipc_msg_create(CONN_MANAGER, CONN_PROBE, INT_H_SIZE, 0,
2837*4882a593Smuzhiyun 			      pnode, self, pport, oport, TIPC_OK);
2838*4882a593Smuzhiyun 	if (skb)
2839*4882a593Smuzhiyun 		__skb_queue_tail(list, skb);
2840*4882a593Smuzhiyun 	tsk->probe_unacked = true;
2841*4882a593Smuzhiyun 	sk_reset_timer(sk, &sk->sk_timer, jiffies + CONN_PROBING_INTV);
2842*4882a593Smuzhiyun }
2843*4882a593Smuzhiyun 
tipc_sk_retry_connect(struct sock * sk,struct sk_buff_head * list)2844*4882a593Smuzhiyun static void tipc_sk_retry_connect(struct sock *sk, struct sk_buff_head *list)
2845*4882a593Smuzhiyun {
2846*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2847*4882a593Smuzhiyun 
2848*4882a593Smuzhiyun 	/* Try again later if dest link is congested */
2849*4882a593Smuzhiyun 	if (tsk->cong_link_cnt) {
2850*4882a593Smuzhiyun 		sk_reset_timer(sk, &sk->sk_timer,
2851*4882a593Smuzhiyun 			       jiffies + msecs_to_jiffies(100));
2852*4882a593Smuzhiyun 		return;
2853*4882a593Smuzhiyun 	}
2854*4882a593Smuzhiyun 	/* Prepare SYN for retransmit */
2855*4882a593Smuzhiyun 	tipc_msg_skb_clone(&sk->sk_write_queue, list);
2856*4882a593Smuzhiyun }
2857*4882a593Smuzhiyun 
tipc_sk_timeout(struct timer_list * t)2858*4882a593Smuzhiyun static void tipc_sk_timeout(struct timer_list *t)
2859*4882a593Smuzhiyun {
2860*4882a593Smuzhiyun 	struct sock *sk = from_timer(sk, t, sk_timer);
2861*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
2862*4882a593Smuzhiyun 	u32 pnode = tsk_peer_node(tsk);
2863*4882a593Smuzhiyun 	struct sk_buff_head list;
2864*4882a593Smuzhiyun 	int rc = 0;
2865*4882a593Smuzhiyun 
2866*4882a593Smuzhiyun 	__skb_queue_head_init(&list);
2867*4882a593Smuzhiyun 	bh_lock_sock(sk);
2868*4882a593Smuzhiyun 
2869*4882a593Smuzhiyun 	/* Try again later if socket is busy */
2870*4882a593Smuzhiyun 	if (sock_owned_by_user(sk)) {
2871*4882a593Smuzhiyun 		sk_reset_timer(sk, &sk->sk_timer, jiffies + HZ / 20);
2872*4882a593Smuzhiyun 		bh_unlock_sock(sk);
2873*4882a593Smuzhiyun 		sock_put(sk);
2874*4882a593Smuzhiyun 		return;
2875*4882a593Smuzhiyun 	}
2876*4882a593Smuzhiyun 
2877*4882a593Smuzhiyun 	if (sk->sk_state == TIPC_ESTABLISHED)
2878*4882a593Smuzhiyun 		tipc_sk_check_probing_state(sk, &list);
2879*4882a593Smuzhiyun 	else if (sk->sk_state == TIPC_CONNECTING)
2880*4882a593Smuzhiyun 		tipc_sk_retry_connect(sk, &list);
2881*4882a593Smuzhiyun 
2882*4882a593Smuzhiyun 	bh_unlock_sock(sk);
2883*4882a593Smuzhiyun 
2884*4882a593Smuzhiyun 	if (!skb_queue_empty(&list))
2885*4882a593Smuzhiyun 		rc = tipc_node_xmit(sock_net(sk), &list, pnode, tsk->portid);
2886*4882a593Smuzhiyun 
2887*4882a593Smuzhiyun 	/* SYN messages may cause link congestion */
2888*4882a593Smuzhiyun 	if (rc == -ELINKCONG) {
2889*4882a593Smuzhiyun 		tipc_dest_push(&tsk->cong_links, pnode, 0);
2890*4882a593Smuzhiyun 		tsk->cong_link_cnt = 1;
2891*4882a593Smuzhiyun 	}
2892*4882a593Smuzhiyun 	sock_put(sk);
2893*4882a593Smuzhiyun }
2894*4882a593Smuzhiyun 
/* tipc_sk_publish - bind a service range to the socket
 * @tsk: socket doing the binding
 * @scope: requested scope; anything but TIPC_NODE_SCOPE is treated as
 *         TIPC_CLUSTER_SCOPE
 * @seq: service type and lower/upper instance bounds to publish
 *
 * Returns 0 on success, -EINVAL if the socket is connected or the name
 * table refuses the publication, -EADDRINUSE if the computed key would
 * be equal to the socket's own port id.
 */
static int tipc_sk_publish(struct tipc_sock *tsk, uint scope,
			   struct tipc_name_seq const *seq)
{
	struct sock *sk = &tsk->sk;
	struct publication *p;
	u32 key;

	if (tipc_sk_connected(sk))
		return -EINVAL;

	/* A key equal to the port id is never handed out */
	key = tsk->portid + tsk->pub_count + 1;
	if (key == tsk->portid)
		return -EADDRINUSE;

	if (scope != TIPC_NODE_SCOPE)
		scope = TIPC_CLUSTER_SCOPE;

	p = tipc_nametbl_publish(sock_net(sk), seq->type, seq->lower,
				 seq->upper, scope, tsk->portid, key);
	if (unlikely(!p))
		return -EINVAL;

	/* Track the binding on the socket's own publication list */
	list_add(&p->binding_sock, &tsk->publications);
	tsk->pub_count++;
	tsk->published = 1;
	return 0;
}
2922*4882a593Smuzhiyun 
/* tipc_sk_withdraw - withdraw one or all of the socket's publications
 * @tsk: socket owning the publications
 * @scope: scope of the publication to withdraw; anything but
 *         TIPC_NODE_SCOPE is treated as TIPC_CLUSTER_SCOPE. Only consulted
 *         when @seq is given.
 * @seq: service range to withdraw, or NULL to withdraw every publication
 *
 * With @seq set, the first publication matching scope, type, lower and
 * upper is withdrawn and the search stops. A publication that differs in
 * any of these fields - including only the upper bound - is skipped, so a
 * socket bound to several ranges sharing the same type and lower bound can
 * still withdraw each of them individually.
 *
 * Returns 0 if at least one publication was withdrawn, -EINVAL otherwise.
 */
static int tipc_sk_withdraw(struct tipc_sock *tsk, uint scope,
			    struct tipc_name_seq const *seq)
{
	struct net *net = sock_net(&tsk->sk);
	struct publication *publ;
	struct publication *safe;
	int rc = -EINVAL;

	if (scope != TIPC_NODE_SCOPE)
		scope = TIPC_CLUSTER_SCOPE;

	/* The _safe iterator is used because the entry may go away during
	 * the withdraw call (presumably it is unlinked and freed there -
	 * TODO confirm against the name table implementation).
	 */
	list_for_each_entry_safe(publ, safe, &tsk->publications, binding_sock) {
		if (!seq) {
			/* No range given: withdraw everything */
			tipc_nametbl_withdraw(net, publ->type, publ->lower,
					      publ->upper, publ->key);
			rc = 0;
			continue;
		}

		/* Withdraw one specific publication */
		if (publ->scope != scope)
			continue;
		if (publ->type != seq->type)
			continue;
		if (publ->lower != seq->lower)
			continue;
		/* Keep searching: another binding may share type/lower */
		if (publ->upper != seq->upper)
			continue;
		tipc_nametbl_withdraw(net, publ->type, publ->lower,
				      publ->upper, publ->key);
		rc = 0;
		break;
	}
	if (list_empty(&tsk->publications))
		tsk->published = 0;
	return rc;
}
2957*4882a593Smuzhiyun 
2958*4882a593Smuzhiyun /* tipc_sk_reinit: set non-zero address in all existing sockets
2959*4882a593Smuzhiyun  *                 when we go from standalone to network mode.
2960*4882a593Smuzhiyun  */
tipc_sk_reinit(struct net * net)2961*4882a593Smuzhiyun void tipc_sk_reinit(struct net *net)
2962*4882a593Smuzhiyun {
2963*4882a593Smuzhiyun 	struct tipc_net *tn = net_generic(net, tipc_net_id);
2964*4882a593Smuzhiyun 	struct rhashtable_iter iter;
2965*4882a593Smuzhiyun 	struct tipc_sock *tsk;
2966*4882a593Smuzhiyun 	struct tipc_msg *msg;
2967*4882a593Smuzhiyun 
2968*4882a593Smuzhiyun 	rhashtable_walk_enter(&tn->sk_rht, &iter);
2969*4882a593Smuzhiyun 
2970*4882a593Smuzhiyun 	do {
2971*4882a593Smuzhiyun 		rhashtable_walk_start(&iter);
2972*4882a593Smuzhiyun 
2973*4882a593Smuzhiyun 		while ((tsk = rhashtable_walk_next(&iter)) && !IS_ERR(tsk)) {
2974*4882a593Smuzhiyun 			sock_hold(&tsk->sk);
2975*4882a593Smuzhiyun 			rhashtable_walk_stop(&iter);
2976*4882a593Smuzhiyun 			lock_sock(&tsk->sk);
2977*4882a593Smuzhiyun 			msg = &tsk->phdr;
2978*4882a593Smuzhiyun 			msg_set_prevnode(msg, tipc_own_addr(net));
2979*4882a593Smuzhiyun 			msg_set_orignode(msg, tipc_own_addr(net));
2980*4882a593Smuzhiyun 			release_sock(&tsk->sk);
2981*4882a593Smuzhiyun 			rhashtable_walk_start(&iter);
2982*4882a593Smuzhiyun 			sock_put(&tsk->sk);
2983*4882a593Smuzhiyun 		}
2984*4882a593Smuzhiyun 
2985*4882a593Smuzhiyun 		rhashtable_walk_stop(&iter);
2986*4882a593Smuzhiyun 	} while (tsk == ERR_PTR(-EAGAIN));
2987*4882a593Smuzhiyun 
2988*4882a593Smuzhiyun 	rhashtable_walk_exit(&iter);
2989*4882a593Smuzhiyun }
2990*4882a593Smuzhiyun 
/* tipc_sk_lookup - find the socket bound to a port id
 * @net: namespace whose socket hash table is searched
 * @portid: port id used as lookup key
 *
 * Returns the socket with an extra reference held (the caller must drop
 * it with sock_put()), or NULL if no socket has that port id.
 */
static struct tipc_sock *tipc_sk_lookup(struct net *net, u32 portid)
{
	struct tipc_net *tn = net_generic(net, tipc_net_id);
	struct tipc_sock *found;

	rcu_read_lock();
	found = rhashtable_lookup(&tn->sk_rht, &portid, tsk_rht_params);
	/* Take the reference before leaving the RCU read section */
	if (found)
		sock_hold(&found->sk);
	rcu_read_unlock();

	return found;
}
3004*4882a593Smuzhiyun 
tipc_sk_insert(struct tipc_sock * tsk)3005*4882a593Smuzhiyun static int tipc_sk_insert(struct tipc_sock *tsk)
3006*4882a593Smuzhiyun {
3007*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
3008*4882a593Smuzhiyun 	struct net *net = sock_net(sk);
3009*4882a593Smuzhiyun 	struct tipc_net *tn = net_generic(net, tipc_net_id);
3010*4882a593Smuzhiyun 	u32 remaining = (TIPC_MAX_PORT - TIPC_MIN_PORT) + 1;
3011*4882a593Smuzhiyun 	u32 portid = prandom_u32() % remaining + TIPC_MIN_PORT;
3012*4882a593Smuzhiyun 
3013*4882a593Smuzhiyun 	while (remaining--) {
3014*4882a593Smuzhiyun 		portid++;
3015*4882a593Smuzhiyun 		if ((portid < TIPC_MIN_PORT) || (portid > TIPC_MAX_PORT))
3016*4882a593Smuzhiyun 			portid = TIPC_MIN_PORT;
3017*4882a593Smuzhiyun 		tsk->portid = portid;
3018*4882a593Smuzhiyun 		sock_hold(&tsk->sk);
3019*4882a593Smuzhiyun 		if (!rhashtable_lookup_insert_fast(&tn->sk_rht, &tsk->node,
3020*4882a593Smuzhiyun 						   tsk_rht_params))
3021*4882a593Smuzhiyun 			return 0;
3022*4882a593Smuzhiyun 		sock_put(&tsk->sk);
3023*4882a593Smuzhiyun 	}
3024*4882a593Smuzhiyun 
3025*4882a593Smuzhiyun 	return -1;
3026*4882a593Smuzhiyun }
3027*4882a593Smuzhiyun 
tipc_sk_remove(struct tipc_sock * tsk)3028*4882a593Smuzhiyun static void tipc_sk_remove(struct tipc_sock *tsk)
3029*4882a593Smuzhiyun {
3030*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
3031*4882a593Smuzhiyun 	struct tipc_net *tn = net_generic(sock_net(sk), tipc_net_id);
3032*4882a593Smuzhiyun 
3033*4882a593Smuzhiyun 	if (!rhashtable_remove_fast(&tn->sk_rht, &tsk->node, tsk_rht_params)) {
3034*4882a593Smuzhiyun 		WARN_ON(refcount_read(&sk->sk_refcnt) == 1);
3035*4882a593Smuzhiyun 		__sock_put(sk);
3036*4882a593Smuzhiyun 	}
3037*4882a593Smuzhiyun }
3038*4882a593Smuzhiyun 
3039*4882a593Smuzhiyun static const struct rhashtable_params tsk_rht_params = {
3040*4882a593Smuzhiyun 	.nelem_hint = 192,
3041*4882a593Smuzhiyun 	.head_offset = offsetof(struct tipc_sock, node),
3042*4882a593Smuzhiyun 	.key_offset = offsetof(struct tipc_sock, portid),
3043*4882a593Smuzhiyun 	.key_len = sizeof(u32), /* portid */
3044*4882a593Smuzhiyun 	.max_size = 1048576,
3045*4882a593Smuzhiyun 	.min_size = 256,
3046*4882a593Smuzhiyun 	.automatic_shrinking = true,
3047*4882a593Smuzhiyun };
3048*4882a593Smuzhiyun 
tipc_sk_rht_init(struct net * net)3049*4882a593Smuzhiyun int tipc_sk_rht_init(struct net *net)
3050*4882a593Smuzhiyun {
3051*4882a593Smuzhiyun 	struct tipc_net *tn = net_generic(net, tipc_net_id);
3052*4882a593Smuzhiyun 
3053*4882a593Smuzhiyun 	return rhashtable_init(&tn->sk_rht, &tsk_rht_params);
3054*4882a593Smuzhiyun }
3055*4882a593Smuzhiyun 
tipc_sk_rht_destroy(struct net * net)3056*4882a593Smuzhiyun void tipc_sk_rht_destroy(struct net *net)
3057*4882a593Smuzhiyun {
3058*4882a593Smuzhiyun 	struct tipc_net *tn = net_generic(net, tipc_net_id);
3059*4882a593Smuzhiyun 
3060*4882a593Smuzhiyun 	/* Wait for socket readers to complete */
3061*4882a593Smuzhiyun 	synchronize_net();
3062*4882a593Smuzhiyun 
3063*4882a593Smuzhiyun 	rhashtable_destroy(&tn->sk_rht);
3064*4882a593Smuzhiyun }
3065*4882a593Smuzhiyun 
tipc_sk_join(struct tipc_sock * tsk,struct tipc_group_req * mreq)3066*4882a593Smuzhiyun static int tipc_sk_join(struct tipc_sock *tsk, struct tipc_group_req *mreq)
3067*4882a593Smuzhiyun {
3068*4882a593Smuzhiyun 	struct net *net = sock_net(&tsk->sk);
3069*4882a593Smuzhiyun 	struct tipc_group *grp = tsk->group;
3070*4882a593Smuzhiyun 	struct tipc_msg *hdr = &tsk->phdr;
3071*4882a593Smuzhiyun 	struct tipc_name_seq seq;
3072*4882a593Smuzhiyun 	int rc;
3073*4882a593Smuzhiyun 
3074*4882a593Smuzhiyun 	if (mreq->type < TIPC_RESERVED_TYPES)
3075*4882a593Smuzhiyun 		return -EACCES;
3076*4882a593Smuzhiyun 	if (mreq->scope > TIPC_NODE_SCOPE)
3077*4882a593Smuzhiyun 		return -EINVAL;
3078*4882a593Smuzhiyun 	if (grp)
3079*4882a593Smuzhiyun 		return -EACCES;
3080*4882a593Smuzhiyun 	grp = tipc_group_create(net, tsk->portid, mreq, &tsk->group_is_open);
3081*4882a593Smuzhiyun 	if (!grp)
3082*4882a593Smuzhiyun 		return -ENOMEM;
3083*4882a593Smuzhiyun 	tsk->group = grp;
3084*4882a593Smuzhiyun 	msg_set_lookup_scope(hdr, mreq->scope);
3085*4882a593Smuzhiyun 	msg_set_nametype(hdr, mreq->type);
3086*4882a593Smuzhiyun 	msg_set_dest_droppable(hdr, true);
3087*4882a593Smuzhiyun 	seq.type = mreq->type;
3088*4882a593Smuzhiyun 	seq.lower = mreq->instance;
3089*4882a593Smuzhiyun 	seq.upper = seq.lower;
3090*4882a593Smuzhiyun 	tipc_nametbl_build_group(net, grp, mreq->type, mreq->scope);
3091*4882a593Smuzhiyun 	rc = tipc_sk_publish(tsk, mreq->scope, &seq);
3092*4882a593Smuzhiyun 	if (rc) {
3093*4882a593Smuzhiyun 		tipc_group_delete(net, grp);
3094*4882a593Smuzhiyun 		tsk->group = NULL;
3095*4882a593Smuzhiyun 		return rc;
3096*4882a593Smuzhiyun 	}
3097*4882a593Smuzhiyun 	/* Eliminate any risk that a broadcast overtakes sent JOINs */
3098*4882a593Smuzhiyun 	tsk->mc_method.rcast = true;
3099*4882a593Smuzhiyun 	tsk->mc_method.mandatory = true;
3100*4882a593Smuzhiyun 	tipc_group_join(net, grp, &tsk->sk.sk_rcvbuf);
3101*4882a593Smuzhiyun 	return rc;
3102*4882a593Smuzhiyun }
3103*4882a593Smuzhiyun 
tipc_sk_leave(struct tipc_sock * tsk)3104*4882a593Smuzhiyun static int tipc_sk_leave(struct tipc_sock *tsk)
3105*4882a593Smuzhiyun {
3106*4882a593Smuzhiyun 	struct net *net = sock_net(&tsk->sk);
3107*4882a593Smuzhiyun 	struct tipc_group *grp = tsk->group;
3108*4882a593Smuzhiyun 	struct tipc_name_seq seq;
3109*4882a593Smuzhiyun 	int scope;
3110*4882a593Smuzhiyun 
3111*4882a593Smuzhiyun 	if (!grp)
3112*4882a593Smuzhiyun 		return -EINVAL;
3113*4882a593Smuzhiyun 	tipc_group_self(grp, &seq, &scope);
3114*4882a593Smuzhiyun 	tipc_group_delete(net, grp);
3115*4882a593Smuzhiyun 	tsk->group = NULL;
3116*4882a593Smuzhiyun 	tipc_sk_withdraw(tsk, scope, &seq);
3117*4882a593Smuzhiyun 	return 0;
3118*4882a593Smuzhiyun }
3119*4882a593Smuzhiyun 
3120*4882a593Smuzhiyun /**
3121*4882a593Smuzhiyun  * tipc_setsockopt - set socket option
3122*4882a593Smuzhiyun  * @sock: socket structure
3123*4882a593Smuzhiyun  * @lvl: option level
3124*4882a593Smuzhiyun  * @opt: option identifier
3125*4882a593Smuzhiyun  * @ov: pointer to new option value
3126*4882a593Smuzhiyun  * @ol: length of option value
3127*4882a593Smuzhiyun  *
3128*4882a593Smuzhiyun  * For stream sockets only, accepts and ignores all IPPROTO_TCP options
3129*4882a593Smuzhiyun  * (to ease compatibility).
3130*4882a593Smuzhiyun  *
3131*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
3132*4882a593Smuzhiyun  */
tipc_setsockopt(struct socket * sock,int lvl,int opt,sockptr_t ov,unsigned int ol)3133*4882a593Smuzhiyun static int tipc_setsockopt(struct socket *sock, int lvl, int opt,
3134*4882a593Smuzhiyun 			   sockptr_t ov, unsigned int ol)
3135*4882a593Smuzhiyun {
3136*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
3137*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
3138*4882a593Smuzhiyun 	struct tipc_group_req mreq;
3139*4882a593Smuzhiyun 	u32 value = 0;
3140*4882a593Smuzhiyun 	int res = 0;
3141*4882a593Smuzhiyun 
3142*4882a593Smuzhiyun 	if ((lvl == IPPROTO_TCP) && (sock->type == SOCK_STREAM))
3143*4882a593Smuzhiyun 		return 0;
3144*4882a593Smuzhiyun 	if (lvl != SOL_TIPC)
3145*4882a593Smuzhiyun 		return -ENOPROTOOPT;
3146*4882a593Smuzhiyun 
3147*4882a593Smuzhiyun 	switch (opt) {
3148*4882a593Smuzhiyun 	case TIPC_IMPORTANCE:
3149*4882a593Smuzhiyun 	case TIPC_SRC_DROPPABLE:
3150*4882a593Smuzhiyun 	case TIPC_DEST_DROPPABLE:
3151*4882a593Smuzhiyun 	case TIPC_CONN_TIMEOUT:
3152*4882a593Smuzhiyun 	case TIPC_NODELAY:
3153*4882a593Smuzhiyun 		if (ol < sizeof(value))
3154*4882a593Smuzhiyun 			return -EINVAL;
3155*4882a593Smuzhiyun 		if (copy_from_sockptr(&value, ov, sizeof(u32)))
3156*4882a593Smuzhiyun 			return -EFAULT;
3157*4882a593Smuzhiyun 		break;
3158*4882a593Smuzhiyun 	case TIPC_GROUP_JOIN:
3159*4882a593Smuzhiyun 		if (ol < sizeof(mreq))
3160*4882a593Smuzhiyun 			return -EINVAL;
3161*4882a593Smuzhiyun 		if (copy_from_sockptr(&mreq, ov, sizeof(mreq)))
3162*4882a593Smuzhiyun 			return -EFAULT;
3163*4882a593Smuzhiyun 		break;
3164*4882a593Smuzhiyun 	default:
3165*4882a593Smuzhiyun 		if (!sockptr_is_null(ov) || ol)
3166*4882a593Smuzhiyun 			return -EINVAL;
3167*4882a593Smuzhiyun 	}
3168*4882a593Smuzhiyun 
3169*4882a593Smuzhiyun 	lock_sock(sk);
3170*4882a593Smuzhiyun 
3171*4882a593Smuzhiyun 	switch (opt) {
3172*4882a593Smuzhiyun 	case TIPC_IMPORTANCE:
3173*4882a593Smuzhiyun 		res = tsk_set_importance(sk, value);
3174*4882a593Smuzhiyun 		break;
3175*4882a593Smuzhiyun 	case TIPC_SRC_DROPPABLE:
3176*4882a593Smuzhiyun 		if (sock->type != SOCK_STREAM)
3177*4882a593Smuzhiyun 			tsk_set_unreliable(tsk, value);
3178*4882a593Smuzhiyun 		else
3179*4882a593Smuzhiyun 			res = -ENOPROTOOPT;
3180*4882a593Smuzhiyun 		break;
3181*4882a593Smuzhiyun 	case TIPC_DEST_DROPPABLE:
3182*4882a593Smuzhiyun 		tsk_set_unreturnable(tsk, value);
3183*4882a593Smuzhiyun 		break;
3184*4882a593Smuzhiyun 	case TIPC_CONN_TIMEOUT:
3185*4882a593Smuzhiyun 		tipc_sk(sk)->conn_timeout = value;
3186*4882a593Smuzhiyun 		break;
3187*4882a593Smuzhiyun 	case TIPC_MCAST_BROADCAST:
3188*4882a593Smuzhiyun 		tsk->mc_method.rcast = false;
3189*4882a593Smuzhiyun 		tsk->mc_method.mandatory = true;
3190*4882a593Smuzhiyun 		break;
3191*4882a593Smuzhiyun 	case TIPC_MCAST_REPLICAST:
3192*4882a593Smuzhiyun 		tsk->mc_method.rcast = true;
3193*4882a593Smuzhiyun 		tsk->mc_method.mandatory = true;
3194*4882a593Smuzhiyun 		break;
3195*4882a593Smuzhiyun 	case TIPC_GROUP_JOIN:
3196*4882a593Smuzhiyun 		res = tipc_sk_join(tsk, &mreq);
3197*4882a593Smuzhiyun 		break;
3198*4882a593Smuzhiyun 	case TIPC_GROUP_LEAVE:
3199*4882a593Smuzhiyun 		res = tipc_sk_leave(tsk);
3200*4882a593Smuzhiyun 		break;
3201*4882a593Smuzhiyun 	case TIPC_NODELAY:
3202*4882a593Smuzhiyun 		tsk->nodelay = !!value;
3203*4882a593Smuzhiyun 		tsk_set_nagle(tsk);
3204*4882a593Smuzhiyun 		break;
3205*4882a593Smuzhiyun 	default:
3206*4882a593Smuzhiyun 		res = -EINVAL;
3207*4882a593Smuzhiyun 	}
3208*4882a593Smuzhiyun 
3209*4882a593Smuzhiyun 	release_sock(sk);
3210*4882a593Smuzhiyun 
3211*4882a593Smuzhiyun 	return res;
3212*4882a593Smuzhiyun }
3213*4882a593Smuzhiyun 
3214*4882a593Smuzhiyun /**
3215*4882a593Smuzhiyun  * tipc_getsockopt - get socket option
3216*4882a593Smuzhiyun  * @sock: socket structure
3217*4882a593Smuzhiyun  * @lvl: option level
3218*4882a593Smuzhiyun  * @opt: option identifier
3219*4882a593Smuzhiyun  * @ov: receptacle for option value
3220*4882a593Smuzhiyun  * @ol: receptacle for length of option value
3221*4882a593Smuzhiyun  *
3222*4882a593Smuzhiyun  * For stream sockets only, returns 0 length result for all IPPROTO_TCP options
3223*4882a593Smuzhiyun  * (to ease compatibility).
3224*4882a593Smuzhiyun  *
3225*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
3226*4882a593Smuzhiyun  */
tipc_getsockopt(struct socket * sock,int lvl,int opt,char __user * ov,int __user * ol)3227*4882a593Smuzhiyun static int tipc_getsockopt(struct socket *sock, int lvl, int opt,
3228*4882a593Smuzhiyun 			   char __user *ov, int __user *ol)
3229*4882a593Smuzhiyun {
3230*4882a593Smuzhiyun 	struct sock *sk = sock->sk;
3231*4882a593Smuzhiyun 	struct tipc_sock *tsk = tipc_sk(sk);
3232*4882a593Smuzhiyun 	struct tipc_name_seq seq;
3233*4882a593Smuzhiyun 	int len, scope;
3234*4882a593Smuzhiyun 	u32 value;
3235*4882a593Smuzhiyun 	int res;
3236*4882a593Smuzhiyun 
3237*4882a593Smuzhiyun 	if ((lvl == IPPROTO_TCP) && (sock->type == SOCK_STREAM))
3238*4882a593Smuzhiyun 		return put_user(0, ol);
3239*4882a593Smuzhiyun 	if (lvl != SOL_TIPC)
3240*4882a593Smuzhiyun 		return -ENOPROTOOPT;
3241*4882a593Smuzhiyun 	res = get_user(len, ol);
3242*4882a593Smuzhiyun 	if (res)
3243*4882a593Smuzhiyun 		return res;
3244*4882a593Smuzhiyun 
3245*4882a593Smuzhiyun 	lock_sock(sk);
3246*4882a593Smuzhiyun 
3247*4882a593Smuzhiyun 	switch (opt) {
3248*4882a593Smuzhiyun 	case TIPC_IMPORTANCE:
3249*4882a593Smuzhiyun 		value = tsk_importance(tsk);
3250*4882a593Smuzhiyun 		break;
3251*4882a593Smuzhiyun 	case TIPC_SRC_DROPPABLE:
3252*4882a593Smuzhiyun 		value = tsk_unreliable(tsk);
3253*4882a593Smuzhiyun 		break;
3254*4882a593Smuzhiyun 	case TIPC_DEST_DROPPABLE:
3255*4882a593Smuzhiyun 		value = tsk_unreturnable(tsk);
3256*4882a593Smuzhiyun 		break;
3257*4882a593Smuzhiyun 	case TIPC_CONN_TIMEOUT:
3258*4882a593Smuzhiyun 		value = tsk->conn_timeout;
3259*4882a593Smuzhiyun 		/* no need to set "res", since already 0 at this point */
3260*4882a593Smuzhiyun 		break;
3261*4882a593Smuzhiyun 	case TIPC_NODE_RECVQ_DEPTH:
3262*4882a593Smuzhiyun 		value = 0; /* was tipc_queue_size, now obsolete */
3263*4882a593Smuzhiyun 		break;
3264*4882a593Smuzhiyun 	case TIPC_SOCK_RECVQ_DEPTH:
3265*4882a593Smuzhiyun 		value = skb_queue_len(&sk->sk_receive_queue);
3266*4882a593Smuzhiyun 		break;
3267*4882a593Smuzhiyun 	case TIPC_SOCK_RECVQ_USED:
3268*4882a593Smuzhiyun 		value = sk_rmem_alloc_get(sk);
3269*4882a593Smuzhiyun 		break;
3270*4882a593Smuzhiyun 	case TIPC_GROUP_JOIN:
3271*4882a593Smuzhiyun 		seq.type = 0;
3272*4882a593Smuzhiyun 		if (tsk->group)
3273*4882a593Smuzhiyun 			tipc_group_self(tsk->group, &seq, &scope);
3274*4882a593Smuzhiyun 		value = seq.type;
3275*4882a593Smuzhiyun 		break;
3276*4882a593Smuzhiyun 	default:
3277*4882a593Smuzhiyun 		res = -EINVAL;
3278*4882a593Smuzhiyun 	}
3279*4882a593Smuzhiyun 
3280*4882a593Smuzhiyun 	release_sock(sk);
3281*4882a593Smuzhiyun 
3282*4882a593Smuzhiyun 	if (res)
3283*4882a593Smuzhiyun 		return res;	/* "get" failed */
3284*4882a593Smuzhiyun 
3285*4882a593Smuzhiyun 	if (len < sizeof(value))
3286*4882a593Smuzhiyun 		return -EINVAL;
3287*4882a593Smuzhiyun 
3288*4882a593Smuzhiyun 	if (copy_to_user(ov, &value, sizeof(value)))
3289*4882a593Smuzhiyun 		return -EFAULT;
3290*4882a593Smuzhiyun 
3291*4882a593Smuzhiyun 	return put_user(sizeof(value), ol);
3292*4882a593Smuzhiyun }
3293*4882a593Smuzhiyun 
tipc_ioctl(struct socket * sock,unsigned int cmd,unsigned long arg)3294*4882a593Smuzhiyun static int tipc_ioctl(struct socket *sock, unsigned int cmd, unsigned long arg)
3295*4882a593Smuzhiyun {
3296*4882a593Smuzhiyun 	struct net *net = sock_net(sock->sk);
3297*4882a593Smuzhiyun 	struct tipc_sioc_nodeid_req nr = {0};
3298*4882a593Smuzhiyun 	struct tipc_sioc_ln_req lnr;
3299*4882a593Smuzhiyun 	void __user *argp = (void __user *)arg;
3300*4882a593Smuzhiyun 
3301*4882a593Smuzhiyun 	switch (cmd) {
3302*4882a593Smuzhiyun 	case SIOCGETLINKNAME:
3303*4882a593Smuzhiyun 		if (copy_from_user(&lnr, argp, sizeof(lnr)))
3304*4882a593Smuzhiyun 			return -EFAULT;
3305*4882a593Smuzhiyun 		if (!tipc_node_get_linkname(net,
3306*4882a593Smuzhiyun 					    lnr.bearer_id & 0xffff, lnr.peer,
3307*4882a593Smuzhiyun 					    lnr.linkname, TIPC_MAX_LINK_NAME)) {
3308*4882a593Smuzhiyun 			if (copy_to_user(argp, &lnr, sizeof(lnr)))
3309*4882a593Smuzhiyun 				return -EFAULT;
3310*4882a593Smuzhiyun 			return 0;
3311*4882a593Smuzhiyun 		}
3312*4882a593Smuzhiyun 		return -EADDRNOTAVAIL;
3313*4882a593Smuzhiyun 	case SIOCGETNODEID:
3314*4882a593Smuzhiyun 		if (copy_from_user(&nr, argp, sizeof(nr)))
3315*4882a593Smuzhiyun 			return -EFAULT;
3316*4882a593Smuzhiyun 		if (!tipc_node_get_id(net, nr.peer, nr.node_id))
3317*4882a593Smuzhiyun 			return -EADDRNOTAVAIL;
3318*4882a593Smuzhiyun 		if (copy_to_user(argp, &nr, sizeof(nr)))
3319*4882a593Smuzhiyun 			return -EFAULT;
3320*4882a593Smuzhiyun 		return 0;
3321*4882a593Smuzhiyun 	default:
3322*4882a593Smuzhiyun 		return -ENOIOCTLCMD;
3323*4882a593Smuzhiyun 	}
3324*4882a593Smuzhiyun }
3325*4882a593Smuzhiyun 
tipc_socketpair(struct socket * sock1,struct socket * sock2)3326*4882a593Smuzhiyun static int tipc_socketpair(struct socket *sock1, struct socket *sock2)
3327*4882a593Smuzhiyun {
3328*4882a593Smuzhiyun 	struct tipc_sock *tsk2 = tipc_sk(sock2->sk);
3329*4882a593Smuzhiyun 	struct tipc_sock *tsk1 = tipc_sk(sock1->sk);
3330*4882a593Smuzhiyun 	u32 onode = tipc_own_addr(sock_net(sock1->sk));
3331*4882a593Smuzhiyun 
3332*4882a593Smuzhiyun 	tsk1->peer.family = AF_TIPC;
3333*4882a593Smuzhiyun 	tsk1->peer.addrtype = TIPC_ADDR_ID;
3334*4882a593Smuzhiyun 	tsk1->peer.scope = TIPC_NODE_SCOPE;
3335*4882a593Smuzhiyun 	tsk1->peer.addr.id.ref = tsk2->portid;
3336*4882a593Smuzhiyun 	tsk1->peer.addr.id.node = onode;
3337*4882a593Smuzhiyun 	tsk2->peer.family = AF_TIPC;
3338*4882a593Smuzhiyun 	tsk2->peer.addrtype = TIPC_ADDR_ID;
3339*4882a593Smuzhiyun 	tsk2->peer.scope = TIPC_NODE_SCOPE;
3340*4882a593Smuzhiyun 	tsk2->peer.addr.id.ref = tsk1->portid;
3341*4882a593Smuzhiyun 	tsk2->peer.addr.id.node = onode;
3342*4882a593Smuzhiyun 
3343*4882a593Smuzhiyun 	tipc_sk_finish_conn(tsk1, tsk2->portid, onode);
3344*4882a593Smuzhiyun 	tipc_sk_finish_conn(tsk2, tsk1->portid, onode);
3345*4882a593Smuzhiyun 	return 0;
3346*4882a593Smuzhiyun }
3347*4882a593Smuzhiyun 
3348*4882a593Smuzhiyun /* Protocol switches for the various types of TIPC sockets */
3349*4882a593Smuzhiyun 
3350*4882a593Smuzhiyun static const struct proto_ops msg_ops = {
3351*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
3352*4882a593Smuzhiyun 	.family		= AF_TIPC,
3353*4882a593Smuzhiyun 	.release	= tipc_release,
3354*4882a593Smuzhiyun 	.bind		= tipc_bind,
3355*4882a593Smuzhiyun 	.connect	= tipc_connect,
3356*4882a593Smuzhiyun 	.socketpair	= tipc_socketpair,
3357*4882a593Smuzhiyun 	.accept		= sock_no_accept,
3358*4882a593Smuzhiyun 	.getname	= tipc_getname,
3359*4882a593Smuzhiyun 	.poll		= tipc_poll,
3360*4882a593Smuzhiyun 	.ioctl		= tipc_ioctl,
3361*4882a593Smuzhiyun 	.listen		= sock_no_listen,
3362*4882a593Smuzhiyun 	.shutdown	= tipc_shutdown,
3363*4882a593Smuzhiyun 	.setsockopt	= tipc_setsockopt,
3364*4882a593Smuzhiyun 	.getsockopt	= tipc_getsockopt,
3365*4882a593Smuzhiyun 	.sendmsg	= tipc_sendmsg,
3366*4882a593Smuzhiyun 	.recvmsg	= tipc_recvmsg,
3367*4882a593Smuzhiyun 	.mmap		= sock_no_mmap,
3368*4882a593Smuzhiyun 	.sendpage	= sock_no_sendpage
3369*4882a593Smuzhiyun };
3370*4882a593Smuzhiyun 
3371*4882a593Smuzhiyun static const struct proto_ops packet_ops = {
3372*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
3373*4882a593Smuzhiyun 	.family		= AF_TIPC,
3374*4882a593Smuzhiyun 	.release	= tipc_release,
3375*4882a593Smuzhiyun 	.bind		= tipc_bind,
3376*4882a593Smuzhiyun 	.connect	= tipc_connect,
3377*4882a593Smuzhiyun 	.socketpair	= tipc_socketpair,
3378*4882a593Smuzhiyun 	.accept		= tipc_accept,
3379*4882a593Smuzhiyun 	.getname	= tipc_getname,
3380*4882a593Smuzhiyun 	.poll		= tipc_poll,
3381*4882a593Smuzhiyun 	.ioctl		= tipc_ioctl,
3382*4882a593Smuzhiyun 	.listen		= tipc_listen,
3383*4882a593Smuzhiyun 	.shutdown	= tipc_shutdown,
3384*4882a593Smuzhiyun 	.setsockopt	= tipc_setsockopt,
3385*4882a593Smuzhiyun 	.getsockopt	= tipc_getsockopt,
3386*4882a593Smuzhiyun 	.sendmsg	= tipc_send_packet,
3387*4882a593Smuzhiyun 	.recvmsg	= tipc_recvmsg,
3388*4882a593Smuzhiyun 	.mmap		= sock_no_mmap,
3389*4882a593Smuzhiyun 	.sendpage	= sock_no_sendpage
3390*4882a593Smuzhiyun };
3391*4882a593Smuzhiyun 
3392*4882a593Smuzhiyun static const struct proto_ops stream_ops = {
3393*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
3394*4882a593Smuzhiyun 	.family		= AF_TIPC,
3395*4882a593Smuzhiyun 	.release	= tipc_release,
3396*4882a593Smuzhiyun 	.bind		= tipc_bind,
3397*4882a593Smuzhiyun 	.connect	= tipc_connect,
3398*4882a593Smuzhiyun 	.socketpair	= tipc_socketpair,
3399*4882a593Smuzhiyun 	.accept		= tipc_accept,
3400*4882a593Smuzhiyun 	.getname	= tipc_getname,
3401*4882a593Smuzhiyun 	.poll		= tipc_poll,
3402*4882a593Smuzhiyun 	.ioctl		= tipc_ioctl,
3403*4882a593Smuzhiyun 	.listen		= tipc_listen,
3404*4882a593Smuzhiyun 	.shutdown	= tipc_shutdown,
3405*4882a593Smuzhiyun 	.setsockopt	= tipc_setsockopt,
3406*4882a593Smuzhiyun 	.getsockopt	= tipc_getsockopt,
3407*4882a593Smuzhiyun 	.sendmsg	= tipc_sendstream,
3408*4882a593Smuzhiyun 	.recvmsg	= tipc_recvstream,
3409*4882a593Smuzhiyun 	.mmap		= sock_no_mmap,
3410*4882a593Smuzhiyun 	.sendpage	= sock_no_sendpage
3411*4882a593Smuzhiyun };
3412*4882a593Smuzhiyun 
3413*4882a593Smuzhiyun static const struct net_proto_family tipc_family_ops = {
3414*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
3415*4882a593Smuzhiyun 	.family		= AF_TIPC,
3416*4882a593Smuzhiyun 	.create		= tipc_sk_create
3417*4882a593Smuzhiyun };
3418*4882a593Smuzhiyun 
3419*4882a593Smuzhiyun static struct proto tipc_proto = {
3420*4882a593Smuzhiyun 	.name		= "TIPC",
3421*4882a593Smuzhiyun 	.owner		= THIS_MODULE,
3422*4882a593Smuzhiyun 	.obj_size	= sizeof(struct tipc_sock),
3423*4882a593Smuzhiyun 	.sysctl_rmem	= sysctl_tipc_rmem
3424*4882a593Smuzhiyun };
3425*4882a593Smuzhiyun 
3426*4882a593Smuzhiyun /**
3427*4882a593Smuzhiyun  * tipc_socket_init - initialize TIPC socket interface
3428*4882a593Smuzhiyun  *
3429*4882a593Smuzhiyun  * Returns 0 on success, errno otherwise
3430*4882a593Smuzhiyun  */
tipc_socket_init(void)3431*4882a593Smuzhiyun int tipc_socket_init(void)
3432*4882a593Smuzhiyun {
3433*4882a593Smuzhiyun 	int res;
3434*4882a593Smuzhiyun 
3435*4882a593Smuzhiyun 	res = proto_register(&tipc_proto, 1);
3436*4882a593Smuzhiyun 	if (res) {
3437*4882a593Smuzhiyun 		pr_err("Failed to register TIPC protocol type\n");
3438*4882a593Smuzhiyun 		goto out;
3439*4882a593Smuzhiyun 	}
3440*4882a593Smuzhiyun 
3441*4882a593Smuzhiyun 	res = sock_register(&tipc_family_ops);
3442*4882a593Smuzhiyun 	if (res) {
3443*4882a593Smuzhiyun 		pr_err("Failed to register TIPC socket type\n");
3444*4882a593Smuzhiyun 		proto_unregister(&tipc_proto);
3445*4882a593Smuzhiyun 		goto out;
3446*4882a593Smuzhiyun 	}
3447*4882a593Smuzhiyun  out:
3448*4882a593Smuzhiyun 	return res;
3449*4882a593Smuzhiyun }
3450*4882a593Smuzhiyun 
3451*4882a593Smuzhiyun /**
3452*4882a593Smuzhiyun  * tipc_socket_stop - stop TIPC socket interface
3453*4882a593Smuzhiyun  */
tipc_socket_stop(void)3454*4882a593Smuzhiyun void tipc_socket_stop(void)
3455*4882a593Smuzhiyun {
3456*4882a593Smuzhiyun 	sock_unregister(tipc_family_ops.family);
3457*4882a593Smuzhiyun 	proto_unregister(&tipc_proto);
3458*4882a593Smuzhiyun }
3459*4882a593Smuzhiyun 
3460*4882a593Smuzhiyun /* Caller should hold socket lock for the passed tipc socket. */
__tipc_nl_add_sk_con(struct sk_buff * skb,struct tipc_sock * tsk)3461*4882a593Smuzhiyun static int __tipc_nl_add_sk_con(struct sk_buff *skb, struct tipc_sock *tsk)
3462*4882a593Smuzhiyun {
3463*4882a593Smuzhiyun 	u32 peer_node;
3464*4882a593Smuzhiyun 	u32 peer_port;
3465*4882a593Smuzhiyun 	struct nlattr *nest;
3466*4882a593Smuzhiyun 
3467*4882a593Smuzhiyun 	peer_node = tsk_peer_node(tsk);
3468*4882a593Smuzhiyun 	peer_port = tsk_peer_port(tsk);
3469*4882a593Smuzhiyun 
3470*4882a593Smuzhiyun 	nest = nla_nest_start_noflag(skb, TIPC_NLA_SOCK_CON);
3471*4882a593Smuzhiyun 	if (!nest)
3472*4882a593Smuzhiyun 		return -EMSGSIZE;
3473*4882a593Smuzhiyun 
3474*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_CON_NODE, peer_node))
3475*4882a593Smuzhiyun 		goto msg_full;
3476*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_CON_SOCK, peer_port))
3477*4882a593Smuzhiyun 		goto msg_full;
3478*4882a593Smuzhiyun 
3479*4882a593Smuzhiyun 	if (tsk->conn_type != 0) {
3480*4882a593Smuzhiyun 		if (nla_put_flag(skb, TIPC_NLA_CON_FLAG))
3481*4882a593Smuzhiyun 			goto msg_full;
3482*4882a593Smuzhiyun 		if (nla_put_u32(skb, TIPC_NLA_CON_TYPE, tsk->conn_type))
3483*4882a593Smuzhiyun 			goto msg_full;
3484*4882a593Smuzhiyun 		if (nla_put_u32(skb, TIPC_NLA_CON_INST, tsk->conn_instance))
3485*4882a593Smuzhiyun 			goto msg_full;
3486*4882a593Smuzhiyun 	}
3487*4882a593Smuzhiyun 	nla_nest_end(skb, nest);
3488*4882a593Smuzhiyun 
3489*4882a593Smuzhiyun 	return 0;
3490*4882a593Smuzhiyun 
3491*4882a593Smuzhiyun msg_full:
3492*4882a593Smuzhiyun 	nla_nest_cancel(skb, nest);
3493*4882a593Smuzhiyun 
3494*4882a593Smuzhiyun 	return -EMSGSIZE;
3495*4882a593Smuzhiyun }
3496*4882a593Smuzhiyun 
__tipc_nl_add_sk_info(struct sk_buff * skb,struct tipc_sock * tsk)3497*4882a593Smuzhiyun static int __tipc_nl_add_sk_info(struct sk_buff *skb, struct tipc_sock
3498*4882a593Smuzhiyun 			  *tsk)
3499*4882a593Smuzhiyun {
3500*4882a593Smuzhiyun 	struct net *net = sock_net(skb->sk);
3501*4882a593Smuzhiyun 	struct sock *sk = &tsk->sk;
3502*4882a593Smuzhiyun 
3503*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_SOCK_REF, tsk->portid) ||
3504*4882a593Smuzhiyun 	    nla_put_u32(skb, TIPC_NLA_SOCK_ADDR, tipc_own_addr(net)))
3505*4882a593Smuzhiyun 		return -EMSGSIZE;
3506*4882a593Smuzhiyun 
3507*4882a593Smuzhiyun 	if (tipc_sk_connected(sk)) {
3508*4882a593Smuzhiyun 		if (__tipc_nl_add_sk_con(skb, tsk))
3509*4882a593Smuzhiyun 			return -EMSGSIZE;
3510*4882a593Smuzhiyun 	} else if (!list_empty(&tsk->publications)) {
3511*4882a593Smuzhiyun 		if (nla_put_flag(skb, TIPC_NLA_SOCK_HAS_PUBL))
3512*4882a593Smuzhiyun 			return -EMSGSIZE;
3513*4882a593Smuzhiyun 	}
3514*4882a593Smuzhiyun 	return 0;
3515*4882a593Smuzhiyun }
3516*4882a593Smuzhiyun 
3517*4882a593Smuzhiyun /* Caller should hold socket lock for the passed tipc socket. */
__tipc_nl_add_sk(struct sk_buff * skb,struct netlink_callback * cb,struct tipc_sock * tsk)3518*4882a593Smuzhiyun static int __tipc_nl_add_sk(struct sk_buff *skb, struct netlink_callback *cb,
3519*4882a593Smuzhiyun 			    struct tipc_sock *tsk)
3520*4882a593Smuzhiyun {
3521*4882a593Smuzhiyun 	struct nlattr *attrs;
3522*4882a593Smuzhiyun 	void *hdr;
3523*4882a593Smuzhiyun 
3524*4882a593Smuzhiyun 	hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
3525*4882a593Smuzhiyun 			  &tipc_genl_family, NLM_F_MULTI, TIPC_NL_SOCK_GET);
3526*4882a593Smuzhiyun 	if (!hdr)
3527*4882a593Smuzhiyun 		goto msg_cancel;
3528*4882a593Smuzhiyun 
3529*4882a593Smuzhiyun 	attrs = nla_nest_start_noflag(skb, TIPC_NLA_SOCK);
3530*4882a593Smuzhiyun 	if (!attrs)
3531*4882a593Smuzhiyun 		goto genlmsg_cancel;
3532*4882a593Smuzhiyun 
3533*4882a593Smuzhiyun 	if (__tipc_nl_add_sk_info(skb, tsk))
3534*4882a593Smuzhiyun 		goto attr_msg_cancel;
3535*4882a593Smuzhiyun 
3536*4882a593Smuzhiyun 	nla_nest_end(skb, attrs);
3537*4882a593Smuzhiyun 	genlmsg_end(skb, hdr);
3538*4882a593Smuzhiyun 
3539*4882a593Smuzhiyun 	return 0;
3540*4882a593Smuzhiyun 
3541*4882a593Smuzhiyun attr_msg_cancel:
3542*4882a593Smuzhiyun 	nla_nest_cancel(skb, attrs);
3543*4882a593Smuzhiyun genlmsg_cancel:
3544*4882a593Smuzhiyun 	genlmsg_cancel(skb, hdr);
3545*4882a593Smuzhiyun msg_cancel:
3546*4882a593Smuzhiyun 	return -EMSGSIZE;
3547*4882a593Smuzhiyun }
3548*4882a593Smuzhiyun 
tipc_nl_sk_walk(struct sk_buff * skb,struct netlink_callback * cb,int (* skb_handler)(struct sk_buff * skb,struct netlink_callback * cb,struct tipc_sock * tsk))3549*4882a593Smuzhiyun int tipc_nl_sk_walk(struct sk_buff *skb, struct netlink_callback *cb,
3550*4882a593Smuzhiyun 		    int (*skb_handler)(struct sk_buff *skb,
3551*4882a593Smuzhiyun 				       struct netlink_callback *cb,
3552*4882a593Smuzhiyun 				       struct tipc_sock *tsk))
3553*4882a593Smuzhiyun {
3554*4882a593Smuzhiyun 	struct rhashtable_iter *iter = (void *)cb->args[4];
3555*4882a593Smuzhiyun 	struct tipc_sock *tsk;
3556*4882a593Smuzhiyun 	int err;
3557*4882a593Smuzhiyun 
3558*4882a593Smuzhiyun 	rhashtable_walk_start(iter);
3559*4882a593Smuzhiyun 	while ((tsk = rhashtable_walk_next(iter)) != NULL) {
3560*4882a593Smuzhiyun 		if (IS_ERR(tsk)) {
3561*4882a593Smuzhiyun 			err = PTR_ERR(tsk);
3562*4882a593Smuzhiyun 			if (err == -EAGAIN) {
3563*4882a593Smuzhiyun 				err = 0;
3564*4882a593Smuzhiyun 				continue;
3565*4882a593Smuzhiyun 			}
3566*4882a593Smuzhiyun 			break;
3567*4882a593Smuzhiyun 		}
3568*4882a593Smuzhiyun 
3569*4882a593Smuzhiyun 		sock_hold(&tsk->sk);
3570*4882a593Smuzhiyun 		rhashtable_walk_stop(iter);
3571*4882a593Smuzhiyun 		lock_sock(&tsk->sk);
3572*4882a593Smuzhiyun 		err = skb_handler(skb, cb, tsk);
3573*4882a593Smuzhiyun 		if (err) {
3574*4882a593Smuzhiyun 			release_sock(&tsk->sk);
3575*4882a593Smuzhiyun 			sock_put(&tsk->sk);
3576*4882a593Smuzhiyun 			goto out;
3577*4882a593Smuzhiyun 		}
3578*4882a593Smuzhiyun 		release_sock(&tsk->sk);
3579*4882a593Smuzhiyun 		rhashtable_walk_start(iter);
3580*4882a593Smuzhiyun 		sock_put(&tsk->sk);
3581*4882a593Smuzhiyun 	}
3582*4882a593Smuzhiyun 	rhashtable_walk_stop(iter);
3583*4882a593Smuzhiyun out:
3584*4882a593Smuzhiyun 	return skb->len;
3585*4882a593Smuzhiyun }
3586*4882a593Smuzhiyun EXPORT_SYMBOL(tipc_nl_sk_walk);
3587*4882a593Smuzhiyun 
tipc_dump_start(struct netlink_callback * cb)3588*4882a593Smuzhiyun int tipc_dump_start(struct netlink_callback *cb)
3589*4882a593Smuzhiyun {
3590*4882a593Smuzhiyun 	return __tipc_dump_start(cb, sock_net(cb->skb->sk));
3591*4882a593Smuzhiyun }
3592*4882a593Smuzhiyun EXPORT_SYMBOL(tipc_dump_start);
3593*4882a593Smuzhiyun 
__tipc_dump_start(struct netlink_callback * cb,struct net * net)3594*4882a593Smuzhiyun int __tipc_dump_start(struct netlink_callback *cb, struct net *net)
3595*4882a593Smuzhiyun {
3596*4882a593Smuzhiyun 	/* tipc_nl_name_table_dump() uses cb->args[0...3]. */
3597*4882a593Smuzhiyun 	struct rhashtable_iter *iter = (void *)cb->args[4];
3598*4882a593Smuzhiyun 	struct tipc_net *tn = tipc_net(net);
3599*4882a593Smuzhiyun 
3600*4882a593Smuzhiyun 	if (!iter) {
3601*4882a593Smuzhiyun 		iter = kmalloc(sizeof(*iter), GFP_KERNEL);
3602*4882a593Smuzhiyun 		if (!iter)
3603*4882a593Smuzhiyun 			return -ENOMEM;
3604*4882a593Smuzhiyun 
3605*4882a593Smuzhiyun 		cb->args[4] = (long)iter;
3606*4882a593Smuzhiyun 	}
3607*4882a593Smuzhiyun 
3608*4882a593Smuzhiyun 	rhashtable_walk_enter(&tn->sk_rht, iter);
3609*4882a593Smuzhiyun 	return 0;
3610*4882a593Smuzhiyun }
3611*4882a593Smuzhiyun 
tipc_dump_done(struct netlink_callback * cb)3612*4882a593Smuzhiyun int tipc_dump_done(struct netlink_callback *cb)
3613*4882a593Smuzhiyun {
3614*4882a593Smuzhiyun 	struct rhashtable_iter *hti = (void *)cb->args[4];
3615*4882a593Smuzhiyun 
3616*4882a593Smuzhiyun 	rhashtable_walk_exit(hti);
3617*4882a593Smuzhiyun 	kfree(hti);
3618*4882a593Smuzhiyun 	return 0;
3619*4882a593Smuzhiyun }
3620*4882a593Smuzhiyun EXPORT_SYMBOL(tipc_dump_done);
3621*4882a593Smuzhiyun 
/* Add a TIPC_NLA_SOCK nest with diagnostic data for the socket to the
 * message: basic socket info, type, state, inode, uid, cookie, a nested
 * TIPC_NLA_SOCK_STAT block with queue lengths, drop count and congestion
 * flags, and group data when the socket has a group.
 *
 * @sk_filter_state is a bit mask indexed by sk_state; a socket whose state
 * bit is not set is skipped and 0 is returned without adding anything.
 * @tipc_diag_gen_cookie supplies the value for TIPC_NLA_SOCK_COOKIE.
 *
 * Returns 0 on success or skip, -EMSGSIZE when the data does not fit; the
 * nests opened here are cancelled on failure.
 */
int tipc_sk_fill_sock_diag(struct sk_buff *skb, struct netlink_callback *cb,
			   struct tipc_sock *tsk, u32 sk_filter_state,
			   u64 (*tipc_diag_gen_cookie)(struct sock *sk))
{
	struct sock *sk = &tsk->sk;
	struct nlattr *attrs;
	struct nlattr *stat;

	/* Filter the response on sk_state */
	if (!(sk_filter_state & (1 << sk->sk_state)))
		return 0;

	attrs = nla_nest_start_noflag(skb, TIPC_NLA_SOCK);
	if (!attrs)
		return -EMSGSIZE;

	if (__tipc_nl_add_sk_info(skb, tsk))
		goto attr_msg_cancel;

	if (nla_put_u32(skb, TIPC_NLA_SOCK_TYPE, (u32)sk->sk_type))
		goto attr_msg_cancel;
	if (nla_put_u32(skb, TIPC_NLA_SOCK_TIPC_STATE, (u32)sk->sk_state))
		goto attr_msg_cancel;
	if (nla_put_u32(skb, TIPC_NLA_SOCK_INO, sock_i_ino(sk)))
		goto attr_msg_cancel;
	/* The uid is expressed in the requesting socket's user namespace */
	if (nla_put_u32(skb, TIPC_NLA_SOCK_UID,
			from_kuid_munged(sk_user_ns(NETLINK_CB(cb->skb).sk),
					 sock_i_uid(sk))))
		goto attr_msg_cancel;
	if (nla_put_u64_64bit(skb, TIPC_NLA_SOCK_COOKIE,
			      tipc_diag_gen_cookie(sk),
			      TIPC_NLA_SOCK_PAD))
		goto attr_msg_cancel;

	stat = nla_nest_start_noflag(skb, TIPC_NLA_SOCK_STAT);
	if (!stat)
		goto attr_msg_cancel;

	if (nla_put_u32(skb, TIPC_NLA_SOCK_STAT_RCVQ,
			skb_queue_len(&sk->sk_receive_queue)))
		goto stat_msg_cancel;
	if (nla_put_u32(skb, TIPC_NLA_SOCK_STAT_SENDQ,
			skb_queue_len(&sk->sk_write_queue)))
		goto stat_msg_cancel;
	if (nla_put_u32(skb, TIPC_NLA_SOCK_STAT_DROP,
			atomic_read(&sk->sk_drops)))
		goto stat_msg_cancel;

	if (tsk->cong_link_cnt &&
	    nla_put_flag(skb, TIPC_NLA_SOCK_STAT_LINK_CONG))
		goto stat_msg_cancel;

	if (tsk_conn_cong(tsk) &&
	    nla_put_flag(skb, TIPC_NLA_SOCK_STAT_CONN_CONG))
		goto stat_msg_cancel;

	nla_nest_end(skb, stat);

	if (tsk->group && tipc_group_fill_sock_diag(tsk->group, skb))
		goto stat_msg_cancel;

	nla_nest_end(skb, attrs);
	return 0;

stat_msg_cancel:
	nla_nest_cancel(skb, stat);
attr_msg_cancel:
	nla_nest_cancel(skb, attrs);
	return -EMSGSIZE;
}
EXPORT_SYMBOL(tipc_sk_fill_sock_diag);
3690*4882a593Smuzhiyun 
tipc_nl_sk_dump(struct sk_buff * skb,struct netlink_callback * cb)3691*4882a593Smuzhiyun int tipc_nl_sk_dump(struct sk_buff *skb, struct netlink_callback *cb)
3692*4882a593Smuzhiyun {
3693*4882a593Smuzhiyun 	return tipc_nl_sk_walk(skb, cb, __tipc_nl_add_sk);
3694*4882a593Smuzhiyun }
3695*4882a593Smuzhiyun 
3696*4882a593Smuzhiyun /* Caller should hold socket lock for the passed tipc socket. */
__tipc_nl_add_sk_publ(struct sk_buff * skb,struct netlink_callback * cb,struct publication * publ)3697*4882a593Smuzhiyun static int __tipc_nl_add_sk_publ(struct sk_buff *skb,
3698*4882a593Smuzhiyun 				 struct netlink_callback *cb,
3699*4882a593Smuzhiyun 				 struct publication *publ)
3700*4882a593Smuzhiyun {
3701*4882a593Smuzhiyun 	void *hdr;
3702*4882a593Smuzhiyun 	struct nlattr *attrs;
3703*4882a593Smuzhiyun 
3704*4882a593Smuzhiyun 	hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
3705*4882a593Smuzhiyun 			  &tipc_genl_family, NLM_F_MULTI, TIPC_NL_PUBL_GET);
3706*4882a593Smuzhiyun 	if (!hdr)
3707*4882a593Smuzhiyun 		goto msg_cancel;
3708*4882a593Smuzhiyun 
3709*4882a593Smuzhiyun 	attrs = nla_nest_start_noflag(skb, TIPC_NLA_PUBL);
3710*4882a593Smuzhiyun 	if (!attrs)
3711*4882a593Smuzhiyun 		goto genlmsg_cancel;
3712*4882a593Smuzhiyun 
3713*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_PUBL_KEY, publ->key))
3714*4882a593Smuzhiyun 		goto attr_msg_cancel;
3715*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_PUBL_TYPE, publ->type))
3716*4882a593Smuzhiyun 		goto attr_msg_cancel;
3717*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_PUBL_LOWER, publ->lower))
3718*4882a593Smuzhiyun 		goto attr_msg_cancel;
3719*4882a593Smuzhiyun 	if (nla_put_u32(skb, TIPC_NLA_PUBL_UPPER, publ->upper))
3720*4882a593Smuzhiyun 		goto attr_msg_cancel;
3721*4882a593Smuzhiyun 
3722*4882a593Smuzhiyun 	nla_nest_end(skb, attrs);
3723*4882a593Smuzhiyun 	genlmsg_end(skb, hdr);
3724*4882a593Smuzhiyun 
3725*4882a593Smuzhiyun 	return 0;
3726*4882a593Smuzhiyun 
3727*4882a593Smuzhiyun attr_msg_cancel:
3728*4882a593Smuzhiyun 	nla_nest_cancel(skb, attrs);
3729*4882a593Smuzhiyun genlmsg_cancel:
3730*4882a593Smuzhiyun 	genlmsg_cancel(skb, hdr);
3731*4882a593Smuzhiyun msg_cancel:
3732*4882a593Smuzhiyun 	return -EMSGSIZE;
3733*4882a593Smuzhiyun }
3734*4882a593Smuzhiyun 
3735*4882a593Smuzhiyun /* Caller should hold socket lock for the passed tipc socket. */
__tipc_nl_list_sk_publ(struct sk_buff * skb,struct netlink_callback * cb,struct tipc_sock * tsk,u32 * last_publ)3736*4882a593Smuzhiyun static int __tipc_nl_list_sk_publ(struct sk_buff *skb,
3737*4882a593Smuzhiyun 				  struct netlink_callback *cb,
3738*4882a593Smuzhiyun 				  struct tipc_sock *tsk, u32 *last_publ)
3739*4882a593Smuzhiyun {
3740*4882a593Smuzhiyun 	int err;
3741*4882a593Smuzhiyun 	struct publication *p;
3742*4882a593Smuzhiyun 
3743*4882a593Smuzhiyun 	if (*last_publ) {
3744*4882a593Smuzhiyun 		list_for_each_entry(p, &tsk->publications, binding_sock) {
3745*4882a593Smuzhiyun 			if (p->key == *last_publ)
3746*4882a593Smuzhiyun 				break;
3747*4882a593Smuzhiyun 		}
3748*4882a593Smuzhiyun 		if (list_entry_is_head(p, &tsk->publications, binding_sock)) {
3749*4882a593Smuzhiyun 			/* We never set seq or call nl_dump_check_consistent()
3750*4882a593Smuzhiyun 			 * this means that setting prev_seq here will cause the
3751*4882a593Smuzhiyun 			 * consistence check to fail in the netlink callback
3752*4882a593Smuzhiyun 			 * handler. Resulting in the last NLMSG_DONE message
3753*4882a593Smuzhiyun 			 * having the NLM_F_DUMP_INTR flag set.
3754*4882a593Smuzhiyun 			 */
3755*4882a593Smuzhiyun 			cb->prev_seq = 1;
3756*4882a593Smuzhiyun 			*last_publ = 0;
3757*4882a593Smuzhiyun 			return -EPIPE;
3758*4882a593Smuzhiyun 		}
3759*4882a593Smuzhiyun 	} else {
3760*4882a593Smuzhiyun 		p = list_first_entry(&tsk->publications, struct publication,
3761*4882a593Smuzhiyun 				     binding_sock);
3762*4882a593Smuzhiyun 	}
3763*4882a593Smuzhiyun 
3764*4882a593Smuzhiyun 	list_for_each_entry_from(p, &tsk->publications, binding_sock) {
3765*4882a593Smuzhiyun 		err = __tipc_nl_add_sk_publ(skb, cb, p);
3766*4882a593Smuzhiyun 		if (err) {
3767*4882a593Smuzhiyun 			*last_publ = p->key;
3768*4882a593Smuzhiyun 			return err;
3769*4882a593Smuzhiyun 		}
3770*4882a593Smuzhiyun 	}
3771*4882a593Smuzhiyun 	*last_publ = 0;
3772*4882a593Smuzhiyun 
3773*4882a593Smuzhiyun 	return 0;
3774*4882a593Smuzhiyun }
3775*4882a593Smuzhiyun 
tipc_nl_publ_dump(struct sk_buff * skb,struct netlink_callback * cb)3776*4882a593Smuzhiyun int tipc_nl_publ_dump(struct sk_buff *skb, struct netlink_callback *cb)
3777*4882a593Smuzhiyun {
3778*4882a593Smuzhiyun 	int err;
3779*4882a593Smuzhiyun 	u32 tsk_portid = cb->args[0];
3780*4882a593Smuzhiyun 	u32 last_publ = cb->args[1];
3781*4882a593Smuzhiyun 	u32 done = cb->args[2];
3782*4882a593Smuzhiyun 	struct net *net = sock_net(skb->sk);
3783*4882a593Smuzhiyun 	struct tipc_sock *tsk;
3784*4882a593Smuzhiyun 
3785*4882a593Smuzhiyun 	if (!tsk_portid) {
3786*4882a593Smuzhiyun 		struct nlattr **attrs = genl_dumpit_info(cb)->attrs;
3787*4882a593Smuzhiyun 		struct nlattr *sock[TIPC_NLA_SOCK_MAX + 1];
3788*4882a593Smuzhiyun 
3789*4882a593Smuzhiyun 		if (!attrs[TIPC_NLA_SOCK])
3790*4882a593Smuzhiyun 			return -EINVAL;
3791*4882a593Smuzhiyun 
3792*4882a593Smuzhiyun 		err = nla_parse_nested_deprecated(sock, TIPC_NLA_SOCK_MAX,
3793*4882a593Smuzhiyun 						  attrs[TIPC_NLA_SOCK],
3794*4882a593Smuzhiyun 						  tipc_nl_sock_policy, NULL);
3795*4882a593Smuzhiyun 		if (err)
3796*4882a593Smuzhiyun 			return err;
3797*4882a593Smuzhiyun 
3798*4882a593Smuzhiyun 		if (!sock[TIPC_NLA_SOCK_REF])
3799*4882a593Smuzhiyun 			return -EINVAL;
3800*4882a593Smuzhiyun 
3801*4882a593Smuzhiyun 		tsk_portid = nla_get_u32(sock[TIPC_NLA_SOCK_REF]);
3802*4882a593Smuzhiyun 	}
3803*4882a593Smuzhiyun 
3804*4882a593Smuzhiyun 	if (done)
3805*4882a593Smuzhiyun 		return 0;
3806*4882a593Smuzhiyun 
3807*4882a593Smuzhiyun 	tsk = tipc_sk_lookup(net, tsk_portid);
3808*4882a593Smuzhiyun 	if (!tsk)
3809*4882a593Smuzhiyun 		return -EINVAL;
3810*4882a593Smuzhiyun 
3811*4882a593Smuzhiyun 	lock_sock(&tsk->sk);
3812*4882a593Smuzhiyun 	err = __tipc_nl_list_sk_publ(skb, cb, tsk, &last_publ);
3813*4882a593Smuzhiyun 	if (!err)
3814*4882a593Smuzhiyun 		done = 1;
3815*4882a593Smuzhiyun 	release_sock(&tsk->sk);
3816*4882a593Smuzhiyun 	sock_put(&tsk->sk);
3817*4882a593Smuzhiyun 
3818*4882a593Smuzhiyun 	cb->args[0] = tsk_portid;
3819*4882a593Smuzhiyun 	cb->args[1] = last_publ;
3820*4882a593Smuzhiyun 	cb->args[2] = done;
3821*4882a593Smuzhiyun 
3822*4882a593Smuzhiyun 	return skb->len;
3823*4882a593Smuzhiyun }
3824*4882a593Smuzhiyun 
3825*4882a593Smuzhiyun /**
3826*4882a593Smuzhiyun  * tipc_sk_filtering - check if a socket should be traced
3827*4882a593Smuzhiyun  * @sk: the socket to be examined
3828*4882a593Smuzhiyun  * @sysctl_tipc_sk_filter[]: the socket tuple for filtering,
3829*4882a593Smuzhiyun  *  (portid, sock type, name type, name lower, name upper)
3830*4882a593Smuzhiyun  *
3831*4882a593Smuzhiyun  * Returns true if the socket meets the socket tuple data
3832*4882a593Smuzhiyun  * (value 0 = 'any') or when there is no tuple set (all = 0),
3833*4882a593Smuzhiyun  * otherwise false
3834*4882a593Smuzhiyun  */
tipc_sk_filtering(struct sock * sk)3835*4882a593Smuzhiyun bool tipc_sk_filtering(struct sock *sk)
3836*4882a593Smuzhiyun {
3837*4882a593Smuzhiyun 	struct tipc_sock *tsk;
3838*4882a593Smuzhiyun 	struct publication *p;
3839*4882a593Smuzhiyun 	u32 _port, _sktype, _type, _lower, _upper;
3840*4882a593Smuzhiyun 	u32 type = 0, lower = 0, upper = 0;
3841*4882a593Smuzhiyun 
3842*4882a593Smuzhiyun 	if (!sk)
3843*4882a593Smuzhiyun 		return true;
3844*4882a593Smuzhiyun 
3845*4882a593Smuzhiyun 	tsk = tipc_sk(sk);
3846*4882a593Smuzhiyun 
3847*4882a593Smuzhiyun 	_port = sysctl_tipc_sk_filter[0];
3848*4882a593Smuzhiyun 	_sktype = sysctl_tipc_sk_filter[1];
3849*4882a593Smuzhiyun 	_type = sysctl_tipc_sk_filter[2];
3850*4882a593Smuzhiyun 	_lower = sysctl_tipc_sk_filter[3];
3851*4882a593Smuzhiyun 	_upper = sysctl_tipc_sk_filter[4];
3852*4882a593Smuzhiyun 
3853*4882a593Smuzhiyun 	if (!_port && !_sktype && !_type && !_lower && !_upper)
3854*4882a593Smuzhiyun 		return true;
3855*4882a593Smuzhiyun 
3856*4882a593Smuzhiyun 	if (_port)
3857*4882a593Smuzhiyun 		return (_port == tsk->portid);
3858*4882a593Smuzhiyun 
3859*4882a593Smuzhiyun 	if (_sktype && _sktype != sk->sk_type)
3860*4882a593Smuzhiyun 		return false;
3861*4882a593Smuzhiyun 
3862*4882a593Smuzhiyun 	if (tsk->published) {
3863*4882a593Smuzhiyun 		p = list_first_entry_or_null(&tsk->publications,
3864*4882a593Smuzhiyun 					     struct publication, binding_sock);
3865*4882a593Smuzhiyun 		if (p) {
3866*4882a593Smuzhiyun 			type = p->type;
3867*4882a593Smuzhiyun 			lower = p->lower;
3868*4882a593Smuzhiyun 			upper = p->upper;
3869*4882a593Smuzhiyun 		}
3870*4882a593Smuzhiyun 	}
3871*4882a593Smuzhiyun 
3872*4882a593Smuzhiyun 	if (!tipc_sk_type_connectionless(sk)) {
3873*4882a593Smuzhiyun 		type = tsk->conn_type;
3874*4882a593Smuzhiyun 		lower = tsk->conn_instance;
3875*4882a593Smuzhiyun 		upper = tsk->conn_instance;
3876*4882a593Smuzhiyun 	}
3877*4882a593Smuzhiyun 
3878*4882a593Smuzhiyun 	if ((_type && _type != type) || (_lower && _lower != lower) ||
3879*4882a593Smuzhiyun 	    (_upper && _upper != upper))
3880*4882a593Smuzhiyun 		return false;
3881*4882a593Smuzhiyun 
3882*4882a593Smuzhiyun 	return true;
3883*4882a593Smuzhiyun }
3884*4882a593Smuzhiyun 
tipc_sock_get_portid(struct sock * sk)3885*4882a593Smuzhiyun u32 tipc_sock_get_portid(struct sock *sk)
3886*4882a593Smuzhiyun {
3887*4882a593Smuzhiyun 	return (sk) ? (tipc_sk(sk))->portid : 0;
3888*4882a593Smuzhiyun }
3889*4882a593Smuzhiyun 
3890*4882a593Smuzhiyun /**
3891*4882a593Smuzhiyun  * tipc_sk_overlimit1 - check if socket rx queue is about to be overloaded,
3892*4882a593Smuzhiyun  *			both the rcv and backlog queues are considered
3893*4882a593Smuzhiyun  * @sk: tipc sk to be checked
3894*4882a593Smuzhiyun  * @skb: tipc msg to be checked
3895*4882a593Smuzhiyun  *
3896*4882a593Smuzhiyun  * Returns true if the socket rx queue allocation is > 90%, otherwise false
3897*4882a593Smuzhiyun  */
3898*4882a593Smuzhiyun 
tipc_sk_overlimit1(struct sock * sk,struct sk_buff * skb)3899*4882a593Smuzhiyun bool tipc_sk_overlimit1(struct sock *sk, struct sk_buff *skb)
3900*4882a593Smuzhiyun {
3901*4882a593Smuzhiyun 	atomic_t *dcnt = &tipc_sk(sk)->dupl_rcvcnt;
3902*4882a593Smuzhiyun 	unsigned int lim = rcvbuf_limit(sk, skb) + atomic_read(dcnt);
3903*4882a593Smuzhiyun 	unsigned int qsize = sk->sk_backlog.len + sk_rmem_alloc_get(sk);
3904*4882a593Smuzhiyun 
3905*4882a593Smuzhiyun 	return (qsize > lim * 90 / 100);
3906*4882a593Smuzhiyun }
3907*4882a593Smuzhiyun 
3908*4882a593Smuzhiyun /**
3909*4882a593Smuzhiyun  * tipc_sk_overlimit2 - check if socket rx queue is about to be overloaded,
3910*4882a593Smuzhiyun  *			only the rcv queue is considered
3911*4882a593Smuzhiyun  * @sk: tipc sk to be checked
3912*4882a593Smuzhiyun  * @skb: tipc msg to be checked
3913*4882a593Smuzhiyun  *
3914*4882a593Smuzhiyun  * Returns true if the socket rx queue allocation is > 90%, otherwise false
3915*4882a593Smuzhiyun  */
3916*4882a593Smuzhiyun 
tipc_sk_overlimit2(struct sock * sk,struct sk_buff * skb)3917*4882a593Smuzhiyun bool tipc_sk_overlimit2(struct sock *sk, struct sk_buff *skb)
3918*4882a593Smuzhiyun {
3919*4882a593Smuzhiyun 	unsigned int lim = rcvbuf_limit(sk, skb);
3920*4882a593Smuzhiyun 	unsigned int qsize = sk_rmem_alloc_get(sk);
3921*4882a593Smuzhiyun 
3922*4882a593Smuzhiyun 	return (qsize > lim * 90 / 100);
3923*4882a593Smuzhiyun }
3924*4882a593Smuzhiyun 
3925*4882a593Smuzhiyun /**
3926*4882a593Smuzhiyun  * tipc_sk_dump - dump TIPC socket
3927*4882a593Smuzhiyun  * @sk: tipc sk to be dumped
3928*4882a593Smuzhiyun  * @dqueues: bitmask to decide if any socket queue to be dumped?
3929*4882a593Smuzhiyun  *           - TIPC_DUMP_NONE: don't dump socket queues
3930*4882a593Smuzhiyun  *           - TIPC_DUMP_SK_SNDQ: dump socket send queue
3931*4882a593Smuzhiyun  *           - TIPC_DUMP_SK_RCVQ: dump socket rcv queue
3932*4882a593Smuzhiyun  *           - TIPC_DUMP_SK_BKLGQ: dump socket backlog queue
3933*4882a593Smuzhiyun  *           - TIPC_DUMP_ALL: dump all the socket queues above
3934*4882a593Smuzhiyun  * @buf: returned buffer of dump data in format
3935*4882a593Smuzhiyun  */
tipc_sk_dump(struct sock * sk,u16 dqueues,char * buf)3936*4882a593Smuzhiyun int tipc_sk_dump(struct sock *sk, u16 dqueues, char *buf)
3937*4882a593Smuzhiyun {
3938*4882a593Smuzhiyun 	int i = 0;
3939*4882a593Smuzhiyun 	size_t sz = (dqueues) ? SK_LMAX : SK_LMIN;
3940*4882a593Smuzhiyun 	struct tipc_sock *tsk;
3941*4882a593Smuzhiyun 	struct publication *p;
3942*4882a593Smuzhiyun 	bool tsk_connected;
3943*4882a593Smuzhiyun 
3944*4882a593Smuzhiyun 	if (!sk) {
3945*4882a593Smuzhiyun 		i += scnprintf(buf, sz, "sk data: (null)\n");
3946*4882a593Smuzhiyun 		return i;
3947*4882a593Smuzhiyun 	}
3948*4882a593Smuzhiyun 
3949*4882a593Smuzhiyun 	tsk = tipc_sk(sk);
3950*4882a593Smuzhiyun 	tsk_connected = !tipc_sk_type_connectionless(sk);
3951*4882a593Smuzhiyun 
3952*4882a593Smuzhiyun 	i += scnprintf(buf, sz, "sk data: %u", sk->sk_type);
3953*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %d", sk->sk_state);
3954*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %x", tsk_own_node(tsk));
3955*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->portid);
3956*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %u", tsk_connected);
3957*4882a593Smuzhiyun 	if (tsk_connected) {
3958*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %x", tsk_peer_node(tsk));
3959*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", tsk_peer_port(tsk));
3960*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", tsk->conn_type);
3961*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", tsk->conn_instance);
3962*4882a593Smuzhiyun 	}
3963*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %u", tsk->published);
3964*4882a593Smuzhiyun 	if (tsk->published) {
3965*4882a593Smuzhiyun 		p = list_first_entry_or_null(&tsk->publications,
3966*4882a593Smuzhiyun 					     struct publication, binding_sock);
3967*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", (p) ? p->type : 0);
3968*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", (p) ? p->lower : 0);
3969*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, " %u", (p) ? p->upper : 0);
3970*4882a593Smuzhiyun 	}
3971*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %u", tsk->snd_win);
3972*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->rcv_win);
3973*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->max_pkt);
3974*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %x", tsk->peer_caps);
3975*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->cong_link_cnt);
3976*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->snt_unacked);
3977*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", tsk->rcv_unacked);
3978*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", atomic_read(&tsk->dupl_rcvcnt));
3979*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %u", sk->sk_shutdown);
3980*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %d", sk_wmem_alloc_get(sk));
3981*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %d", sk->sk_sndbuf);
3982*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %d", sk_rmem_alloc_get(sk));
3983*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " %d", sk->sk_rcvbuf);
3984*4882a593Smuzhiyun 	i += scnprintf(buf + i, sz - i, " | %d\n", READ_ONCE(sk->sk_backlog.len));
3985*4882a593Smuzhiyun 
3986*4882a593Smuzhiyun 	if (dqueues & TIPC_DUMP_SK_SNDQ) {
3987*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, "sk_write_queue: ");
3988*4882a593Smuzhiyun 		i += tipc_list_dump(&sk->sk_write_queue, false, buf + i);
3989*4882a593Smuzhiyun 	}
3990*4882a593Smuzhiyun 
3991*4882a593Smuzhiyun 	if (dqueues & TIPC_DUMP_SK_RCVQ) {
3992*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, "sk_receive_queue: ");
3993*4882a593Smuzhiyun 		i += tipc_list_dump(&sk->sk_receive_queue, false, buf + i);
3994*4882a593Smuzhiyun 	}
3995*4882a593Smuzhiyun 
3996*4882a593Smuzhiyun 	if (dqueues & TIPC_DUMP_SK_BKLGQ) {
3997*4882a593Smuzhiyun 		i += scnprintf(buf + i, sz - i, "sk_backlog:\n  head ");
3998*4882a593Smuzhiyun 		i += tipc_skb_dump(sk->sk_backlog.head, false, buf + i);
3999*4882a593Smuzhiyun 		if (sk->sk_backlog.tail != sk->sk_backlog.head) {
4000*4882a593Smuzhiyun 			i += scnprintf(buf + i, sz - i, "  tail ");
4001*4882a593Smuzhiyun 			i += tipc_skb_dump(sk->sk_backlog.tail, false,
4002*4882a593Smuzhiyun 					   buf + i);
4003*4882a593Smuzhiyun 		}
4004*4882a593Smuzhiyun 	}
4005*4882a593Smuzhiyun 
4006*4882a593Smuzhiyun 	return i;
4007*4882a593Smuzhiyun }
4008