// SPDX-License-Identifier: GPL-2.0-only
/*
 * Shared Memory Communications over RDMA (SMC-R) and RoCE
 *
 * Monitoring SMC transport protocol sockets
 *
 * Copyright IBM Corp. 2016
 *
 * Author(s): Ursula Braun <ubraun@linux.vnet.ibm.com>
 */
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include <linux/kernel.h>
13*4882a593Smuzhiyun #include <linux/module.h>
14*4882a593Smuzhiyun #include <linux/types.h>
15*4882a593Smuzhiyun #include <linux/init.h>
16*4882a593Smuzhiyun #include <linux/sock_diag.h>
17*4882a593Smuzhiyun #include <linux/inet_diag.h>
18*4882a593Smuzhiyun #include <linux/smc_diag.h>
19*4882a593Smuzhiyun #include <net/netlink.h>
20*4882a593Smuzhiyun #include <net/smc.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun #include "smc.h"
23*4882a593Smuzhiyun #include "smc_core.h"
24*4882a593Smuzhiyun
/*
 * Resume state of a multi-part dump. smc_dump_context() overlays this
 * structure on the netlink callback's ctx storage.
 */
struct smc_diag_dump_ctx {
	/* Sockets already walked, indexed by the p_type handed to
	 * smc_diag_dump_proto() (SMCPROTO_SMC / SMCPROTO_SMC6).
	 */
	int pos[2];
};
28*4882a593Smuzhiyun
smc_dump_context(struct netlink_callback * cb)29*4882a593Smuzhiyun static struct smc_diag_dump_ctx *smc_dump_context(struct netlink_callback *cb)
30*4882a593Smuzhiyun {
31*4882a593Smuzhiyun return (struct smc_diag_dump_ctx *)cb->ctx;
32*4882a593Smuzhiyun }
33*4882a593Smuzhiyun
/*
 * Render the eight big-endian 16-bit words stored at @gid_raw into @buf as
 * colon-separated groups of four lower-case hex digits.
 *
 * sprintf() is not bounded here: @buf has to provide room for the 39
 * characters produced plus the terminating NUL.
 */
static void smc_gid_be16_convert(__u8 *buf, u8 *gid_raw)
{
	__be16 *words = (__be16 *)gid_raw;

	sprintf(buf, "%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x",
		be16_to_cpu(words[0]), be16_to_cpu(words[1]),
		be16_to_cpu(words[2]), be16_to_cpu(words[3]),
		be16_to_cpu(words[4]), be16_to_cpu(words[5]),
		be16_to_cpu(words[6]), be16_to_cpu(words[7]));
}
46*4882a593Smuzhiyun
smc_diag_msg_common_fill(struct smc_diag_msg * r,struct sock * sk)47*4882a593Smuzhiyun static void smc_diag_msg_common_fill(struct smc_diag_msg *r, struct sock *sk)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun struct smc_sock *smc = smc_sk(sk);
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun memset(r, 0, sizeof(*r));
52*4882a593Smuzhiyun r->diag_family = sk->sk_family;
53*4882a593Smuzhiyun sock_diag_save_cookie(sk, r->id.idiag_cookie);
54*4882a593Smuzhiyun if (!smc->clcsock)
55*4882a593Smuzhiyun return;
56*4882a593Smuzhiyun r->id.idiag_sport = htons(smc->clcsock->sk->sk_num);
57*4882a593Smuzhiyun r->id.idiag_dport = smc->clcsock->sk->sk_dport;
58*4882a593Smuzhiyun r->id.idiag_if = smc->clcsock->sk->sk_bound_dev_if;
59*4882a593Smuzhiyun if (sk->sk_protocol == SMCPROTO_SMC) {
60*4882a593Smuzhiyun r->id.idiag_src[0] = smc->clcsock->sk->sk_rcv_saddr;
61*4882a593Smuzhiyun r->id.idiag_dst[0] = smc->clcsock->sk->sk_daddr;
62*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_IPV6)
63*4882a593Smuzhiyun } else if (sk->sk_protocol == SMCPROTO_SMC6) {
64*4882a593Smuzhiyun memcpy(&r->id.idiag_src, &smc->clcsock->sk->sk_v6_rcv_saddr,
65*4882a593Smuzhiyun sizeof(smc->clcsock->sk->sk_v6_rcv_saddr));
66*4882a593Smuzhiyun memcpy(&r->id.idiag_dst, &smc->clcsock->sk->sk_v6_daddr,
67*4882a593Smuzhiyun sizeof(smc->clcsock->sk->sk_v6_daddr));
68*4882a593Smuzhiyun #endif
69*4882a593Smuzhiyun }
70*4882a593Smuzhiyun }
71*4882a593Smuzhiyun
smc_diag_msg_attrs_fill(struct sock * sk,struct sk_buff * skb,struct smc_diag_msg * r,struct user_namespace * user_ns)72*4882a593Smuzhiyun static int smc_diag_msg_attrs_fill(struct sock *sk, struct sk_buff *skb,
73*4882a593Smuzhiyun struct smc_diag_msg *r,
74*4882a593Smuzhiyun struct user_namespace *user_ns)
75*4882a593Smuzhiyun {
76*4882a593Smuzhiyun if (nla_put_u8(skb, SMC_DIAG_SHUTDOWN, sk->sk_shutdown))
77*4882a593Smuzhiyun return 1;
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun r->diag_uid = from_kuid_munged(user_ns, sock_i_uid(sk));
80*4882a593Smuzhiyun r->diag_inode = sock_i_ino(sk);
81*4882a593Smuzhiyun return 0;
82*4882a593Smuzhiyun }
83*4882a593Smuzhiyun
__smc_diag_dump(struct sock * sk,struct sk_buff * skb,struct netlink_callback * cb,const struct smc_diag_req * req,struct nlattr * bc)84*4882a593Smuzhiyun static int __smc_diag_dump(struct sock *sk, struct sk_buff *skb,
85*4882a593Smuzhiyun struct netlink_callback *cb,
86*4882a593Smuzhiyun const struct smc_diag_req *req,
87*4882a593Smuzhiyun struct nlattr *bc)
88*4882a593Smuzhiyun {
89*4882a593Smuzhiyun struct smc_sock *smc = smc_sk(sk);
90*4882a593Smuzhiyun struct smc_diag_fallback fallback;
91*4882a593Smuzhiyun struct user_namespace *user_ns;
92*4882a593Smuzhiyun struct smc_diag_msg *r;
93*4882a593Smuzhiyun struct nlmsghdr *nlh;
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
96*4882a593Smuzhiyun cb->nlh->nlmsg_type, sizeof(*r), NLM_F_MULTI);
97*4882a593Smuzhiyun if (!nlh)
98*4882a593Smuzhiyun return -EMSGSIZE;
99*4882a593Smuzhiyun
100*4882a593Smuzhiyun r = nlmsg_data(nlh);
101*4882a593Smuzhiyun smc_diag_msg_common_fill(r, sk);
102*4882a593Smuzhiyun r->diag_state = sk->sk_state;
103*4882a593Smuzhiyun if (smc->use_fallback)
104*4882a593Smuzhiyun r->diag_mode = SMC_DIAG_MODE_FALLBACK_TCP;
105*4882a593Smuzhiyun else if (smc->conn.lgr && smc->conn.lgr->is_smcd)
106*4882a593Smuzhiyun r->diag_mode = SMC_DIAG_MODE_SMCD;
107*4882a593Smuzhiyun else
108*4882a593Smuzhiyun r->diag_mode = SMC_DIAG_MODE_SMCR;
109*4882a593Smuzhiyun user_ns = sk_user_ns(NETLINK_CB(cb->skb).sk);
110*4882a593Smuzhiyun if (smc_diag_msg_attrs_fill(sk, skb, r, user_ns))
111*4882a593Smuzhiyun goto errout;
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun fallback.reason = smc->fallback_rsn;
114*4882a593Smuzhiyun fallback.peer_diagnosis = smc->peer_diagnosis;
115*4882a593Smuzhiyun if (nla_put(skb, SMC_DIAG_FALLBACK, sizeof(fallback), &fallback) < 0)
116*4882a593Smuzhiyun goto errout;
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun if ((req->diag_ext & (1 << (SMC_DIAG_CONNINFO - 1))) &&
119*4882a593Smuzhiyun smc->conn.alert_token_local) {
120*4882a593Smuzhiyun struct smc_connection *conn = &smc->conn;
121*4882a593Smuzhiyun struct smc_diag_conninfo cinfo = {
122*4882a593Smuzhiyun .token = conn->alert_token_local,
123*4882a593Smuzhiyun .sndbuf_size = conn->sndbuf_desc ?
124*4882a593Smuzhiyun conn->sndbuf_desc->len : 0,
125*4882a593Smuzhiyun .rmbe_size = conn->rmb_desc ? conn->rmb_desc->len : 0,
126*4882a593Smuzhiyun .peer_rmbe_size = conn->peer_rmbe_size,
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun .rx_prod.wrap = conn->local_rx_ctrl.prod.wrap,
129*4882a593Smuzhiyun .rx_prod.count = conn->local_rx_ctrl.prod.count,
130*4882a593Smuzhiyun .rx_cons.wrap = conn->local_rx_ctrl.cons.wrap,
131*4882a593Smuzhiyun .rx_cons.count = conn->local_rx_ctrl.cons.count,
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun .tx_prod.wrap = conn->local_tx_ctrl.prod.wrap,
134*4882a593Smuzhiyun .tx_prod.count = conn->local_tx_ctrl.prod.count,
135*4882a593Smuzhiyun .tx_cons.wrap = conn->local_tx_ctrl.cons.wrap,
136*4882a593Smuzhiyun .tx_cons.count = conn->local_tx_ctrl.cons.count,
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun .tx_prod_flags =
139*4882a593Smuzhiyun *(u8 *)&conn->local_tx_ctrl.prod_flags,
140*4882a593Smuzhiyun .tx_conn_state_flags =
141*4882a593Smuzhiyun *(u8 *)&conn->local_tx_ctrl.conn_state_flags,
142*4882a593Smuzhiyun .rx_prod_flags = *(u8 *)&conn->local_rx_ctrl.prod_flags,
143*4882a593Smuzhiyun .rx_conn_state_flags =
144*4882a593Smuzhiyun *(u8 *)&conn->local_rx_ctrl.conn_state_flags,
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun .tx_prep.wrap = conn->tx_curs_prep.wrap,
147*4882a593Smuzhiyun .tx_prep.count = conn->tx_curs_prep.count,
148*4882a593Smuzhiyun .tx_sent.wrap = conn->tx_curs_sent.wrap,
149*4882a593Smuzhiyun .tx_sent.count = conn->tx_curs_sent.count,
150*4882a593Smuzhiyun .tx_fin.wrap = conn->tx_curs_fin.wrap,
151*4882a593Smuzhiyun .tx_fin.count = conn->tx_curs_fin.count,
152*4882a593Smuzhiyun };
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun if (nla_put(skb, SMC_DIAG_CONNINFO, sizeof(cinfo), &cinfo) < 0)
155*4882a593Smuzhiyun goto errout;
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun
158*4882a593Smuzhiyun if (smc->conn.lgr && !smc->conn.lgr->is_smcd &&
159*4882a593Smuzhiyun (req->diag_ext & (1 << (SMC_DIAG_LGRINFO - 1))) &&
160*4882a593Smuzhiyun !list_empty(&smc->conn.lgr->list)) {
161*4882a593Smuzhiyun struct smc_diag_lgrinfo linfo = {
162*4882a593Smuzhiyun .role = smc->conn.lgr->role,
163*4882a593Smuzhiyun .lnk[0].ibport = smc->conn.lgr->lnk[0].ibport,
164*4882a593Smuzhiyun .lnk[0].link_id = smc->conn.lgr->lnk[0].link_id,
165*4882a593Smuzhiyun };
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun memcpy(linfo.lnk[0].ibname,
168*4882a593Smuzhiyun smc->conn.lgr->lnk[0].smcibdev->ibdev->name,
169*4882a593Smuzhiyun sizeof(smc->conn.lgr->lnk[0].smcibdev->ibdev->name));
170*4882a593Smuzhiyun smc_gid_be16_convert(linfo.lnk[0].gid,
171*4882a593Smuzhiyun smc->conn.lgr->lnk[0].gid);
172*4882a593Smuzhiyun smc_gid_be16_convert(linfo.lnk[0].peer_gid,
173*4882a593Smuzhiyun smc->conn.lgr->lnk[0].peer_gid);
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun if (nla_put(skb, SMC_DIAG_LGRINFO, sizeof(linfo), &linfo) < 0)
176*4882a593Smuzhiyun goto errout;
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun if (smc->conn.lgr && smc->conn.lgr->is_smcd &&
179*4882a593Smuzhiyun (req->diag_ext & (1 << (SMC_DIAG_DMBINFO - 1))) &&
180*4882a593Smuzhiyun !list_empty(&smc->conn.lgr->list)) {
181*4882a593Smuzhiyun struct smc_connection *conn = &smc->conn;
182*4882a593Smuzhiyun struct smcd_diag_dmbinfo dinfo;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun memset(&dinfo, 0, sizeof(dinfo));
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun dinfo.linkid = *((u32 *)conn->lgr->id);
187*4882a593Smuzhiyun dinfo.peer_gid = conn->lgr->peer_gid;
188*4882a593Smuzhiyun dinfo.my_gid = conn->lgr->smcd->local_gid;
189*4882a593Smuzhiyun dinfo.token = conn->rmb_desc->token;
190*4882a593Smuzhiyun dinfo.peer_token = conn->peer_token;
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun if (nla_put(skb, SMC_DIAG_DMBINFO, sizeof(dinfo), &dinfo) < 0)
193*4882a593Smuzhiyun goto errout;
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun nlmsg_end(skb, nlh);
197*4882a593Smuzhiyun return 0;
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun errout:
200*4882a593Smuzhiyun nlmsg_cancel(skb, nlh);
201*4882a593Smuzhiyun return -EMSGSIZE;
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
smc_diag_dump_proto(struct proto * prot,struct sk_buff * skb,struct netlink_callback * cb,int p_type)204*4882a593Smuzhiyun static int smc_diag_dump_proto(struct proto *prot, struct sk_buff *skb,
205*4882a593Smuzhiyun struct netlink_callback *cb, int p_type)
206*4882a593Smuzhiyun {
207*4882a593Smuzhiyun struct smc_diag_dump_ctx *cb_ctx = smc_dump_context(cb);
208*4882a593Smuzhiyun struct net *net = sock_net(skb->sk);
209*4882a593Smuzhiyun int snum = cb_ctx->pos[p_type];
210*4882a593Smuzhiyun struct nlattr *bc = NULL;
211*4882a593Smuzhiyun struct hlist_head *head;
212*4882a593Smuzhiyun int rc = 0, num = 0;
213*4882a593Smuzhiyun struct sock *sk;
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun read_lock(&prot->h.smc_hash->lock);
216*4882a593Smuzhiyun head = &prot->h.smc_hash->ht;
217*4882a593Smuzhiyun if (hlist_empty(head))
218*4882a593Smuzhiyun goto out;
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun sk_for_each(sk, head) {
221*4882a593Smuzhiyun if (!net_eq(sock_net(sk), net))
222*4882a593Smuzhiyun continue;
223*4882a593Smuzhiyun if (num < snum)
224*4882a593Smuzhiyun goto next;
225*4882a593Smuzhiyun rc = __smc_diag_dump(sk, skb, cb, nlmsg_data(cb->nlh), bc);
226*4882a593Smuzhiyun if (rc < 0)
227*4882a593Smuzhiyun goto out;
228*4882a593Smuzhiyun next:
229*4882a593Smuzhiyun num++;
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun out:
233*4882a593Smuzhiyun read_unlock(&prot->h.smc_hash->lock);
234*4882a593Smuzhiyun cb_ctx->pos[p_type] = num;
235*4882a593Smuzhiyun return rc;
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
smc_diag_dump(struct sk_buff * skb,struct netlink_callback * cb)238*4882a593Smuzhiyun static int smc_diag_dump(struct sk_buff *skb, struct netlink_callback *cb)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun int rc = 0;
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun rc = smc_diag_dump_proto(&smc_proto, skb, cb, SMCPROTO_SMC);
243*4882a593Smuzhiyun if (!rc)
244*4882a593Smuzhiyun smc_diag_dump_proto(&smc_proto6, skb, cb, SMCPROTO_SMC6);
245*4882a593Smuzhiyun return skb->len;
246*4882a593Smuzhiyun }
247*4882a593Smuzhiyun
smc_diag_handler_dump(struct sk_buff * skb,struct nlmsghdr * h)248*4882a593Smuzhiyun static int smc_diag_handler_dump(struct sk_buff *skb, struct nlmsghdr *h)
249*4882a593Smuzhiyun {
250*4882a593Smuzhiyun struct net *net = sock_net(skb->sk);
251*4882a593Smuzhiyun
252*4882a593Smuzhiyun if (h->nlmsg_type == SOCK_DIAG_BY_FAMILY &&
253*4882a593Smuzhiyun h->nlmsg_flags & NLM_F_DUMP) {
254*4882a593Smuzhiyun {
255*4882a593Smuzhiyun struct netlink_dump_control c = {
256*4882a593Smuzhiyun .dump = smc_diag_dump,
257*4882a593Smuzhiyun .min_dump_alloc = SKB_WITH_OVERHEAD(32768),
258*4882a593Smuzhiyun };
259*4882a593Smuzhiyun return netlink_dump_start(net->diag_nlsk, skb, h, &c);
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun return 0;
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun static const struct sock_diag_handler smc_diag_handler = {
266*4882a593Smuzhiyun .family = AF_SMC,
267*4882a593Smuzhiyun .dump = smc_diag_handler_dump,
268*4882a593Smuzhiyun };
269*4882a593Smuzhiyun
smc_diag_init(void)270*4882a593Smuzhiyun static int __init smc_diag_init(void)
271*4882a593Smuzhiyun {
272*4882a593Smuzhiyun return sock_diag_register(&smc_diag_handler);
273*4882a593Smuzhiyun }
274*4882a593Smuzhiyun
smc_diag_exit(void)275*4882a593Smuzhiyun static void __exit smc_diag_exit(void)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun sock_diag_unregister(&smc_diag_handler);
278*4882a593Smuzhiyun }
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun module_init(smc_diag_init);
281*4882a593Smuzhiyun module_exit(smc_diag_exit);
282*4882a593Smuzhiyun MODULE_LICENSE("GPL");
283*4882a593Smuzhiyun MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 43 /* AF_SMC */);
284