smc_diag.c 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Shared Memory Communications over RDMA (SMC-R) and RoCE
  4. *
  5. * Monitoring SMC transport protocol sockets
  6. *
  7. * Copyright IBM Corp. 2016
  8. *
  9. * Author(s): Ursula Braun <ubraun@linux.vnet.ibm.com>
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/module.h>
  13. #include <linux/types.h>
  14. #include <linux/init.h>
  15. #include <linux/sock_diag.h>
  16. #include <linux/inet_diag.h>
  17. #include <linux/smc_diag.h>
  18. #include <net/netlink.h>
  19. #include <net/smc.h>
  20. #include "smc.h"
  21. #include "smc_core.h"
  22. #include "smc_ism.h"
  23. struct smc_diag_dump_ctx {
  24. int pos[2];
  25. };
  26. static struct smc_diag_dump_ctx *smc_dump_context(struct netlink_callback *cb)
  27. {
  28. return (struct smc_diag_dump_ctx *)cb->ctx;
  29. }
  30. static void smc_diag_msg_common_fill(struct smc_diag_msg *r, struct sock *sk)
  31. {
  32. struct smc_sock *smc = smc_sk(sk);
  33. memset(r, 0, sizeof(*r));
  34. r->diag_family = sk->sk_family;
  35. sock_diag_save_cookie(sk, r->id.idiag_cookie);
  36. if (!smc->clcsock)
  37. return;
  38. r->id.idiag_sport = htons(smc->clcsock->sk->sk_num);
  39. r->id.idiag_dport = smc->clcsock->sk->sk_dport;
  40. r->id.idiag_if = smc->clcsock->sk->sk_bound_dev_if;
  41. if (sk->sk_protocol == SMCPROTO_SMC) {
  42. r->id.idiag_src[0] = smc->clcsock->sk->sk_rcv_saddr;
  43. r->id.idiag_dst[0] = smc->clcsock->sk->sk_daddr;
  44. #if IS_ENABLED(CONFIG_IPV6)
  45. } else if (sk->sk_protocol == SMCPROTO_SMC6) {
  46. memcpy(&r->id.idiag_src, &smc->clcsock->sk->sk_v6_rcv_saddr,
  47. sizeof(smc->clcsock->sk->sk_v6_rcv_saddr));
  48. memcpy(&r->id.idiag_dst, &smc->clcsock->sk->sk_v6_daddr,
  49. sizeof(smc->clcsock->sk->sk_v6_daddr));
  50. #endif
  51. }
  52. }
  53. static int smc_diag_msg_attrs_fill(struct sock *sk, struct sk_buff *skb,
  54. struct smc_diag_msg *r,
  55. struct user_namespace *user_ns)
  56. {
  57. if (nla_put_u8(skb, SMC_DIAG_SHUTDOWN, sk->sk_shutdown))
  58. return 1;
  59. r->diag_uid = from_kuid_munged(user_ns, sock_i_uid(sk));
  60. r->diag_inode = sock_i_ino(sk);
  61. return 0;
  62. }
  63. static int __smc_diag_dump(struct sock *sk, struct sk_buff *skb,
  64. struct netlink_callback *cb,
  65. const struct smc_diag_req *req,
  66. struct nlattr *bc)
  67. {
  68. struct smc_sock *smc = smc_sk(sk);
  69. struct smc_diag_fallback fallback;
  70. struct user_namespace *user_ns;
  71. struct smc_diag_msg *r;
  72. struct nlmsghdr *nlh;
  73. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
  74. cb->nlh->nlmsg_type, sizeof(*r), NLM_F_MULTI);
  75. if (!nlh)
  76. return -EMSGSIZE;
  77. r = nlmsg_data(nlh);
  78. smc_diag_msg_common_fill(r, sk);
  79. r->diag_state = sk->sk_state;
  80. if (smc->use_fallback)
  81. r->diag_mode = SMC_DIAG_MODE_FALLBACK_TCP;
  82. else if (smc_conn_lgr_valid(&smc->conn) && smc->conn.lgr->is_smcd)
  83. r->diag_mode = SMC_DIAG_MODE_SMCD;
  84. else
  85. r->diag_mode = SMC_DIAG_MODE_SMCR;
  86. user_ns = sk_user_ns(NETLINK_CB(cb->skb).sk);
  87. if (smc_diag_msg_attrs_fill(sk, skb, r, user_ns))
  88. goto errout;
  89. fallback.reason = smc->fallback_rsn;
  90. fallback.peer_diagnosis = smc->peer_diagnosis;
  91. if (nla_put(skb, SMC_DIAG_FALLBACK, sizeof(fallback), &fallback) < 0)
  92. goto errout;
  93. if ((req->diag_ext & (1 << (SMC_DIAG_CONNINFO - 1))) &&
  94. smc->conn.alert_token_local) {
  95. struct smc_connection *conn = &smc->conn;
  96. struct smc_diag_conninfo cinfo = {
  97. .token = conn->alert_token_local,
  98. .sndbuf_size = conn->sndbuf_desc ?
  99. conn->sndbuf_desc->len : 0,
  100. .rmbe_size = conn->rmb_desc ? conn->rmb_desc->len : 0,
  101. .peer_rmbe_size = conn->peer_rmbe_size,
  102. .rx_prod.wrap = conn->local_rx_ctrl.prod.wrap,
  103. .rx_prod.count = conn->local_rx_ctrl.prod.count,
  104. .rx_cons.wrap = conn->local_rx_ctrl.cons.wrap,
  105. .rx_cons.count = conn->local_rx_ctrl.cons.count,
  106. .tx_prod.wrap = conn->local_tx_ctrl.prod.wrap,
  107. .tx_prod.count = conn->local_tx_ctrl.prod.count,
  108. .tx_cons.wrap = conn->local_tx_ctrl.cons.wrap,
  109. .tx_cons.count = conn->local_tx_ctrl.cons.count,
  110. .tx_prod_flags =
  111. *(u8 *)&conn->local_tx_ctrl.prod_flags,
  112. .tx_conn_state_flags =
  113. *(u8 *)&conn->local_tx_ctrl.conn_state_flags,
  114. .rx_prod_flags = *(u8 *)&conn->local_rx_ctrl.prod_flags,
  115. .rx_conn_state_flags =
  116. *(u8 *)&conn->local_rx_ctrl.conn_state_flags,
  117. .tx_prep.wrap = conn->tx_curs_prep.wrap,
  118. .tx_prep.count = conn->tx_curs_prep.count,
  119. .tx_sent.wrap = conn->tx_curs_sent.wrap,
  120. .tx_sent.count = conn->tx_curs_sent.count,
  121. .tx_fin.wrap = conn->tx_curs_fin.wrap,
  122. .tx_fin.count = conn->tx_curs_fin.count,
  123. };
  124. if (nla_put(skb, SMC_DIAG_CONNINFO, sizeof(cinfo), &cinfo) < 0)
  125. goto errout;
  126. }
  127. if (smc_conn_lgr_valid(&smc->conn) && !smc->conn.lgr->is_smcd &&
  128. (req->diag_ext & (1 << (SMC_DIAG_LGRINFO - 1))) &&
  129. !list_empty(&smc->conn.lgr->list)) {
  130. struct smc_link *link = smc->conn.lnk;
  131. struct smc_diag_lgrinfo linfo = {
  132. .role = smc->conn.lgr->role,
  133. .lnk[0].ibport = link->ibport,
  134. .lnk[0].link_id = link->link_id,
  135. };
  136. memcpy(linfo.lnk[0].ibname, link->smcibdev->ibdev->name,
  137. sizeof(link->smcibdev->ibdev->name));
  138. smc_gid_be16_convert(linfo.lnk[0].gid, link->gid);
  139. smc_gid_be16_convert(linfo.lnk[0].peer_gid, link->peer_gid);
  140. if (nla_put(skb, SMC_DIAG_LGRINFO, sizeof(linfo), &linfo) < 0)
  141. goto errout;
  142. }
  143. if (smc_conn_lgr_valid(&smc->conn) && smc->conn.lgr->is_smcd &&
  144. (req->diag_ext & (1 << (SMC_DIAG_DMBINFO - 1))) &&
  145. !list_empty(&smc->conn.lgr->list) && smc->conn.rmb_desc) {
  146. struct smc_connection *conn = &smc->conn;
  147. struct smcd_diag_dmbinfo dinfo;
  148. struct smcd_dev *smcd = conn->lgr->smcd;
  149. struct smcd_gid smcd_gid;
  150. memset(&dinfo, 0, sizeof(dinfo));
  151. dinfo.linkid = *((u32 *)conn->lgr->id);
  152. dinfo.peer_gid = conn->lgr->peer_gid.gid;
  153. dinfo.peer_gid_ext = conn->lgr->peer_gid.gid_ext;
  154. smcd->ops->get_local_gid(smcd, &smcd_gid);
  155. dinfo.my_gid = smcd_gid.gid;
  156. dinfo.my_gid_ext = smcd_gid.gid_ext;
  157. dinfo.token = conn->rmb_desc->token;
  158. dinfo.peer_token = conn->peer_token;
  159. if (nla_put(skb, SMC_DIAG_DMBINFO, sizeof(dinfo), &dinfo) < 0)
  160. goto errout;
  161. }
  162. nlmsg_end(skb, nlh);
  163. return 0;
  164. errout:
  165. nlmsg_cancel(skb, nlh);
  166. return -EMSGSIZE;
  167. }
  168. static int smc_diag_dump_proto(struct proto *prot, struct sk_buff *skb,
  169. struct netlink_callback *cb, int p_type)
  170. {
  171. struct smc_diag_dump_ctx *cb_ctx = smc_dump_context(cb);
  172. struct net *net = sock_net(skb->sk);
  173. int snum = cb_ctx->pos[p_type];
  174. struct nlattr *bc = NULL;
  175. struct hlist_head *head;
  176. int rc = 0, num = 0;
  177. struct sock *sk;
  178. read_lock(&prot->h.smc_hash->lock);
  179. head = &prot->h.smc_hash->ht;
  180. if (hlist_empty(head))
  181. goto out;
  182. sk_for_each(sk, head) {
  183. if (!net_eq(sock_net(sk), net))
  184. continue;
  185. if (num < snum)
  186. goto next;
  187. rc = __smc_diag_dump(sk, skb, cb, nlmsg_data(cb->nlh), bc);
  188. if (rc < 0)
  189. goto out;
  190. next:
  191. num++;
  192. }
  193. out:
  194. read_unlock(&prot->h.smc_hash->lock);
  195. cb_ctx->pos[p_type] = num;
  196. return rc;
  197. }
  198. static int smc_diag_dump(struct sk_buff *skb, struct netlink_callback *cb)
  199. {
  200. int rc = 0;
  201. rc = smc_diag_dump_proto(&smc_proto, skb, cb, SMCPROTO_SMC);
  202. if (!rc)
  203. smc_diag_dump_proto(&smc_proto6, skb, cb, SMCPROTO_SMC6);
  204. return skb->len;
  205. }
  206. static int smc_diag_handler_dump(struct sk_buff *skb, struct nlmsghdr *h)
  207. {
  208. struct net *net = sock_net(skb->sk);
  209. if (h->nlmsg_type == SOCK_DIAG_BY_FAMILY &&
  210. h->nlmsg_flags & NLM_F_DUMP) {
  211. {
  212. struct netlink_dump_control c = {
  213. .dump = smc_diag_dump,
  214. .min_dump_alloc = SKB_WITH_OVERHEAD(32768),
  215. };
  216. return netlink_dump_start(net->diag_nlsk, skb, h, &c);
  217. }
  218. }
  219. return 0;
  220. }
  221. static const struct sock_diag_handler smc_diag_handler = {
  222. .owner = THIS_MODULE,
  223. .family = AF_SMC,
  224. .dump = smc_diag_handler_dump,
  225. };
  226. static int __init smc_diag_init(void)
  227. {
  228. return sock_diag_register(&smc_diag_handler);
  229. }
  230. static void __exit smc_diag_exit(void)
  231. {
  232. sock_diag_unregister(&smc_diag_handler);
  233. }
  234. module_init(smc_diag_init);
  235. module_exit(smc_diag_exit);
  236. MODULE_LICENSE("GPL");
  237. MODULE_DESCRIPTION("SMC socket monitoring via SOCK_DIAG");
  238. MODULE_ALIAS_NET_PF_PROTO_TYPE(PF_NETLINK, NETLINK_SOCK_DIAG, 43 /* AF_SMC */);
  239. MODULE_ALIAS_GENL_FAMILY(SMCR_GENL_FAMILY_NAME);