br_arp_nd_proxy.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475
  1. /*
  2. * Handle bridge arp/nd proxy/suppress
  3. *
  4. * Copyright (C) 2017 Cumulus Networks
  5. * Copyright (c) 2017 Roopa Prabhu <roopa@cumulusnetworks.com>
  6. *
  7. * Authors:
  8. * Roopa Prabhu <roopa@cumulusnetworks.com>
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. */
  15. #include <linux/kernel.h>
  16. #include <linux/netdevice.h>
  17. #include <linux/etherdevice.h>
  18. #include <linux/neighbour.h>
  19. #include <net/arp.h>
  20. #include <linux/if_vlan.h>
  21. #include <linux/inetdevice.h>
  22. #include <net/addrconf.h>
  23. #if IS_ENABLED(CONFIG_IPV6)
  24. #include <net/ip6_checksum.h>
  25. #endif
  26. #include "br_private.h"
  27. void br_recalculate_neigh_suppress_enabled(struct net_bridge *br)
  28. {
  29. struct net_bridge_port *p;
  30. bool neigh_suppress = false;
  31. list_for_each_entry(p, &br->port_list, list) {
  32. if (p->flags & BR_NEIGH_SUPPRESS) {
  33. neigh_suppress = true;
  34. break;
  35. }
  36. }
  37. br->neigh_suppress_enabled = neigh_suppress;
  38. }
  39. #if IS_ENABLED(CONFIG_INET)
  40. static void br_arp_send(struct net_bridge *br, struct net_bridge_port *p,
  41. struct net_device *dev, __be32 dest_ip, __be32 src_ip,
  42. const unsigned char *dest_hw,
  43. const unsigned char *src_hw,
  44. const unsigned char *target_hw,
  45. __be16 vlan_proto, u16 vlan_tci)
  46. {
  47. struct net_bridge_vlan_group *vg;
  48. struct sk_buff *skb;
  49. u16 pvid;
  50. netdev_dbg(dev, "arp send dev %s dst %pI4 dst_hw %pM src %pI4 src_hw %pM\n",
  51. dev->name, &dest_ip, dest_hw, &src_ip, src_hw);
  52. if (!vlan_tci) {
  53. arp_send(ARPOP_REPLY, ETH_P_ARP, dest_ip, dev, src_ip,
  54. dest_hw, src_hw, target_hw);
  55. return;
  56. }
  57. skb = arp_create(ARPOP_REPLY, ETH_P_ARP, dest_ip, dev, src_ip,
  58. dest_hw, src_hw, target_hw);
  59. if (!skb)
  60. return;
  61. if (p)
  62. vg = nbp_vlan_group_rcu(p);
  63. else
  64. vg = br_vlan_group_rcu(br);
  65. pvid = br_get_pvid(vg);
  66. if (pvid == (vlan_tci & VLAN_VID_MASK))
  67. vlan_tci = 0;
  68. if (vlan_tci)
  69. __vlan_hwaccel_put_tag(skb, vlan_proto, vlan_tci);
  70. if (p) {
  71. arp_xmit(skb);
  72. } else {
  73. skb_reset_mac_header(skb);
  74. __skb_pull(skb, skb_network_offset(skb));
  75. skb->ip_summed = CHECKSUM_UNNECESSARY;
  76. skb->pkt_type = PACKET_HOST;
  77. netif_rx_ni(skb);
  78. }
  79. }
  80. static int br_chk_addr_ip(struct net_device *dev, void *data)
  81. {
  82. __be32 ip = *(__be32 *)data;
  83. struct in_device *in_dev;
  84. __be32 addr = 0;
  85. in_dev = __in_dev_get_rcu(dev);
  86. if (in_dev)
  87. addr = inet_confirm_addr(dev_net(dev), in_dev, 0, ip,
  88. RT_SCOPE_HOST);
  89. if (addr == ip)
  90. return 1;
  91. return 0;
  92. }
  93. static bool br_is_local_ip(struct net_device *dev, __be32 ip)
  94. {
  95. if (br_chk_addr_ip(dev, &ip))
  96. return true;
  97. /* check if ip is configured on upper dev */
  98. if (netdev_walk_all_upper_dev_rcu(dev, br_chk_addr_ip, &ip))
  99. return true;
  100. return false;
  101. }
  102. void br_do_proxy_suppress_arp(struct sk_buff *skb, struct net_bridge *br,
  103. u16 vid, struct net_bridge_port *p)
  104. {
  105. struct net_device *dev = br->dev;
  106. struct net_device *vlandev = dev;
  107. struct neighbour *n;
  108. struct arphdr *parp;
  109. u8 *arpptr, *sha;
  110. __be32 sip, tip;
  111. BR_INPUT_SKB_CB(skb)->proxyarp_replied = false;
  112. if ((dev->flags & IFF_NOARP) ||
  113. !pskb_may_pull(skb, arp_hdr_len(dev)))
  114. return;
  115. parp = arp_hdr(skb);
  116. if (parp->ar_pro != htons(ETH_P_IP) ||
  117. parp->ar_hln != dev->addr_len ||
  118. parp->ar_pln != 4)
  119. return;
  120. arpptr = (u8 *)parp + sizeof(struct arphdr);
  121. sha = arpptr;
  122. arpptr += dev->addr_len; /* sha */
  123. memcpy(&sip, arpptr, sizeof(sip));
  124. arpptr += sizeof(sip);
  125. arpptr += dev->addr_len; /* tha */
  126. memcpy(&tip, arpptr, sizeof(tip));
  127. if (ipv4_is_loopback(tip) ||
  128. ipv4_is_multicast(tip))
  129. return;
  130. if (br->neigh_suppress_enabled) {
  131. if (p && (p->flags & BR_NEIGH_SUPPRESS))
  132. return;
  133. if (parp->ar_op != htons(ARPOP_RREQUEST) &&
  134. parp->ar_op != htons(ARPOP_RREPLY) &&
  135. (ipv4_is_zeronet(sip) || sip == tip)) {
  136. /* prevent flooding to neigh suppress ports */
  137. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  138. return;
  139. }
  140. }
  141. if (parp->ar_op != htons(ARPOP_REQUEST))
  142. return;
  143. if (vid != 0) {
  144. vlandev = __vlan_find_dev_deep_rcu(br->dev, skb->vlan_proto,
  145. vid);
  146. if (!vlandev)
  147. return;
  148. }
  149. if (br->neigh_suppress_enabled && br_is_local_ip(vlandev, tip)) {
  150. /* its our local ip, so don't proxy reply
  151. * and don't forward to neigh suppress ports
  152. */
  153. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  154. return;
  155. }
  156. n = neigh_lookup(&arp_tbl, &tip, vlandev);
  157. if (n) {
  158. struct net_bridge_fdb_entry *f;
  159. if (!(n->nud_state & NUD_VALID)) {
  160. neigh_release(n);
  161. return;
  162. }
  163. f = br_fdb_find_rcu(br, n->ha, vid);
  164. if (f) {
  165. bool replied = false;
  166. if ((p && (p->flags & BR_PROXYARP)) ||
  167. (f->dst && (f->dst->flags & (BR_PROXYARP_WIFI |
  168. BR_NEIGH_SUPPRESS)))) {
  169. if (!vid)
  170. br_arp_send(br, p, skb->dev, sip, tip,
  171. sha, n->ha, sha, 0, 0);
  172. else
  173. br_arp_send(br, p, skb->dev, sip, tip,
  174. sha, n->ha, sha,
  175. skb->vlan_proto,
  176. skb_vlan_tag_get(skb));
  177. replied = true;
  178. }
  179. /* If we have replied or as long as we know the
  180. * mac, indicate to arp replied
  181. */
  182. if (replied || br->neigh_suppress_enabled)
  183. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  184. }
  185. neigh_release(n);
  186. }
  187. }
  188. #endif
  189. #if IS_ENABLED(CONFIG_IPV6)
  190. struct nd_msg *br_is_nd_neigh_msg(struct sk_buff *skb, struct nd_msg *msg)
  191. {
  192. struct nd_msg *m;
  193. m = skb_header_pointer(skb, skb_network_offset(skb) +
  194. sizeof(struct ipv6hdr), sizeof(*msg), msg);
  195. if (!m)
  196. return NULL;
  197. if (m->icmph.icmp6_code != 0 ||
  198. (m->icmph.icmp6_type != NDISC_NEIGHBOUR_SOLICITATION &&
  199. m->icmph.icmp6_type != NDISC_NEIGHBOUR_ADVERTISEMENT))
  200. return NULL;
  201. return m;
  202. }
  203. static void br_nd_send(struct net_bridge *br, struct net_bridge_port *p,
  204. struct sk_buff *request, struct neighbour *n,
  205. __be16 vlan_proto, u16 vlan_tci, struct nd_msg *ns)
  206. {
  207. struct net_device *dev = request->dev;
  208. struct net_bridge_vlan_group *vg;
  209. struct sk_buff *reply;
  210. struct nd_msg *na;
  211. struct ipv6hdr *pip6;
  212. int na_olen = 8; /* opt hdr + ETH_ALEN for target */
  213. int ns_olen;
  214. int i, len;
  215. u8 *daddr;
  216. u16 pvid;
  217. if (!dev)
  218. return;
  219. len = LL_RESERVED_SPACE(dev) + sizeof(struct ipv6hdr) +
  220. sizeof(*na) + na_olen + dev->needed_tailroom;
  221. reply = alloc_skb(len, GFP_ATOMIC);
  222. if (!reply)
  223. return;
  224. reply->protocol = htons(ETH_P_IPV6);
  225. reply->dev = dev;
  226. skb_reserve(reply, LL_RESERVED_SPACE(dev));
  227. skb_push(reply, sizeof(struct ethhdr));
  228. skb_set_mac_header(reply, 0);
  229. daddr = eth_hdr(request)->h_source;
  230. /* Do we need option processing ? */
  231. ns_olen = request->len - (skb_network_offset(request) +
  232. sizeof(struct ipv6hdr)) - sizeof(*ns);
  233. for (i = 0; i < ns_olen - 1; i += (ns->opt[i + 1] << 3)) {
  234. if (!ns->opt[i + 1]) {
  235. kfree_skb(reply);
  236. return;
  237. }
  238. if (ns->opt[i] == ND_OPT_SOURCE_LL_ADDR) {
  239. daddr = ns->opt + i + sizeof(struct nd_opt_hdr);
  240. break;
  241. }
  242. }
  243. /* Ethernet header */
  244. ether_addr_copy(eth_hdr(reply)->h_dest, daddr);
  245. ether_addr_copy(eth_hdr(reply)->h_source, n->ha);
  246. eth_hdr(reply)->h_proto = htons(ETH_P_IPV6);
  247. reply->protocol = htons(ETH_P_IPV6);
  248. skb_pull(reply, sizeof(struct ethhdr));
  249. skb_set_network_header(reply, 0);
  250. skb_put(reply, sizeof(struct ipv6hdr));
  251. /* IPv6 header */
  252. pip6 = ipv6_hdr(reply);
  253. memset(pip6, 0, sizeof(struct ipv6hdr));
  254. pip6->version = 6;
  255. pip6->priority = ipv6_hdr(request)->priority;
  256. pip6->nexthdr = IPPROTO_ICMPV6;
  257. pip6->hop_limit = 255;
  258. pip6->daddr = ipv6_hdr(request)->saddr;
  259. pip6->saddr = *(struct in6_addr *)n->primary_key;
  260. skb_pull(reply, sizeof(struct ipv6hdr));
  261. skb_set_transport_header(reply, 0);
  262. na = (struct nd_msg *)skb_put(reply, sizeof(*na) + na_olen);
  263. /* Neighbor Advertisement */
  264. memset(na, 0, sizeof(*na) + na_olen);
  265. na->icmph.icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT;
  266. na->icmph.icmp6_router = (n->flags & NTF_ROUTER) ? 1 : 0;
  267. na->icmph.icmp6_override = 1;
  268. na->icmph.icmp6_solicited = 1;
  269. na->target = ns->target;
  270. ether_addr_copy(&na->opt[2], n->ha);
  271. na->opt[0] = ND_OPT_TARGET_LL_ADDR;
  272. na->opt[1] = na_olen >> 3;
  273. na->icmph.icmp6_cksum = csum_ipv6_magic(&pip6->saddr,
  274. &pip6->daddr,
  275. sizeof(*na) + na_olen,
  276. IPPROTO_ICMPV6,
  277. csum_partial(na, sizeof(*na) + na_olen, 0));
  278. pip6->payload_len = htons(sizeof(*na) + na_olen);
  279. skb_push(reply, sizeof(struct ipv6hdr));
  280. skb_push(reply, sizeof(struct ethhdr));
  281. reply->ip_summed = CHECKSUM_UNNECESSARY;
  282. if (p)
  283. vg = nbp_vlan_group_rcu(p);
  284. else
  285. vg = br_vlan_group_rcu(br);
  286. pvid = br_get_pvid(vg);
  287. if (pvid == (vlan_tci & VLAN_VID_MASK))
  288. vlan_tci = 0;
  289. if (vlan_tci)
  290. __vlan_hwaccel_put_tag(reply, vlan_proto, vlan_tci);
  291. netdev_dbg(dev, "nd send dev %s dst %pI6 dst_hw %pM src %pI6 src_hw %pM\n",
  292. dev->name, &pip6->daddr, daddr, &pip6->saddr, n->ha);
  293. if (p) {
  294. dev_queue_xmit(reply);
  295. } else {
  296. skb_reset_mac_header(reply);
  297. __skb_pull(reply, skb_network_offset(reply));
  298. reply->ip_summed = CHECKSUM_UNNECESSARY;
  299. reply->pkt_type = PACKET_HOST;
  300. netif_rx_ni(reply);
  301. }
  302. }
  303. static int br_chk_addr_ip6(struct net_device *dev, void *data)
  304. {
  305. struct in6_addr *addr = (struct in6_addr *)data;
  306. if (ipv6_chk_addr(dev_net(dev), addr, dev, 0))
  307. return 1;
  308. return 0;
  309. }
  310. static bool br_is_local_ip6(struct net_device *dev, struct in6_addr *addr)
  311. {
  312. if (br_chk_addr_ip6(dev, addr))
  313. return true;
  314. /* check if ip is configured on upper dev */
  315. if (netdev_walk_all_upper_dev_rcu(dev, br_chk_addr_ip6, addr))
  316. return true;
  317. return false;
  318. }
  319. void br_do_suppress_nd(struct sk_buff *skb, struct net_bridge *br,
  320. u16 vid, struct net_bridge_port *p, struct nd_msg *msg)
  321. {
  322. struct net_device *dev = br->dev;
  323. struct net_device *vlandev = NULL;
  324. struct in6_addr *saddr, *daddr;
  325. struct ipv6hdr *iphdr;
  326. struct neighbour *n;
  327. BR_INPUT_SKB_CB(skb)->proxyarp_replied = false;
  328. if (p && (p->flags & BR_NEIGH_SUPPRESS))
  329. return;
  330. if (msg->icmph.icmp6_type == NDISC_NEIGHBOUR_ADVERTISEMENT &&
  331. !msg->icmph.icmp6_solicited) {
  332. /* prevent flooding to neigh suppress ports */
  333. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  334. return;
  335. }
  336. if (msg->icmph.icmp6_type != NDISC_NEIGHBOUR_SOLICITATION)
  337. return;
  338. iphdr = ipv6_hdr(skb);
  339. saddr = &iphdr->saddr;
  340. daddr = &iphdr->daddr;
  341. if (ipv6_addr_any(saddr) || !ipv6_addr_cmp(saddr, daddr)) {
  342. /* prevent flooding to neigh suppress ports */
  343. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  344. return;
  345. }
  346. if (vid != 0) {
  347. /* build neigh table lookup on the vlan device */
  348. vlandev = __vlan_find_dev_deep_rcu(br->dev, skb->vlan_proto,
  349. vid);
  350. if (!vlandev)
  351. return;
  352. } else {
  353. vlandev = dev;
  354. }
  355. if (br_is_local_ip6(vlandev, &msg->target)) {
  356. /* its our own ip, so don't proxy reply
  357. * and don't forward to arp suppress ports
  358. */
  359. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  360. return;
  361. }
  362. n = neigh_lookup(ipv6_stub->nd_tbl, &msg->target, vlandev);
  363. if (n) {
  364. struct net_bridge_fdb_entry *f;
  365. if (!(n->nud_state & NUD_VALID)) {
  366. neigh_release(n);
  367. return;
  368. }
  369. f = br_fdb_find_rcu(br, n->ha, vid);
  370. if (f) {
  371. bool replied = false;
  372. if (f->dst && (f->dst->flags & BR_NEIGH_SUPPRESS)) {
  373. if (vid != 0)
  374. br_nd_send(br, p, skb, n,
  375. skb->vlan_proto,
  376. skb_vlan_tag_get(skb), msg);
  377. else
  378. br_nd_send(br, p, skb, n, 0, 0, msg);
  379. replied = true;
  380. }
  381. /* If we have replied or as long as we know the
  382. * mac, indicate to NEIGH_SUPPRESS ports that we
  383. * have replied
  384. */
  385. if (replied || br->neigh_suppress_enabled)
  386. BR_INPUT_SKB_CB(skb)->proxyarp_replied = true;
  387. }
  388. neigh_release(n);
  389. }
  390. }
  391. #endif