br_arp_nd_proxy.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517
  1. // SPDX-License-Identifier: GPL-2.0-or-later
  2. /*
  3. * Handle bridge arp/nd proxy/suppress
  4. *
  5. * Copyright (C) 2017 Cumulus Networks
  6. * Copyright (c) 2017 Roopa Prabhu <roopa@cumulusnetworks.com>
  7. *
  8. * Authors:
  9. * Roopa Prabhu <roopa@cumulusnetworks.com>
  10. */
  11. #include <linux/kernel.h>
  12. #include <linux/netdevice.h>
  13. #include <linux/etherdevice.h>
  14. #include <linux/neighbour.h>
  15. #include <net/arp.h>
  16. #include <linux/if_vlan.h>
  17. #include <linux/inetdevice.h>
  18. #include <net/addrconf.h>
  19. #include <net/ipv6_stubs.h>
  20. #if IS_ENABLED(CONFIG_IPV6)
  21. #include <net/ip6_checksum.h>
  22. #endif
  23. #include "br_private.h"
  24. void br_recalculate_neigh_suppress_enabled(struct net_bridge *br)
  25. {
  26. struct net_bridge_port *p;
  27. bool neigh_suppress = false;
  28. list_for_each_entry(p, &br->port_list, list) {
  29. if (p->flags & (BR_NEIGH_SUPPRESS | BR_NEIGH_VLAN_SUPPRESS)) {
  30. neigh_suppress = true;
  31. break;
  32. }
  33. }
  34. br_opt_toggle(br, BROPT_NEIGH_SUPPRESS_ENABLED, neigh_suppress);
  35. }
  36. #if IS_ENABLED(CONFIG_INET)
  37. static void br_arp_send(struct net_bridge *br, struct net_bridge_port *p,
  38. struct net_device *dev, __be32 dest_ip, __be32 src_ip,
  39. const unsigned char *dest_hw,
  40. const unsigned char *src_hw,
  41. const unsigned char *target_hw,
  42. __be16 vlan_proto, u16 vlan_tci)
  43. {
  44. struct net_bridge_vlan_group *vg;
  45. struct sk_buff *skb;
  46. u16 pvid;
  47. netdev_dbg(dev, "arp send dev %s dst %pI4 dst_hw %pM src %pI4 src_hw %pM\n",
  48. dev->name, &dest_ip, dest_hw, &src_ip, src_hw);
  49. if (!vlan_tci) {
  50. arp_send(ARPOP_REPLY, ETH_P_ARP, dest_ip, dev, src_ip,
  51. dest_hw, src_hw, target_hw);
  52. return;
  53. }
  54. skb = arp_create(ARPOP_REPLY, ETH_P_ARP, dest_ip, dev, src_ip,
  55. dest_hw, src_hw, target_hw);
  56. if (!skb)
  57. return;
  58. if (p)
  59. vg = nbp_vlan_group_rcu(p);
  60. else
  61. vg = br_vlan_group_rcu(br);
  62. pvid = br_get_pvid(vg);
  63. if (pvid == (vlan_tci & VLAN_VID_MASK))
  64. vlan_tci = 0;
  65. if (vlan_tci)
  66. __vlan_hwaccel_put_tag(skb, vlan_proto, vlan_tci);
  67. if (p) {
  68. arp_xmit(skb);
  69. } else {
  70. skb_reset_mac_header(skb);
  71. __skb_pull(skb, skb_network_offset(skb));
  72. skb->ip_summed = CHECKSUM_UNNECESSARY;
  73. skb->pkt_type = PACKET_HOST;
  74. netif_rx(skb);
  75. }
  76. }
  77. static int br_chk_addr_ip(struct net_device *dev,
  78. struct netdev_nested_priv *priv)
  79. {
  80. __be32 ip = *(__be32 *)priv->data;
  81. struct in_device *in_dev;
  82. __be32 addr = 0;
  83. in_dev = __in_dev_get_rcu(dev);
  84. if (in_dev)
  85. addr = inet_confirm_addr(dev_net(dev), in_dev, 0, ip,
  86. RT_SCOPE_HOST);
  87. if (addr == ip)
  88. return 1;
  89. return 0;
  90. }
  91. static bool br_is_local_ip(struct net_device *dev, __be32 ip)
  92. {
  93. struct netdev_nested_priv priv = {
  94. .data = (void *)&ip,
  95. };
  96. if (br_chk_addr_ip(dev, &priv))
  97. return true;
  98. /* check if ip is configured on upper dev */
  99. if (netdev_walk_all_upper_dev_rcu(dev, br_chk_addr_ip, &priv))
  100. return true;
  101. return false;
  102. }
  103. void br_do_proxy_suppress_arp(struct sk_buff *skb, struct net_bridge *br,
  104. u16 vid, struct net_bridge_port *p)
  105. {
  106. struct net_device *dev = br->dev;
  107. struct net_device *vlandev = dev;
  108. struct neighbour *n;
  109. struct arphdr *parp;
  110. u8 *arpptr, *sha;
  111. __be32 sip, tip;
  112. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 0;
  113. if ((dev->flags & IFF_NOARP) ||
  114. !pskb_may_pull(skb, arp_hdr_len(dev)))
  115. return;
  116. parp = arp_hdr(skb);
  117. if (parp->ar_pro != htons(ETH_P_IP) ||
  118. parp->ar_hln != dev->addr_len ||
  119. parp->ar_pln != 4)
  120. return;
  121. arpptr = (u8 *)parp + sizeof(struct arphdr);
  122. sha = arpptr;
  123. arpptr += dev->addr_len; /* sha */
  124. memcpy(&sip, arpptr, sizeof(sip));
  125. arpptr += sizeof(sip);
  126. arpptr += dev->addr_len; /* tha */
  127. memcpy(&tip, arpptr, sizeof(tip));
  128. if (ipv4_is_loopback(tip) ||
  129. ipv4_is_multicast(tip))
  130. return;
  131. if (br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED)) {
  132. if (br_is_neigh_suppress_enabled(p, vid))
  133. return;
  134. if (is_unicast_ether_addr(eth_hdr(skb)->h_dest) &&
  135. parp->ar_op == htons(ARPOP_REQUEST))
  136. return;
  137. if (parp->ar_op != htons(ARPOP_RREQUEST) &&
  138. parp->ar_op != htons(ARPOP_RREPLY) &&
  139. (ipv4_is_zeronet(sip) || sip == tip)) {
  140. /* prevent flooding to neigh suppress ports */
  141. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  142. return;
  143. }
  144. }
  145. if (parp->ar_op != htons(ARPOP_REQUEST))
  146. return;
  147. if (vid != 0) {
  148. vlandev = __vlan_find_dev_deep_rcu(br->dev, skb->vlan_proto,
  149. vid);
  150. if (!vlandev)
  151. return;
  152. }
  153. if (br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED) &&
  154. br_is_local_ip(vlandev, tip)) {
  155. /* its our local ip, so don't proxy reply
  156. * and don't forward to neigh suppress ports
  157. */
  158. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  159. return;
  160. }
  161. n = neigh_lookup(&arp_tbl, &tip, vlandev);
  162. if (n) {
  163. struct net_bridge_fdb_entry *f;
  164. if (!(READ_ONCE(n->nud_state) & NUD_VALID)) {
  165. neigh_release(n);
  166. return;
  167. }
  168. f = br_fdb_find_rcu(br, n->ha, vid);
  169. if (f) {
  170. bool replied = false;
  171. if ((p && (p->flags & BR_PROXYARP)) ||
  172. (f->dst && (f->dst->flags & BR_PROXYARP_WIFI)) ||
  173. br_is_neigh_suppress_enabled(f->dst, vid)) {
  174. if (!vid)
  175. br_arp_send(br, p, skb->dev, sip, tip,
  176. sha, n->ha, sha, 0, 0);
  177. else
  178. br_arp_send(br, p, skb->dev, sip, tip,
  179. sha, n->ha, sha,
  180. skb->vlan_proto,
  181. skb_vlan_tag_get(skb));
  182. replied = true;
  183. }
  184. /* If we have replied or as long as we know the
  185. * mac, indicate to arp replied
  186. */
  187. if (replied ||
  188. br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED))
  189. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  190. }
  191. neigh_release(n);
  192. }
  193. }
  194. #endif
  195. #if IS_ENABLED(CONFIG_IPV6)
  196. struct nd_msg *br_is_nd_neigh_msg(const struct sk_buff *skb, struct nd_msg *msg)
  197. {
  198. struct nd_msg *m;
  199. m = skb_header_pointer(skb, skb_network_offset(skb) +
  200. sizeof(struct ipv6hdr), sizeof(*msg), msg);
  201. if (!m)
  202. return NULL;
  203. if (m->icmph.icmp6_code != 0 ||
  204. (m->icmph.icmp6_type != NDISC_NEIGHBOUR_SOLICITATION &&
  205. m->icmph.icmp6_type != NDISC_NEIGHBOUR_ADVERTISEMENT))
  206. return NULL;
  207. return m;
  208. }
  209. static void br_nd_send(struct net_bridge *br, struct net_bridge_port *p,
  210. struct sk_buff *request, struct neighbour *n,
  211. __be16 vlan_proto, u16 vlan_tci)
  212. {
  213. struct net_device *dev = request->dev;
  214. struct net_bridge_vlan_group *vg;
  215. struct nd_msg *na, *ns;
  216. struct sk_buff *reply;
  217. struct ipv6hdr *pip6;
  218. int na_olen = 8; /* opt hdr + ETH_ALEN for target */
  219. int ns_olen;
  220. int i, len;
  221. u8 *daddr;
  222. u16 pvid;
  223. if (!dev || skb_linearize(request))
  224. return;
  225. len = LL_RESERVED_SPACE(dev) + sizeof(struct ipv6hdr) +
  226. sizeof(*na) + na_olen + dev->needed_tailroom;
  227. reply = alloc_skb(len, GFP_ATOMIC);
  228. if (!reply)
  229. return;
  230. reply->protocol = htons(ETH_P_IPV6);
  231. reply->dev = dev;
  232. skb_reserve(reply, LL_RESERVED_SPACE(dev));
  233. skb_push(reply, sizeof(struct ethhdr));
  234. skb_set_mac_header(reply, 0);
  235. daddr = eth_hdr(request)->h_source;
  236. ns = (struct nd_msg *)(skb_network_header(request) +
  237. sizeof(struct ipv6hdr));
  238. /* Do we need option processing ? */
  239. ns_olen = request->len - (skb_network_offset(request) +
  240. sizeof(struct ipv6hdr)) - sizeof(*ns);
  241. for (i = 0; i < ns_olen - 1; i += (ns->opt[i + 1] << 3)) {
  242. if (!ns->opt[i + 1] || i + (ns->opt[i + 1] << 3) > ns_olen) {
  243. kfree_skb(reply);
  244. return;
  245. }
  246. if (ns->opt[i] == ND_OPT_SOURCE_LL_ADDR) {
  247. if ((ns->opt[i + 1] << 3) >=
  248. sizeof(struct nd_opt_hdr) + ETH_ALEN)
  249. daddr = ns->opt + i + sizeof(struct nd_opt_hdr);
  250. break;
  251. }
  252. }
  253. /* Ethernet header */
  254. ether_addr_copy(eth_hdr(reply)->h_dest, daddr);
  255. ether_addr_copy(eth_hdr(reply)->h_source, n->ha);
  256. eth_hdr(reply)->h_proto = htons(ETH_P_IPV6);
  257. reply->protocol = htons(ETH_P_IPV6);
  258. skb_pull(reply, sizeof(struct ethhdr));
  259. skb_set_network_header(reply, 0);
  260. skb_put(reply, sizeof(struct ipv6hdr));
  261. /* IPv6 header */
  262. pip6 = ipv6_hdr(reply);
  263. memset(pip6, 0, sizeof(struct ipv6hdr));
  264. pip6->version = 6;
  265. pip6->priority = ipv6_hdr(request)->priority;
  266. pip6->nexthdr = IPPROTO_ICMPV6;
  267. pip6->hop_limit = 255;
  268. pip6->daddr = ipv6_hdr(request)->saddr;
  269. pip6->saddr = *(struct in6_addr *)n->primary_key;
  270. skb_pull(reply, sizeof(struct ipv6hdr));
  271. skb_set_transport_header(reply, 0);
  272. na = (struct nd_msg *)skb_put(reply, sizeof(*na) + na_olen);
  273. /* Neighbor Advertisement */
  274. memset(na, 0, sizeof(*na) + na_olen);
  275. na->icmph.icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT;
  276. na->icmph.icmp6_router = (n->flags & NTF_ROUTER) ? 1 : 0;
  277. na->icmph.icmp6_override = 1;
  278. na->icmph.icmp6_solicited = 1;
  279. na->target = ns->target;
  280. ether_addr_copy(&na->opt[2], n->ha);
  281. na->opt[0] = ND_OPT_TARGET_LL_ADDR;
  282. na->opt[1] = na_olen >> 3;
  283. na->icmph.icmp6_cksum = csum_ipv6_magic(&pip6->saddr,
  284. &pip6->daddr,
  285. sizeof(*na) + na_olen,
  286. IPPROTO_ICMPV6,
  287. csum_partial(na, sizeof(*na) + na_olen, 0));
  288. pip6->payload_len = htons(sizeof(*na) + na_olen);
  289. skb_push(reply, sizeof(struct ipv6hdr));
  290. skb_push(reply, sizeof(struct ethhdr));
  291. reply->ip_summed = CHECKSUM_UNNECESSARY;
  292. if (p)
  293. vg = nbp_vlan_group_rcu(p);
  294. else
  295. vg = br_vlan_group_rcu(br);
  296. pvid = br_get_pvid(vg);
  297. if (pvid == (vlan_tci & VLAN_VID_MASK))
  298. vlan_tci = 0;
  299. if (vlan_tci)
  300. __vlan_hwaccel_put_tag(reply, vlan_proto, vlan_tci);
  301. netdev_dbg(dev, "nd send dev %s dst %pI6 dst_hw %pM src %pI6 src_hw %pM\n",
  302. dev->name, &pip6->daddr, daddr, &pip6->saddr, n->ha);
  303. if (p) {
  304. dev_queue_xmit(reply);
  305. } else {
  306. skb_reset_mac_header(reply);
  307. __skb_pull(reply, skb_network_offset(reply));
  308. reply->ip_summed = CHECKSUM_UNNECESSARY;
  309. reply->pkt_type = PACKET_HOST;
  310. netif_rx(reply);
  311. }
  312. }
  313. static int br_chk_addr_ip6(struct net_device *dev,
  314. struct netdev_nested_priv *priv)
  315. {
  316. struct in6_addr *addr = (struct in6_addr *)priv->data;
  317. if (ipv6_chk_addr(dev_net(dev), addr, dev, 0))
  318. return 1;
  319. return 0;
  320. }
  321. static bool br_is_local_ip6(struct net_device *dev, struct in6_addr *addr)
  322. {
  323. struct netdev_nested_priv priv = {
  324. .data = (void *)addr,
  325. };
  326. if (br_chk_addr_ip6(dev, &priv))
  327. return true;
  328. /* check if ip is configured on upper dev */
  329. if (netdev_walk_all_upper_dev_rcu(dev, br_chk_addr_ip6, &priv))
  330. return true;
  331. return false;
  332. }
  333. void br_do_suppress_nd(struct sk_buff *skb, struct net_bridge *br,
  334. u16 vid, struct net_bridge_port *p, struct nd_msg *msg)
  335. {
  336. struct net_device *dev = br->dev;
  337. struct net_device *vlandev = NULL;
  338. struct in6_addr *saddr, *daddr;
  339. struct ipv6hdr *iphdr;
  340. struct neighbour *n;
  341. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 0;
  342. if (br_is_neigh_suppress_enabled(p, vid))
  343. return;
  344. if (is_unicast_ether_addr(eth_hdr(skb)->h_dest) &&
  345. msg->icmph.icmp6_type == NDISC_NEIGHBOUR_SOLICITATION)
  346. return;
  347. if (msg->icmph.icmp6_type == NDISC_NEIGHBOUR_ADVERTISEMENT &&
  348. !msg->icmph.icmp6_solicited) {
  349. /* prevent flooding to neigh suppress ports */
  350. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  351. return;
  352. }
  353. if (msg->icmph.icmp6_type != NDISC_NEIGHBOUR_SOLICITATION)
  354. return;
  355. iphdr = ipv6_hdr(skb);
  356. saddr = &iphdr->saddr;
  357. daddr = &iphdr->daddr;
  358. if (ipv6_addr_any(saddr) || !ipv6_addr_cmp(saddr, daddr)) {
  359. /* prevent flooding to neigh suppress ports */
  360. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  361. return;
  362. }
  363. if (vid != 0) {
  364. /* build neigh table lookup on the vlan device */
  365. vlandev = __vlan_find_dev_deep_rcu(br->dev, skb->vlan_proto,
  366. vid);
  367. if (!vlandev)
  368. return;
  369. } else {
  370. vlandev = dev;
  371. }
  372. if (br_is_local_ip6(vlandev, &msg->target)) {
  373. /* its our own ip, so don't proxy reply
  374. * and don't forward to arp suppress ports
  375. */
  376. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  377. return;
  378. }
  379. n = neigh_lookup(ipv6_stub->nd_tbl, &msg->target, vlandev);
  380. if (n) {
  381. struct net_bridge_fdb_entry *f;
  382. if (!(READ_ONCE(n->nud_state) & NUD_VALID)) {
  383. neigh_release(n);
  384. return;
  385. }
  386. f = br_fdb_find_rcu(br, n->ha, vid);
  387. if (f) {
  388. bool replied = false;
  389. if (br_is_neigh_suppress_enabled(f->dst, vid)) {
  390. if (vid != 0)
  391. br_nd_send(br, p, skb, n,
  392. skb->vlan_proto,
  393. skb_vlan_tag_get(skb));
  394. else
  395. br_nd_send(br, p, skb, n, 0, 0);
  396. replied = true;
  397. }
  398. /* If we have replied or as long as we know the
  399. * mac, indicate to NEIGH_SUPPRESS ports that we
  400. * have replied
  401. */
  402. if (replied ||
  403. br_opt_get(br, BROPT_NEIGH_SUPPRESS_ENABLED))
  404. BR_INPUT_SKB_CB(skb)->proxyarp_replied = 1;
  405. }
  406. neigh_release(n);
  407. }
  408. }
  409. #endif
  410. bool br_is_neigh_suppress_enabled(const struct net_bridge_port *p, u16 vid)
  411. {
  412. if (!p)
  413. return false;
  414. if (!vid)
  415. return !!(p->flags & BR_NEIGH_SUPPRESS);
  416. if (p->flags & BR_NEIGH_VLAN_SUPPRESS) {
  417. struct net_bridge_vlan_group *vg = nbp_vlan_group_rcu(p);
  418. struct net_bridge_vlan *v;
  419. v = br_vlan_find(vg, vid);
  420. if (!v)
  421. return false;
  422. return !!(v->priv_flags & BR_VLFLAG_NEIGH_SUPPRESS_ENABLED);
  423. } else {
  424. return !!(p->flags & BR_NEIGH_SUPPRESS);
  425. }
  426. }