rpl_iptunnel.c 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Authors:
  4. * (C) 2020 Alexander Aring <alex.aring@gmail.com>
  5. */
  6. #include <linux/rpl_iptunnel.h>
  7. #include <net/dst_cache.h>
  8. #include <net/ip6_route.h>
  9. #include <net/lwtunnel.h>
  10. #include <net/ipv6.h>
  11. #include <net/rpl.h>
  12. struct rpl_iptunnel_encap {
  13. DECLARE_FLEX_ARRAY(struct ipv6_rpl_sr_hdr, srh);
  14. };
  15. struct rpl_lwt {
  16. struct dst_cache cache;
  17. struct rpl_iptunnel_encap tuninfo;
  18. };
  19. static inline struct rpl_lwt *rpl_lwt_lwtunnel(struct lwtunnel_state *lwt)
  20. {
  21. return (struct rpl_lwt *)lwt->data;
  22. }
  23. static inline struct rpl_iptunnel_encap *
  24. rpl_encap_lwtunnel(struct lwtunnel_state *lwt)
  25. {
  26. return &rpl_lwt_lwtunnel(lwt)->tuninfo;
  27. }
  28. static const struct nla_policy rpl_iptunnel_policy[RPL_IPTUNNEL_MAX + 1] = {
  29. [RPL_IPTUNNEL_SRH] = { .type = NLA_BINARY },
  30. };
  31. static bool rpl_validate_srh(struct net *net, struct ipv6_rpl_sr_hdr *srh,
  32. size_t seglen)
  33. {
  34. int err;
  35. if ((srh->hdrlen << 3) != seglen)
  36. return false;
  37. /* check at least one segment and seglen fit with segments_left */
  38. if (!srh->segments_left ||
  39. (srh->segments_left * sizeof(struct in6_addr)) != seglen)
  40. return false;
  41. if (srh->cmpri || srh->cmpre)
  42. return false;
  43. err = ipv6_chk_rpl_srh_loop(net, srh->rpl_segaddr,
  44. srh->segments_left);
  45. if (err)
  46. return false;
  47. if (ipv6_addr_type(&srh->rpl_segaddr[srh->segments_left - 1]) &
  48. IPV6_ADDR_MULTICAST)
  49. return false;
  50. return true;
  51. }
  52. static int rpl_build_state(struct net *net, struct nlattr *nla,
  53. unsigned int family, const void *cfg,
  54. struct lwtunnel_state **ts,
  55. struct netlink_ext_ack *extack)
  56. {
  57. struct nlattr *tb[RPL_IPTUNNEL_MAX + 1];
  58. struct lwtunnel_state *newts;
  59. struct ipv6_rpl_sr_hdr *srh;
  60. struct rpl_lwt *rlwt;
  61. int err, srh_len;
  62. if (family != AF_INET6)
  63. return -EINVAL;
  64. err = nla_parse_nested(tb, RPL_IPTUNNEL_MAX, nla,
  65. rpl_iptunnel_policy, extack);
  66. if (err < 0)
  67. return err;
  68. if (!tb[RPL_IPTUNNEL_SRH])
  69. return -EINVAL;
  70. srh = nla_data(tb[RPL_IPTUNNEL_SRH]);
  71. srh_len = nla_len(tb[RPL_IPTUNNEL_SRH]);
  72. if (srh_len < sizeof(*srh))
  73. return -EINVAL;
  74. /* verify that SRH is consistent */
  75. if (!rpl_validate_srh(net, srh, srh_len - sizeof(*srh)))
  76. return -EINVAL;
  77. newts = lwtunnel_state_alloc(srh_len + sizeof(*rlwt));
  78. if (!newts)
  79. return -ENOMEM;
  80. rlwt = rpl_lwt_lwtunnel(newts);
  81. err = dst_cache_init(&rlwt->cache, GFP_ATOMIC);
  82. if (err) {
  83. kfree(newts);
  84. return err;
  85. }
  86. memcpy(&rlwt->tuninfo.srh, srh, srh_len);
  87. newts->type = LWTUNNEL_ENCAP_RPL;
  88. newts->flags |= LWTUNNEL_STATE_INPUT_REDIRECT;
  89. newts->flags |= LWTUNNEL_STATE_OUTPUT_REDIRECT;
  90. *ts = newts;
  91. return 0;
  92. }
  93. static void rpl_destroy_state(struct lwtunnel_state *lwt)
  94. {
  95. dst_cache_destroy(&rpl_lwt_lwtunnel(lwt)->cache);
  96. }
  97. static int rpl_do_srh_inline(struct sk_buff *skb, const struct rpl_lwt *rlwt,
  98. const struct ipv6_rpl_sr_hdr *srh,
  99. struct dst_entry *cache_dst)
  100. {
  101. struct ipv6_rpl_sr_hdr *isrh, *csrh;
  102. struct ipv6hdr oldhdr;
  103. struct ipv6hdr *hdr;
  104. unsigned char *buf;
  105. size_t hdrlen;
  106. int err;
  107. memcpy(&oldhdr, ipv6_hdr(skb), sizeof(oldhdr));
  108. buf = kcalloc(struct_size(srh, segments.addr, srh->segments_left), 2, GFP_ATOMIC);
  109. if (!buf)
  110. return -ENOMEM;
  111. isrh = (struct ipv6_rpl_sr_hdr *)buf;
  112. csrh = (struct ipv6_rpl_sr_hdr *)(buf + ((srh->hdrlen + 1) << 3));
  113. memcpy(isrh, srh, sizeof(*isrh));
  114. memcpy(isrh->rpl_segaddr, &srh->rpl_segaddr[1],
  115. (srh->segments_left - 1) * 16);
  116. isrh->rpl_segaddr[srh->segments_left - 1] = oldhdr.daddr;
  117. ipv6_rpl_srh_compress(csrh, isrh, &srh->rpl_segaddr[0],
  118. isrh->segments_left - 1);
  119. hdrlen = ((csrh->hdrlen + 1) << 3);
  120. err = skb_cow_head(skb, hdrlen + dst_dev_overhead(cache_dst, skb));
  121. if (unlikely(err)) {
  122. kfree(buf);
  123. return err;
  124. }
  125. skb_pull(skb, sizeof(struct ipv6hdr));
  126. skb_postpull_rcsum(skb, skb_network_header(skb),
  127. sizeof(struct ipv6hdr));
  128. skb_push(skb, sizeof(struct ipv6hdr) + hdrlen);
  129. skb_reset_network_header(skb);
  130. skb_mac_header_rebuild(skb);
  131. hdr = ipv6_hdr(skb);
  132. memmove(hdr, &oldhdr, sizeof(*hdr));
  133. isrh = (void *)hdr + sizeof(*hdr);
  134. memcpy(isrh, csrh, hdrlen);
  135. isrh->nexthdr = hdr->nexthdr;
  136. hdr->nexthdr = NEXTHDR_ROUTING;
  137. hdr->daddr = srh->rpl_segaddr[0];
  138. ipv6_hdr(skb)->payload_len = htons(skb->len - sizeof(struct ipv6hdr));
  139. skb_set_transport_header(skb, sizeof(struct ipv6hdr));
  140. skb_postpush_rcsum(skb, hdr, sizeof(struct ipv6hdr) + hdrlen);
  141. kfree(buf);
  142. return 0;
  143. }
  144. static int rpl_do_srh(struct sk_buff *skb, const struct rpl_lwt *rlwt,
  145. struct dst_entry *cache_dst)
  146. {
  147. struct dst_entry *dst = skb_dst(skb);
  148. struct rpl_iptunnel_encap *tinfo;
  149. if (skb->protocol != htons(ETH_P_IPV6))
  150. return -EINVAL;
  151. tinfo = rpl_encap_lwtunnel(dst->lwtstate);
  152. return rpl_do_srh_inline(skb, rlwt, tinfo->srh, cache_dst);
  153. }
  154. static int rpl_output(struct net *net, struct sock *sk, struct sk_buff *skb)
  155. {
  156. struct dst_entry *orig_dst = skb_dst(skb);
  157. struct dst_entry *dst = NULL;
  158. struct rpl_lwt *rlwt;
  159. int err;
  160. rlwt = rpl_lwt_lwtunnel(orig_dst->lwtstate);
  161. local_bh_disable();
  162. dst = dst_cache_get(&rlwt->cache);
  163. local_bh_enable();
  164. err = rpl_do_srh(skb, rlwt, dst);
  165. if (unlikely(err))
  166. goto drop;
  167. if (unlikely(!dst)) {
  168. struct ipv6hdr *hdr = ipv6_hdr(skb);
  169. struct flowi6 fl6;
  170. memset(&fl6, 0, sizeof(fl6));
  171. fl6.daddr = hdr->daddr;
  172. fl6.saddr = hdr->saddr;
  173. fl6.flowlabel = ip6_flowinfo(hdr);
  174. fl6.flowi6_mark = skb->mark;
  175. fl6.flowi6_proto = hdr->nexthdr;
  176. dst = ip6_route_output(net, NULL, &fl6);
  177. if (dst->error) {
  178. err = dst->error;
  179. goto drop;
  180. }
  181. /* cache only if we don't create a dst reference loop */
  182. if (orig_dst->lwtstate != dst->lwtstate) {
  183. local_bh_disable();
  184. dst_cache_set_ip6(&rlwt->cache, dst, &fl6.saddr);
  185. local_bh_enable();
  186. }
  187. err = skb_cow_head(skb, LL_RESERVED_SPACE(dst_dev(dst)));
  188. if (unlikely(err))
  189. goto drop;
  190. }
  191. skb_dst_drop(skb);
  192. skb_dst_set(skb, dst);
  193. return dst_output(net, sk, skb);
  194. drop:
  195. dst_release(dst);
  196. kfree_skb(skb);
  197. return err;
  198. }
  199. static int rpl_input(struct sk_buff *skb)
  200. {
  201. struct dst_entry *orig_dst = skb_dst(skb);
  202. struct dst_entry *dst = NULL;
  203. struct lwtunnel_state *lwtst;
  204. struct rpl_lwt *rlwt;
  205. int err;
  206. /* We cannot dereference "orig_dst" once ip6_route_input() or
  207. * skb_dst_drop() is called. However, in order to detect a dst loop, we
  208. * need the address of its lwtstate. So, save the address of lwtstate
  209. * now and use it later as a comparison.
  210. */
  211. lwtst = orig_dst->lwtstate;
  212. rlwt = rpl_lwt_lwtunnel(lwtst);
  213. local_bh_disable();
  214. dst = dst_cache_get(&rlwt->cache);
  215. local_bh_enable();
  216. err = rpl_do_srh(skb, rlwt, dst);
  217. if (unlikely(err)) {
  218. dst_release(dst);
  219. goto drop;
  220. }
  221. if (!dst) {
  222. ip6_route_input(skb);
  223. dst = skb_dst(skb);
  224. /* cache only if we don't create a dst reference loop */
  225. if (!dst->error && lwtst != dst->lwtstate) {
  226. local_bh_disable();
  227. dst_cache_set_ip6(&rlwt->cache, dst,
  228. &ipv6_hdr(skb)->saddr);
  229. local_bh_enable();
  230. }
  231. err = skb_cow_head(skb, LL_RESERVED_SPACE(dst_dev(dst)));
  232. if (unlikely(err))
  233. goto drop;
  234. } else {
  235. skb_dst_drop(skb);
  236. skb_dst_set(skb, dst);
  237. }
  238. return dst_input(skb);
  239. drop:
  240. kfree_skb(skb);
  241. return err;
  242. }
  243. static int nla_put_rpl_srh(struct sk_buff *skb, int attrtype,
  244. struct rpl_iptunnel_encap *tuninfo)
  245. {
  246. struct rpl_iptunnel_encap *data;
  247. struct nlattr *nla;
  248. int len;
  249. len = RPL_IPTUNNEL_SRH_SIZE(tuninfo->srh);
  250. nla = nla_reserve(skb, attrtype, len);
  251. if (!nla)
  252. return -EMSGSIZE;
  253. data = nla_data(nla);
  254. memcpy(data, tuninfo->srh, len);
  255. return 0;
  256. }
  257. static int rpl_fill_encap_info(struct sk_buff *skb,
  258. struct lwtunnel_state *lwtstate)
  259. {
  260. struct rpl_iptunnel_encap *tuninfo = rpl_encap_lwtunnel(lwtstate);
  261. if (nla_put_rpl_srh(skb, RPL_IPTUNNEL_SRH, tuninfo))
  262. return -EMSGSIZE;
  263. return 0;
  264. }
  265. static int rpl_encap_nlsize(struct lwtunnel_state *lwtstate)
  266. {
  267. struct rpl_iptunnel_encap *tuninfo = rpl_encap_lwtunnel(lwtstate);
  268. return nla_total_size(RPL_IPTUNNEL_SRH_SIZE(tuninfo->srh));
  269. }
  270. static int rpl_encap_cmp(struct lwtunnel_state *a, struct lwtunnel_state *b)
  271. {
  272. struct rpl_iptunnel_encap *a_hdr = rpl_encap_lwtunnel(a);
  273. struct rpl_iptunnel_encap *b_hdr = rpl_encap_lwtunnel(b);
  274. int len = RPL_IPTUNNEL_SRH_SIZE(a_hdr->srh);
  275. if (len != RPL_IPTUNNEL_SRH_SIZE(b_hdr->srh))
  276. return 1;
  277. return memcmp(a_hdr, b_hdr, len);
  278. }
  279. static const struct lwtunnel_encap_ops rpl_ops = {
  280. .build_state = rpl_build_state,
  281. .destroy_state = rpl_destroy_state,
  282. .output = rpl_output,
  283. .input = rpl_input,
  284. .fill_encap = rpl_fill_encap_info,
  285. .get_encap_size = rpl_encap_nlsize,
  286. .cmp_encap = rpl_encap_cmp,
  287. .owner = THIS_MODULE,
  288. };
  289. int __init rpl_init(void)
  290. {
  291. int err;
  292. err = lwtunnel_encap_add_ops(&rpl_ops, LWTUNNEL_ENCAP_RPL);
  293. if (err)
  294. goto out;
  295. pr_info("RPL Segment Routing with IPv6\n");
  296. return 0;
  297. out:
  298. return err;
  299. }
  300. void rpl_exit(void)
  301. {
  302. lwtunnel_encap_del_ops(&rpl_ops, LWTUNNEL_ENCAP_RPL);
  303. }