page_pool_user.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441
  1. // SPDX-License-Identifier: GPL-2.0
  2. #include <linux/mutex.h>
  3. #include <linux/netdevice.h>
  4. #include <linux/xarray.h>
  5. #include <net/busy_poll.h>
  6. #include <net/net_debug.h>
  7. #include <net/netdev_rx_queue.h>
  8. #include <net/page_pool/helpers.h>
  9. #include <net/page_pool/types.h>
  10. #include <net/page_pool/memory_provider.h>
  11. #include <net/sock.h>
  12. #include "page_pool_priv.h"
  13. #include "netdev-genl-gen.h"
  /* Registry of listed page pools, indexed by pool->user.id. Entries are
   * inserted by page_pool_list(), looked up by the netlink "get" handlers and
   * removed by page_pool_unlist().
   */
  static DEFINE_XARRAY_FLAGS(page_pools, XA_FLAGS_ALLOC1);

  /* Protects:
   *  - page_pools
   *  - netdevice->page_pools
   *  - pool->p.napi
   *  - pool->slow.netdev
   *  - pool->user
   * Ordering: nests inside rtnl_lock.
   */
  DEFINE_MUTEX(page_pools_lock);
  /* Page pools are only reachable from user space (via netlink) if they are
   * linked to a netdev at creation time. The following page pool "visibility"
   * states are possible:
   *   - normal
   *     - user.list: linked to real netdev, netdev: real netdev
   *   - orphaned - real netdev has disappeared
   *     - user.list: linked to lo, netdev: lo
   *   - invisible - either (a) created without netdev linking, (b) unlisted due
   *     to error, or (c) the entire namespace which owned this pool disappeared
   *     - user.list: unhashed, netdev: unknown
   */
  /* Callback that serialises one page pool into a netlink message.
   * @rsp:  message buffer being filled
   * @pool: page pool to describe
   * @info: generic netlink request/notification info
   *
   * The do/dump helpers in this file treat a zero return as success and abort
   * on any non-zero value, which they pass back to their caller.
   */
  typedef int (*pp_nl_fill_cb)(struct sk_buff *rsp,
                               const struct page_pool *pool,
                               const struct genl_info *info);
  33. static int
  34. netdev_nl_page_pool_get_do(struct genl_info *info, u32 id, pp_nl_fill_cb fill)
  35. {
  36. struct page_pool *pool;
  37. struct sk_buff *rsp;
  38. int err;
  39. mutex_lock(&page_pools_lock);
  40. pool = xa_load(&page_pools, id);
  41. if (!pool || hlist_unhashed(&pool->user.list) ||
  42. !net_eq(dev_net(pool->slow.netdev), genl_info_net(info))) {
  43. err = -ENOENT;
  44. goto err_unlock;
  45. }
  46. rsp = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
  47. if (!rsp) {
  48. err = -ENOMEM;
  49. goto err_unlock;
  50. }
  51. err = fill(rsp, pool, info);
  52. if (err)
  53. goto err_free_msg;
  54. mutex_unlock(&page_pools_lock);
  55. return genlmsg_reply(rsp, info);
  56. err_free_msg:
  57. nlmsg_free(rsp);
  58. err_unlock:
  59. mutex_unlock(&page_pools_lock);
  60. return err;
  61. }
  62. struct page_pool_dump_cb {
  63. unsigned long ifindex;
  64. u32 pp_id;
  65. };
  66. static int
  67. netdev_nl_page_pool_get_dump(struct sk_buff *skb, struct netlink_callback *cb,
  68. pp_nl_fill_cb fill)
  69. {
  70. struct page_pool_dump_cb *state = (void *)cb->ctx;
  71. const struct genl_info *info = genl_info_dump(cb);
  72. struct net *net = sock_net(skb->sk);
  73. struct net_device *netdev;
  74. struct page_pool *pool;
  75. int err = 0;
  76. rtnl_lock();
  77. mutex_lock(&page_pools_lock);
  78. for_each_netdev_dump(net, netdev, state->ifindex) {
  79. hlist_for_each_entry(pool, &netdev->page_pools, user.list) {
  80. if (state->pp_id && state->pp_id < pool->user.id)
  81. continue;
  82. state->pp_id = pool->user.id;
  83. err = fill(skb, pool, info);
  84. if (err)
  85. goto out;
  86. }
  87. state->pp_id = 0;
  88. }
  89. out:
  90. mutex_unlock(&page_pools_lock);
  91. rtnl_unlock();
  92. return err;
  93. }
  94. static int
  95. page_pool_nl_stats_fill(struct sk_buff *rsp, const struct page_pool *pool,
  96. const struct genl_info *info)
  97. {
  98. #ifdef CONFIG_PAGE_POOL_STATS
  99. struct page_pool_stats stats = {};
  100. struct nlattr *nest;
  101. void *hdr;
  102. if (!page_pool_get_stats(pool, &stats))
  103. return 0;
  104. hdr = genlmsg_iput(rsp, info);
  105. if (!hdr)
  106. return -EMSGSIZE;
  107. nest = nla_nest_start(rsp, NETDEV_A_PAGE_POOL_STATS_INFO);
  108. if (nla_put_uint(rsp, NETDEV_A_PAGE_POOL_ID, pool->user.id) ||
  109. (pool->slow.netdev->ifindex != LOOPBACK_IFINDEX &&
  110. nla_put_u32(rsp, NETDEV_A_PAGE_POOL_IFINDEX,
  111. pool->slow.netdev->ifindex)))
  112. goto err_cancel_nest;
  113. nla_nest_end(rsp, nest);
  114. if (nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_FAST,
  115. stats.alloc_stats.fast) ||
  116. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_SLOW,
  117. stats.alloc_stats.slow) ||
  118. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_SLOW_HIGH_ORDER,
  119. stats.alloc_stats.slow_high_order) ||
  120. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_EMPTY,
  121. stats.alloc_stats.empty) ||
  122. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_REFILL,
  123. stats.alloc_stats.refill) ||
  124. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_ALLOC_WAIVE,
  125. stats.alloc_stats.waive) ||
  126. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_RECYCLE_CACHED,
  127. stats.recycle_stats.cached) ||
  128. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_RECYCLE_CACHE_FULL,
  129. stats.recycle_stats.cache_full) ||
  130. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_RECYCLE_RING,
  131. stats.recycle_stats.ring) ||
  132. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_RECYCLE_RING_FULL,
  133. stats.recycle_stats.ring_full) ||
  134. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_STATS_RECYCLE_RELEASED_REFCNT,
  135. stats.recycle_stats.released_refcnt))
  136. goto err_cancel_msg;
  137. genlmsg_end(rsp, hdr);
  138. return 0;
  139. err_cancel_nest:
  140. nla_nest_cancel(rsp, nest);
  141. err_cancel_msg:
  142. genlmsg_cancel(rsp, hdr);
  143. return -EMSGSIZE;
  144. #else
  145. GENL_SET_ERR_MSG(info, "kernel built without CONFIG_PAGE_POOL_STATS");
  146. return -EOPNOTSUPP;
  147. #endif
  148. }
  149. int netdev_nl_page_pool_stats_get_doit(struct sk_buff *skb,
  150. struct genl_info *info)
  151. {
  152. struct nlattr *tb[ARRAY_SIZE(netdev_page_pool_info_nl_policy)];
  153. struct nlattr *nest;
  154. int err;
  155. u32 id;
  156. if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_PAGE_POOL_STATS_INFO))
  157. return -EINVAL;
  158. nest = info->attrs[NETDEV_A_PAGE_POOL_STATS_INFO];
  159. err = nla_parse_nested(tb, ARRAY_SIZE(tb) - 1, nest,
  160. netdev_page_pool_info_nl_policy,
  161. info->extack);
  162. if (err)
  163. return err;
  164. if (NL_REQ_ATTR_CHECK(info->extack, nest, tb, NETDEV_A_PAGE_POOL_ID))
  165. return -EINVAL;
  166. if (tb[NETDEV_A_PAGE_POOL_IFINDEX]) {
  167. NL_SET_ERR_MSG_ATTR(info->extack,
  168. tb[NETDEV_A_PAGE_POOL_IFINDEX],
  169. "selecting by ifindex not supported");
  170. return -EINVAL;
  171. }
  172. id = nla_get_uint(tb[NETDEV_A_PAGE_POOL_ID]);
  173. return netdev_nl_page_pool_get_do(info, id, page_pool_nl_stats_fill);
  174. }
  175. int netdev_nl_page_pool_stats_get_dumpit(struct sk_buff *skb,
  176. struct netlink_callback *cb)
  177. {
  178. return netdev_nl_page_pool_get_dump(skb, cb, page_pool_nl_stats_fill);
  179. }
  180. static int
  181. page_pool_nl_fill(struct sk_buff *rsp, const struct page_pool *pool,
  182. const struct genl_info *info)
  183. {
  184. size_t inflight, refsz;
  185. unsigned int napi_id;
  186. void *hdr;
  187. hdr = genlmsg_iput(rsp, info);
  188. if (!hdr)
  189. return -EMSGSIZE;
  190. if (nla_put_uint(rsp, NETDEV_A_PAGE_POOL_ID, pool->user.id))
  191. goto err_cancel;
  192. if (pool->slow.netdev->ifindex != LOOPBACK_IFINDEX &&
  193. nla_put_u32(rsp, NETDEV_A_PAGE_POOL_IFINDEX,
  194. pool->slow.netdev->ifindex))
  195. goto err_cancel;
  196. napi_id = pool->p.napi ? READ_ONCE(pool->p.napi->napi_id) : 0;
  197. if (napi_id_valid(napi_id) &&
  198. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_NAPI_ID, napi_id))
  199. goto err_cancel;
  200. inflight = page_pool_inflight(pool, false);
  201. refsz = PAGE_SIZE << pool->p.order;
  202. if (nla_put_uint(rsp, NETDEV_A_PAGE_POOL_INFLIGHT, inflight) ||
  203. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_INFLIGHT_MEM,
  204. inflight * refsz))
  205. goto err_cancel;
  206. if (pool->user.detach_time &&
  207. nla_put_uint(rsp, NETDEV_A_PAGE_POOL_DETACH_TIME,
  208. ktime_divns(pool->user.detach_time, NSEC_PER_SEC)))
  209. goto err_cancel;
  210. if (pool->mp_ops && pool->mp_ops->nl_fill(pool->mp_priv, rsp, NULL))
  211. goto err_cancel;
  212. genlmsg_end(rsp, hdr);
  213. return 0;
  214. err_cancel:
  215. genlmsg_cancel(rsp, hdr);
  216. return -EMSGSIZE;
  217. }
  218. static void netdev_nl_page_pool_event(const struct page_pool *pool, u32 cmd)
  219. {
  220. struct genl_info info;
  221. struct sk_buff *ntf;
  222. struct net *net;
  223. lockdep_assert_held(&page_pools_lock);
  224. /* 'invisible' page pools don't matter */
  225. if (hlist_unhashed(&pool->user.list))
  226. return;
  227. net = dev_net(pool->slow.netdev);
  228. if (!genl_has_listeners(&netdev_nl_family, net, NETDEV_NLGRP_PAGE_POOL))
  229. return;
  230. genl_info_init_ntf(&info, &netdev_nl_family, cmd);
  231. ntf = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL);
  232. if (!ntf)
  233. return;
  234. if (page_pool_nl_fill(ntf, pool, &info)) {
  235. nlmsg_free(ntf);
  236. return;
  237. }
  238. genlmsg_multicast_netns(&netdev_nl_family, net, ntf,
  239. 0, NETDEV_NLGRP_PAGE_POOL, GFP_KERNEL);
  240. }
  241. int netdev_nl_page_pool_get_doit(struct sk_buff *skb, struct genl_info *info)
  242. {
  243. u32 id;
  244. if (GENL_REQ_ATTR_CHECK(info, NETDEV_A_PAGE_POOL_ID))
  245. return -EINVAL;
  246. id = nla_get_uint(info->attrs[NETDEV_A_PAGE_POOL_ID]);
  247. return netdev_nl_page_pool_get_do(info, id, page_pool_nl_fill);
  248. }
  249. int netdev_nl_page_pool_get_dumpit(struct sk_buff *skb,
  250. struct netlink_callback *cb)
  251. {
  252. return netdev_nl_page_pool_get_dump(skb, cb, page_pool_nl_fill);
  253. }
  254. int page_pool_list(struct page_pool *pool)
  255. {
  256. static u32 id_alloc_next;
  257. int err;
  258. mutex_lock(&page_pools_lock);
  259. err = xa_alloc_cyclic(&page_pools, &pool->user.id, pool, xa_limit_32b,
  260. &id_alloc_next, GFP_KERNEL);
  261. if (err < 0)
  262. goto err_unlock;
  263. INIT_HLIST_NODE(&pool->user.list);
  264. if (pool->slow.netdev) {
  265. hlist_add_head(&pool->user.list,
  266. &pool->slow.netdev->page_pools);
  267. netdev_nl_page_pool_event(pool, NETDEV_CMD_PAGE_POOL_ADD_NTF);
  268. }
  269. mutex_unlock(&page_pools_lock);
  270. return 0;
  271. err_unlock:
  272. mutex_unlock(&page_pools_lock);
  273. return err;
  274. }
  275. void page_pool_detached(struct page_pool *pool)
  276. {
  277. mutex_lock(&page_pools_lock);
  278. pool->user.detach_time = ktime_get_boottime();
  279. netdev_nl_page_pool_event(pool, NETDEV_CMD_PAGE_POOL_CHANGE_NTF);
  280. mutex_unlock(&page_pools_lock);
  281. }
  282. void page_pool_unlist(struct page_pool *pool)
  283. {
  284. mutex_lock(&page_pools_lock);
  285. netdev_nl_page_pool_event(pool, NETDEV_CMD_PAGE_POOL_DEL_NTF);
  286. xa_erase(&page_pools, pool->user.id);
  287. if (!hlist_unhashed(&pool->user.list))
  288. hlist_del(&pool->user.list);
  289. mutex_unlock(&page_pools_lock);
  290. }
  291. int page_pool_check_memory_provider(struct net_device *dev,
  292. struct netdev_rx_queue *rxq)
  293. {
  294. void *binding = rxq->mp_params.mp_priv;
  295. struct page_pool *pool;
  296. struct hlist_node *n;
  297. if (!binding)
  298. return 0;
  299. mutex_lock(&page_pools_lock);
  300. hlist_for_each_entry_safe(pool, n, &dev->page_pools, user.list) {
  301. if (pool->mp_priv != binding)
  302. continue;
  303. if (pool->slow.queue_idx == get_netdev_rx_queue_index(rxq)) {
  304. mutex_unlock(&page_pools_lock);
  305. return 0;
  306. }
  307. }
  308. mutex_unlock(&page_pools_lock);
  309. return -ENODATA;
  310. }
  311. static void page_pool_unreg_netdev_wipe(struct net_device *netdev)
  312. {
  313. struct page_pool *pool;
  314. struct hlist_node *n;
  315. mutex_lock(&page_pools_lock);
  316. hlist_for_each_entry_safe(pool, n, &netdev->page_pools, user.list) {
  317. hlist_del_init(&pool->user.list);
  318. pool->slow.netdev = NET_PTR_POISON;
  319. }
  320. mutex_unlock(&page_pools_lock);
  321. }
  322. static void page_pool_unreg_netdev(struct net_device *netdev)
  323. {
  324. struct page_pool *pool, *last;
  325. struct net_device *lo;
  326. lo = dev_net(netdev)->loopback_dev;
  327. mutex_lock(&page_pools_lock);
  328. last = NULL;
  329. hlist_for_each_entry(pool, &netdev->page_pools, user.list) {
  330. pool->slow.netdev = lo;
  331. netdev_nl_page_pool_event(pool,
  332. NETDEV_CMD_PAGE_POOL_CHANGE_NTF);
  333. last = pool;
  334. }
  335. if (last)
  336. hlist_splice_init(&netdev->page_pools, &last->user.list,
  337. &lo->page_pools);
  338. mutex_unlock(&page_pools_lock);
  339. }
  340. static int
  341. page_pool_netdevice_event(struct notifier_block *nb,
  342. unsigned long event, void *ptr)
  343. {
  344. struct net_device *netdev = netdev_notifier_info_to_dev(ptr);
  345. if (event != NETDEV_UNREGISTER)
  346. return NOTIFY_DONE;
  347. if (hlist_empty(&netdev->page_pools))
  348. return NOTIFY_OK;
  349. if (netdev->ifindex != LOOPBACK_IFINDEX)
  350. page_pool_unreg_netdev(netdev);
  351. else
  352. page_pool_unreg_netdev_wipe(netdev);
  353. return NOTIFY_OK;
  354. }
  355. static struct notifier_block page_pool_netdevice_nb = {
  356. .notifier_call = page_pool_netdevice_event,
  357. };
  358. static int __init page_pool_user_init(void)
  359. {
  360. return register_netdevice_notifier(&page_pool_netdevice_nb);
  361. }
  362. subsys_initcall(page_pool_user_init);