core.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549
  1. // SPDX-License-Identifier: GPL-2.0-or-later
  2. /*
  3. * Copyright (c) 2016 Mellanox Technologies. All rights reserved.
  4. * Copyright (c) 2016 Jiri Pirko <jiri@mellanox.com>
  5. */
  6. #include <net/genetlink.h>
  7. #define CREATE_TRACE_POINTS
  8. #include <trace/events/devlink.h>
  9. #include "devl_internal.h"
/* Make the devlink tracepoints available to GPL modules. */
EXPORT_TRACEPOINT_SYMBOL_GPL(devlink_hwmsg);
EXPORT_TRACEPOINT_SYMBOL_GPL(devlink_hwerr);
EXPORT_TRACEPOINT_SYMBOL_GPL(devlink_trap_report);

/* All devlink instances, keyed by devlink->index. Entries are inserted by
 * devlink_alloc_ns() and erased by devlink_free(); the DEVLINK_REGISTERED
 * mark is set on an entry between devl_register() and devl_unregister().
 */
DEFINE_XARRAY_FLAGS(devlinks, XA_FLAGS_ALLOC);
  14. static struct devlink *devlinks_xa_get(unsigned long index)
  15. {
  16. struct devlink *devlink;
  17. rcu_read_lock();
  18. devlink = xa_find(&devlinks, &index, index, DEVLINK_REGISTERED);
  19. if (!devlink || !devlink_try_get(devlink))
  20. devlink = NULL;
  21. rcu_read_unlock();
  22. return devlink;
  23. }
/* The devlink_rels xarray contains 1:1 relationships between a
 * devlink object and the devlink instance nested in it.
 * The xarray index (never 0, see XA_FLAGS_ALLOC1) is what the
 * nested-in object code stores and later uses to get to the
 * nested devlink instance.
 */
static DEFINE_XARRAY_FLAGS(devlink_rels, XA_FLAGS_ALLOC1);

/* Set on a devlink_rels entry by devlink_rel_nested_in_add() and cleared by
 * devlink_rel_put() / devlink_rel_nested_in_clear(). Lookups through
 * devlink_rel_find() only return entries that carry this mark.
 */
#define DEVLINK_REL_IN_USE XA_MARK_0
/* One relationship between a nested devlink instance and the object of
 * another devlink instance it is nested in.
 */
struct devlink_rel {
	/* Index of this entry in the devlink_rels xarray. */
	u32 index;
	/* Starts at 1; the entry is erased and freed when it drops to zero. */
	refcount_t refcount;
	/* Index (in devlinks) of the nested devlink instance. */
	u32 devlink_index;
	struct {
		/* Index (in devlinks) of the instance owning the nested-in object. */
		u32 devlink_index;
		/* Object identifier handed back to both callbacks. */
		u32 obj_index;
		/* Called from the notify work with the nested-in instance locked. */
		devlink_rel_notify_cb_t *notify_cb;
		/* Called from the notify work, before notify_cb, once the
		 * DEVLINK_REL_IN_USE mark has been cleared.
		 */
		devlink_rel_cleanup_cb_t *cleanup_cb;
		/* Runs devlink_rel_nested_in_notify_work(). */
		struct delayed_work notify_work;
	} nested_in;
};
  43. static void devlink_rel_free(struct devlink_rel *rel)
  44. {
  45. xa_erase(&devlink_rels, rel->index);
  46. kfree(rel);
  47. }
  48. static void __devlink_rel_get(struct devlink_rel *rel)
  49. {
  50. refcount_inc(&rel->refcount);
  51. }
  52. static void __devlink_rel_put(struct devlink_rel *rel)
  53. {
  54. if (refcount_dec_and_test(&rel->refcount))
  55. devlink_rel_free(rel);
  56. }
  57. static void devlink_rel_nested_in_notify_work(struct work_struct *work)
  58. {
  59. struct devlink_rel *rel = container_of(work, struct devlink_rel,
  60. nested_in.notify_work.work);
  61. struct devlink *devlink;
  62. devlink = devlinks_xa_get(rel->nested_in.devlink_index);
  63. if (!devlink)
  64. goto rel_put;
  65. if (!devl_trylock(devlink)) {
  66. devlink_put(devlink);
  67. goto reschedule_work;
  68. }
  69. if (!devl_is_registered(devlink)) {
  70. devl_unlock(devlink);
  71. devlink_put(devlink);
  72. goto rel_put;
  73. }
  74. if (!xa_get_mark(&devlink_rels, rel->index, DEVLINK_REL_IN_USE))
  75. rel->nested_in.cleanup_cb(devlink, rel->nested_in.obj_index, rel->index);
  76. rel->nested_in.notify_cb(devlink, rel->nested_in.obj_index);
  77. devl_unlock(devlink);
  78. devlink_put(devlink);
  79. rel_put:
  80. __devlink_rel_put(rel);
  81. return;
  82. reschedule_work:
  83. schedule_delayed_work(&rel->nested_in.notify_work, 1);
  84. }
  85. static void devlink_rel_nested_in_notify_work_schedule(struct devlink_rel *rel)
  86. {
  87. __devlink_rel_get(rel);
  88. schedule_delayed_work(&rel->nested_in.notify_work, 0);
  89. }
  90. static struct devlink_rel *devlink_rel_alloc(void)
  91. {
  92. struct devlink_rel *rel;
  93. static u32 next;
  94. int err;
  95. rel = kzalloc_obj(*rel);
  96. if (!rel)
  97. return ERR_PTR(-ENOMEM);
  98. err = xa_alloc_cyclic(&devlink_rels, &rel->index, rel,
  99. xa_limit_32b, &next, GFP_KERNEL);
  100. if (err < 0) {
  101. kfree(rel);
  102. return ERR_PTR(err);
  103. }
  104. refcount_set(&rel->refcount, 1);
  105. INIT_DELAYED_WORK(&rel->nested_in.notify_work,
  106. &devlink_rel_nested_in_notify_work);
  107. return rel;
  108. }
  109. static void devlink_rel_put(struct devlink *devlink)
  110. {
  111. struct devlink_rel *rel = devlink->rel;
  112. if (!rel)
  113. return;
  114. xa_clear_mark(&devlink_rels, rel->index, DEVLINK_REL_IN_USE);
  115. devlink_rel_nested_in_notify_work_schedule(rel);
  116. __devlink_rel_put(rel);
  117. devlink->rel = NULL;
  118. }
  119. void devlink_rel_nested_in_clear(u32 rel_index)
  120. {
  121. xa_clear_mark(&devlink_rels, rel_index, DEVLINK_REL_IN_USE);
  122. }
  123. int devlink_rel_nested_in_add(u32 *rel_index, u32 devlink_index,
  124. u32 obj_index, devlink_rel_notify_cb_t *notify_cb,
  125. devlink_rel_cleanup_cb_t *cleanup_cb,
  126. struct devlink *devlink)
  127. {
  128. struct devlink_rel *rel = devlink_rel_alloc();
  129. ASSERT_DEVLINK_NOT_REGISTERED(devlink);
  130. if (IS_ERR(rel))
  131. return PTR_ERR(rel);
  132. rel->devlink_index = devlink->index;
  133. rel->nested_in.devlink_index = devlink_index;
  134. rel->nested_in.obj_index = obj_index;
  135. rel->nested_in.notify_cb = notify_cb;
  136. rel->nested_in.cleanup_cb = cleanup_cb;
  137. *rel_index = rel->index;
  138. xa_set_mark(&devlink_rels, rel->index, DEVLINK_REL_IN_USE);
  139. devlink->rel = rel;
  140. return 0;
  141. }
  142. /**
  143. * devlink_rel_nested_in_notify - Notify the object this devlink
  144. * instance is nested in.
  145. * @devlink: devlink
  146. *
  147. * This is called upon network namespace change of devlink instance.
  148. * In case this devlink instance is nested in another devlink object,
  149. * a notification of a change of this object should be sent
  150. * over netlink. The parent devlink instance lock needs to be
  151. * taken during the notification preparation.
  152. * Since the parent may or may not be locked, 'work' is utilized.
  153. */
  154. void devlink_rel_nested_in_notify(struct devlink *devlink)
  155. {
  156. struct devlink_rel *rel = devlink->rel;
  157. if (!rel)
  158. return;
  159. devlink_rel_nested_in_notify_work_schedule(rel);
  160. }
  161. static struct devlink_rel *devlink_rel_find(unsigned long rel_index)
  162. {
  163. return xa_find(&devlink_rels, &rel_index, rel_index,
  164. DEVLINK_REL_IN_USE);
  165. }
  166. static struct devlink *devlink_rel_devlink_get(u32 rel_index)
  167. {
  168. struct devlink_rel *rel;
  169. u32 devlink_index;
  170. if (!rel_index)
  171. return NULL;
  172. xa_lock(&devlink_rels);
  173. rel = devlink_rel_find(rel_index);
  174. if (rel)
  175. devlink_index = rel->devlink_index;
  176. xa_unlock(&devlink_rels);
  177. if (!rel)
  178. return NULL;
  179. return devlinks_xa_get(devlink_index);
  180. }
  181. int devlink_rel_devlink_handle_put(struct sk_buff *msg, struct devlink *devlink,
  182. u32 rel_index, int attrtype,
  183. bool *msg_updated)
  184. {
  185. struct net *net = devlink_net(devlink);
  186. struct devlink *rel_devlink;
  187. int err;
  188. rel_devlink = devlink_rel_devlink_get(rel_index);
  189. if (!rel_devlink)
  190. return 0;
  191. err = devlink_nl_put_nested_handle(msg, net, rel_devlink, attrtype);
  192. devlink_put(rel_devlink);
  193. if (!err && msg_updated)
  194. *msg_updated = true;
  195. return err;
  196. }
  197. void *devlink_priv(struct devlink *devlink)
  198. {
  199. return &devlink->priv;
  200. }
  201. EXPORT_SYMBOL_GPL(devlink_priv);
  202. struct devlink *priv_to_devlink(void *priv)
  203. {
  204. return container_of(priv, struct devlink, priv);
  205. }
  206. EXPORT_SYMBOL_GPL(priv_to_devlink);
  207. struct device *devlink_to_dev(const struct devlink *devlink)
  208. {
  209. return devlink->dev;
  210. }
  211. EXPORT_SYMBOL_GPL(devlink_to_dev);
  212. struct net *devlink_net(const struct devlink *devlink)
  213. {
  214. return read_pnet(&devlink->_net);
  215. }
  216. EXPORT_SYMBOL_GPL(devlink_net);
  217. void devl_assert_locked(struct devlink *devlink)
  218. {
  219. lockdep_assert_held(&devlink->lock);
  220. }
  221. EXPORT_SYMBOL_GPL(devl_assert_locked);
  222. #ifdef CONFIG_LOCKDEP
  223. /* For use in conjunction with LOCKDEP only e.g. rcu_dereference_protected() */
  224. bool devl_lock_is_held(struct devlink *devlink)
  225. {
  226. return lockdep_is_held(&devlink->lock);
  227. }
  228. EXPORT_SYMBOL_GPL(devl_lock_is_held);
  229. #endif
  230. void devl_lock(struct devlink *devlink)
  231. {
  232. mutex_lock(&devlink->lock);
  233. }
  234. EXPORT_SYMBOL_GPL(devl_lock);
  235. int devl_trylock(struct devlink *devlink)
  236. {
  237. return mutex_trylock(&devlink->lock);
  238. }
  239. EXPORT_SYMBOL_GPL(devl_trylock);
  240. void devl_unlock(struct devlink *devlink)
  241. {
  242. mutex_unlock(&devlink->lock);
  243. }
  244. EXPORT_SYMBOL_GPL(devl_unlock);
  245. /**
  246. * devlink_try_get() - try to obtain a reference on a devlink instance
  247. * @devlink: instance to reference
  248. *
  249. * Obtain a reference on a devlink instance. A reference on a devlink instance
  250. * only implies that it's safe to take the instance lock. It does not imply
  251. * that the instance is registered, use devl_is_registered() after taking
  252. * the instance lock to check registration status.
  253. */
  254. struct devlink *__must_check devlink_try_get(struct devlink *devlink)
  255. {
  256. if (refcount_inc_not_zero(&devlink->refcount))
  257. return devlink;
  258. return NULL;
  259. }
  260. static void devlink_release(struct work_struct *work)
  261. {
  262. struct devlink *devlink;
  263. devlink = container_of(to_rcu_work(work), struct devlink, rwork);
  264. mutex_destroy(&devlink->lock);
  265. lockdep_unregister_key(&devlink->lock_key);
  266. put_device(devlink->dev);
  267. kvfree(devlink);
  268. }
  269. void devlink_put(struct devlink *devlink)
  270. {
  271. if (refcount_dec_and_test(&devlink->refcount))
  272. queue_rcu_work(system_percpu_wq, &devlink->rwork);
  273. }
  274. struct devlink *devlinks_xa_find_get(struct net *net, unsigned long *indexp)
  275. {
  276. struct devlink *devlink = NULL;
  277. rcu_read_lock();
  278. retry:
  279. devlink = xa_find(&devlinks, indexp, ULONG_MAX, DEVLINK_REGISTERED);
  280. if (!devlink)
  281. goto unlock;
  282. if (!devlink_try_get(devlink))
  283. goto next;
  284. if (!net_eq(devlink_net(devlink), net)) {
  285. devlink_put(devlink);
  286. goto next;
  287. }
  288. unlock:
  289. rcu_read_unlock();
  290. return devlink;
  291. next:
  292. (*indexp)++;
  293. goto retry;
  294. }
  295. /**
  296. * devl_register - Register devlink instance
  297. * @devlink: devlink
  298. */
  299. int devl_register(struct devlink *devlink)
  300. {
  301. ASSERT_DEVLINK_NOT_REGISTERED(devlink);
  302. devl_assert_locked(devlink);
  303. xa_set_mark(&devlinks, devlink->index, DEVLINK_REGISTERED);
  304. devlink_notify_register(devlink);
  305. devlink_rel_nested_in_notify(devlink);
  306. return 0;
  307. }
  308. EXPORT_SYMBOL_GPL(devl_register);
  309. void devlink_register(struct devlink *devlink)
  310. {
  311. devl_lock(devlink);
  312. devl_register(devlink);
  313. devl_unlock(devlink);
  314. }
  315. EXPORT_SYMBOL_GPL(devlink_register);
  316. /**
  317. * devl_unregister - Unregister devlink instance
  318. * @devlink: devlink
  319. */
  320. void devl_unregister(struct devlink *devlink)
  321. {
  322. ASSERT_DEVLINK_REGISTERED(devlink);
  323. devl_assert_locked(devlink);
  324. devlink_notify_unregister(devlink);
  325. xa_clear_mark(&devlinks, devlink->index, DEVLINK_REGISTERED);
  326. devlink_rel_put(devlink);
  327. }
  328. EXPORT_SYMBOL_GPL(devl_unregister);
  329. void devlink_unregister(struct devlink *devlink)
  330. {
  331. devl_lock(devlink);
  332. devl_unregister(devlink);
  333. devl_unlock(devlink);
  334. }
  335. EXPORT_SYMBOL_GPL(devlink_unregister);
  336. /**
  337. * devlink_alloc_ns - Allocate new devlink instance resources
  338. * in specific namespace
  339. *
  340. * @ops: ops
  341. * @priv_size: size of user private data
  342. * @net: net namespace
  343. * @dev: parent device
  344. *
  345. * Allocate new devlink instance resources, including devlink index
  346. * and name.
  347. */
  348. struct devlink *devlink_alloc_ns(const struct devlink_ops *ops,
  349. size_t priv_size, struct net *net,
  350. struct device *dev)
  351. {
  352. struct devlink *devlink;
  353. static u32 last_id;
  354. int ret;
  355. WARN_ON(!ops || !dev);
  356. if (!devlink_reload_actions_valid(ops))
  357. return NULL;
  358. devlink = kvzalloc_flex(*devlink, priv, priv_size);
  359. if (!devlink)
  360. return NULL;
  361. ret = xa_alloc_cyclic(&devlinks, &devlink->index, devlink, xa_limit_31b,
  362. &last_id, GFP_KERNEL);
  363. if (ret < 0)
  364. goto err_xa_alloc;
  365. devlink->dev = get_device(dev);
  366. devlink->ops = ops;
  367. xa_init_flags(&devlink->ports, XA_FLAGS_ALLOC);
  368. xa_init_flags(&devlink->params, XA_FLAGS_ALLOC);
  369. xa_init_flags(&devlink->snapshot_ids, XA_FLAGS_ALLOC);
  370. xa_init_flags(&devlink->nested_rels, XA_FLAGS_ALLOC);
  371. write_pnet(&devlink->_net, net);
  372. INIT_LIST_HEAD(&devlink->rate_list);
  373. INIT_LIST_HEAD(&devlink->linecard_list);
  374. INIT_LIST_HEAD(&devlink->sb_list);
  375. INIT_LIST_HEAD_RCU(&devlink->dpipe_table_list);
  376. INIT_LIST_HEAD(&devlink->resource_list);
  377. INIT_LIST_HEAD(&devlink->region_list);
  378. INIT_LIST_HEAD(&devlink->reporter_list);
  379. INIT_LIST_HEAD(&devlink->trap_list);
  380. INIT_LIST_HEAD(&devlink->trap_group_list);
  381. INIT_LIST_HEAD(&devlink->trap_policer_list);
  382. INIT_RCU_WORK(&devlink->rwork, devlink_release);
  383. lockdep_register_key(&devlink->lock_key);
  384. mutex_init(&devlink->lock);
  385. lockdep_set_class(&devlink->lock, &devlink->lock_key);
  386. refcount_set(&devlink->refcount, 1);
  387. return devlink;
  388. err_xa_alloc:
  389. kvfree(devlink);
  390. return NULL;
  391. }
  392. EXPORT_SYMBOL_GPL(devlink_alloc_ns);
  393. /**
  394. * devlink_free - Free devlink instance resources
  395. *
  396. * @devlink: devlink
  397. */
  398. void devlink_free(struct devlink *devlink)
  399. {
  400. ASSERT_DEVLINK_NOT_REGISTERED(devlink);
  401. WARN_ON(!list_empty(&devlink->trap_policer_list));
  402. WARN_ON(!list_empty(&devlink->trap_group_list));
  403. WARN_ON(!list_empty(&devlink->trap_list));
  404. WARN_ON(!list_empty(&devlink->reporter_list));
  405. WARN_ON(!list_empty(&devlink->region_list));
  406. WARN_ON(!list_empty(&devlink->resource_list));
  407. WARN_ON(!list_empty(&devlink->dpipe_table_list));
  408. WARN_ON(!list_empty(&devlink->sb_list));
  409. WARN_ON(devlink_rates_check(devlink, NULL, NULL));
  410. WARN_ON(!list_empty(&devlink->linecard_list));
  411. WARN_ON(!xa_empty(&devlink->ports));
  412. xa_destroy(&devlink->nested_rels);
  413. xa_destroy(&devlink->snapshot_ids);
  414. xa_destroy(&devlink->params);
  415. xa_destroy(&devlink->ports);
  416. xa_erase(&devlinks, devlink->index);
  417. devlink_put(devlink);
  418. }
  419. EXPORT_SYMBOL_GPL(devlink_free);
  420. static void __net_exit devlink_pernet_pre_exit(struct net *net)
  421. {
  422. struct devlink *devlink;
  423. u32 actions_performed;
  424. unsigned long index;
  425. int err;
  426. /* In case network namespace is getting destroyed, reload
  427. * all devlink instances from this namespace into init_net.
  428. */
  429. devlinks_xa_for_each_registered_get(net, index, devlink) {
  430. devl_dev_lock(devlink, true);
  431. err = 0;
  432. if (devl_is_registered(devlink))
  433. err = devlink_reload(devlink, &init_net,
  434. DEVLINK_RELOAD_ACTION_DRIVER_REINIT,
  435. DEVLINK_RELOAD_LIMIT_UNSPEC,
  436. &actions_performed, NULL);
  437. devl_dev_unlock(devlink, true);
  438. devlink_put(devlink);
  439. if (err && err != -EOPNOTSUPP)
  440. pr_warn("Failed to reload devlink instance into init_net\n");
  441. }
  442. }
/* Per network namespace operations, registered by devlink_init(). Only
 * pre_exit is provided: it moves devlink instances out of a namespace that
 * is going away.
 */
static struct pernet_operations devlink_pernet_ops __net_initdata = {
	.pre_exit = devlink_pernet_pre_exit,
};
/* Netdevice notifier registered by devlink_init(); events are handled by
 * devlink_port_netdevice_event().
 */
static struct notifier_block devlink_port_netdevice_nb = {
	.notifier_call = devlink_port_netdevice_event,
};
  449. static int __init devlink_init(void)
  450. {
  451. int err;
  452. err = register_pernet_subsys(&devlink_pernet_ops);
  453. if (err)
  454. goto out;
  455. err = genl_register_family(&devlink_nl_family);
  456. if (err)
  457. goto out_unreg_pernet_subsys;
  458. err = register_netdevice_notifier(&devlink_port_netdevice_nb);
  459. if (!err)
  460. return 0;
  461. genl_unregister_family(&devlink_nl_family);
  462. out_unreg_pernet_subsys:
  463. unregister_pernet_subsys(&devlink_pernet_ops);
  464. out:
  465. WARN_ON(err);
  466. return err;
  467. }
  468. subsys_initcall(devlink_init);