nldev.c 75 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920
  1. /*
  2. * Copyright (c) 2017 Mellanox Technologies. All rights reserved.
  3. *
  4. * Redistribution and use in source and binary forms, with or without
  5. * modification, are permitted provided that the following conditions are met:
  6. *
  7. * 1. Redistributions of source code must retain the above copyright
  8. * notice, this list of conditions and the following disclaimer.
  9. * 2. Redistributions in binary form must reproduce the above copyright
  10. * notice, this list of conditions and the following disclaimer in the
  11. * documentation and/or other materials provided with the distribution.
  12. * 3. Neither the names of the copyright holders nor the names of its
  13. * contributors may be used to endorse or promote products derived from
  14. * this software without specific prior written permission.
  15. *
  16. * Alternatively, this software may be distributed under the terms of the
  17. * GNU General Public License ("GPL") version 2 as published by the Free
  18. * Software Foundation.
  19. *
  20. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  21. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  22. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  23. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  24. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  25. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  26. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  27. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  28. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  29. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  30. * POSSIBILITY OF SUCH DAMAGE.
  31. */
  32. #include <linux/module.h>
  33. #include <linux/pid.h>
  34. #include <linux/pid_namespace.h>
  35. #include <linux/mutex.h>
  36. #include <net/netlink.h>
  37. #include <rdma/rdma_cm.h>
  38. #include <rdma/rdma_netlink.h>
  39. #include "core_priv.h"
  40. #include "cma_priv.h"
  41. #include "restrack.h"
  42. #include "uverbs.h"
  43. /*
  44. * This determines whether a non-privileged user is allowed to specify a
  45. * controlled QKEY or not, when true non-privileged user is allowed to specify
  46. * a controlled QKEY.
  47. */
  48. static bool privileged_qkey;
  49. typedef int (*res_fill_func_t)(struct sk_buff*, bool,
  50. struct rdma_restrack_entry*, uint32_t);
  51. /*
  52. * Sort array elements by the netlink attribute name
  53. */
  54. static const struct nla_policy nldev_policy[RDMA_NLDEV_ATTR_MAX] = {
  55. [RDMA_NLDEV_ATTR_CHARDEV] = { .type = NLA_U64 },
  56. [RDMA_NLDEV_ATTR_CHARDEV_ABI] = { .type = NLA_U64 },
  57. [RDMA_NLDEV_ATTR_CHARDEV_NAME] = { .type = NLA_NUL_STRING,
  58. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  59. [RDMA_NLDEV_ATTR_CHARDEV_TYPE] = { .type = NLA_NUL_STRING,
  60. .len = RDMA_NLDEV_ATTR_CHARDEV_TYPE_SIZE },
  61. [RDMA_NLDEV_ATTR_DEV_DIM] = { .type = NLA_U8 },
  62. [RDMA_NLDEV_ATTR_DEV_INDEX] = { .type = NLA_U32 },
  63. [RDMA_NLDEV_ATTR_DEV_NAME] = { .type = NLA_NUL_STRING,
  64. .len = IB_DEVICE_NAME_MAX },
  65. [RDMA_NLDEV_ATTR_DEV_NODE_TYPE] = { .type = NLA_U8 },
  66. [RDMA_NLDEV_ATTR_DEV_PROTOCOL] = { .type = NLA_NUL_STRING,
  67. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  68. [RDMA_NLDEV_ATTR_DRIVER] = { .type = NLA_NESTED },
  69. [RDMA_NLDEV_ATTR_DRIVER_ENTRY] = { .type = NLA_NESTED },
  70. [RDMA_NLDEV_ATTR_DRIVER_PRINT_TYPE] = { .type = NLA_U8 },
  71. [RDMA_NLDEV_ATTR_DRIVER_STRING] = { .type = NLA_NUL_STRING,
  72. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  73. [RDMA_NLDEV_ATTR_DRIVER_S32] = { .type = NLA_S32 },
  74. [RDMA_NLDEV_ATTR_DRIVER_S64] = { .type = NLA_S64 },
  75. [RDMA_NLDEV_ATTR_DRIVER_U32] = { .type = NLA_U32 },
  76. [RDMA_NLDEV_ATTR_DRIVER_U64] = { .type = NLA_U64 },
  77. [RDMA_NLDEV_ATTR_FW_VERSION] = { .type = NLA_NUL_STRING,
  78. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  79. [RDMA_NLDEV_ATTR_LID] = { .type = NLA_U32 },
  80. [RDMA_NLDEV_ATTR_LINK_TYPE] = { .type = NLA_NUL_STRING,
  81. .len = IFNAMSIZ },
  82. [RDMA_NLDEV_ATTR_LMC] = { .type = NLA_U8 },
  83. [RDMA_NLDEV_ATTR_NDEV_INDEX] = { .type = NLA_U32 },
  84. [RDMA_NLDEV_ATTR_NDEV_NAME] = { .type = NLA_NUL_STRING,
  85. .len = IFNAMSIZ },
  86. [RDMA_NLDEV_ATTR_NODE_GUID] = { .type = NLA_U64 },
  87. [RDMA_NLDEV_ATTR_PORT_INDEX] = { .type = NLA_U32 },
  88. [RDMA_NLDEV_ATTR_PORT_PHYS_STATE] = { .type = NLA_U8 },
  89. [RDMA_NLDEV_ATTR_PORT_STATE] = { .type = NLA_U8 },
  90. [RDMA_NLDEV_ATTR_RES_CM_ID] = { .type = NLA_NESTED },
  91. [RDMA_NLDEV_ATTR_RES_CM_IDN] = { .type = NLA_U32 },
  92. [RDMA_NLDEV_ATTR_RES_CM_ID_ENTRY] = { .type = NLA_NESTED },
  93. [RDMA_NLDEV_ATTR_RES_CQ] = { .type = NLA_NESTED },
  94. [RDMA_NLDEV_ATTR_RES_CQE] = { .type = NLA_U32 },
  95. [RDMA_NLDEV_ATTR_RES_CQN] = { .type = NLA_U32 },
  96. [RDMA_NLDEV_ATTR_RES_CQ_ENTRY] = { .type = NLA_NESTED },
  97. [RDMA_NLDEV_ATTR_RES_CTX] = { .type = NLA_NESTED },
  98. [RDMA_NLDEV_ATTR_RES_CTXN] = { .type = NLA_U32 },
  99. [RDMA_NLDEV_ATTR_RES_CTX_ENTRY] = { .type = NLA_NESTED },
  100. [RDMA_NLDEV_ATTR_RES_DST_ADDR] = {
  101. .len = sizeof(struct __kernel_sockaddr_storage) },
  102. [RDMA_NLDEV_ATTR_RES_IOVA] = { .type = NLA_U64 },
  103. [RDMA_NLDEV_ATTR_RES_KERN_NAME] = { .type = NLA_NUL_STRING,
  104. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  105. [RDMA_NLDEV_ATTR_RES_LKEY] = { .type = NLA_U32 },
  106. [RDMA_NLDEV_ATTR_RES_LOCAL_DMA_LKEY] = { .type = NLA_U32 },
  107. [RDMA_NLDEV_ATTR_RES_LQPN] = { .type = NLA_U32 },
  108. [RDMA_NLDEV_ATTR_RES_MR] = { .type = NLA_NESTED },
  109. [RDMA_NLDEV_ATTR_RES_MRLEN] = { .type = NLA_U64 },
  110. [RDMA_NLDEV_ATTR_RES_MRN] = { .type = NLA_U32 },
  111. [RDMA_NLDEV_ATTR_RES_MR_ENTRY] = { .type = NLA_NESTED },
  112. [RDMA_NLDEV_ATTR_RES_PATH_MIG_STATE] = { .type = NLA_U8 },
  113. [RDMA_NLDEV_ATTR_RES_PD] = { .type = NLA_NESTED },
  114. [RDMA_NLDEV_ATTR_RES_PDN] = { .type = NLA_U32 },
  115. [RDMA_NLDEV_ATTR_RES_PD_ENTRY] = { .type = NLA_NESTED },
  116. [RDMA_NLDEV_ATTR_RES_PID] = { .type = NLA_U32 },
  117. [RDMA_NLDEV_ATTR_RES_POLL_CTX] = { .type = NLA_U8 },
  118. [RDMA_NLDEV_ATTR_RES_PS] = { .type = NLA_U32 },
  119. [RDMA_NLDEV_ATTR_RES_QP] = { .type = NLA_NESTED },
  120. [RDMA_NLDEV_ATTR_RES_QP_ENTRY] = { .type = NLA_NESTED },
  121. [RDMA_NLDEV_ATTR_RES_RAW] = { .type = NLA_BINARY },
  122. [RDMA_NLDEV_ATTR_RES_RKEY] = { .type = NLA_U32 },
  123. [RDMA_NLDEV_ATTR_RES_RQPN] = { .type = NLA_U32 },
  124. [RDMA_NLDEV_ATTR_RES_RQ_PSN] = { .type = NLA_U32 },
  125. [RDMA_NLDEV_ATTR_RES_SQ_PSN] = { .type = NLA_U32 },
  126. [RDMA_NLDEV_ATTR_RES_SRC_ADDR] = {
  127. .len = sizeof(struct __kernel_sockaddr_storage) },
  128. [RDMA_NLDEV_ATTR_RES_STATE] = { .type = NLA_U8 },
  129. [RDMA_NLDEV_ATTR_RES_SUMMARY] = { .type = NLA_NESTED },
  130. [RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY] = { .type = NLA_NESTED },
  131. [RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY_CURR]= { .type = NLA_U64 },
  132. [RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY_NAME]= { .type = NLA_NUL_STRING,
  133. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  134. [RDMA_NLDEV_ATTR_RES_TYPE] = { .type = NLA_U8 },
  135. [RDMA_NLDEV_ATTR_RES_SUBTYPE] = { .type = NLA_NUL_STRING,
  136. .len = RDMA_NLDEV_ATTR_EMPTY_STRING },
  137. [RDMA_NLDEV_ATTR_RES_UNSAFE_GLOBAL_RKEY]= { .type = NLA_U32 },
  138. [RDMA_NLDEV_ATTR_RES_USECNT] = { .type = NLA_U64 },
  139. [RDMA_NLDEV_ATTR_RES_SRQ] = { .type = NLA_NESTED },
  140. [RDMA_NLDEV_ATTR_RES_SRQN] = { .type = NLA_U32 },
  141. [RDMA_NLDEV_ATTR_RES_SRQ_ENTRY] = { .type = NLA_NESTED },
  142. [RDMA_NLDEV_ATTR_MIN_RANGE] = { .type = NLA_U32 },
  143. [RDMA_NLDEV_ATTR_MAX_RANGE] = { .type = NLA_U32 },
  144. [RDMA_NLDEV_ATTR_SM_LID] = { .type = NLA_U32 },
  145. [RDMA_NLDEV_ATTR_SUBNET_PREFIX] = { .type = NLA_U64 },
  146. [RDMA_NLDEV_ATTR_STAT_AUTO_MODE_MASK] = { .type = NLA_U32 },
  147. [RDMA_NLDEV_ATTR_STAT_MODE] = { .type = NLA_U32 },
  148. [RDMA_NLDEV_ATTR_STAT_RES] = { .type = NLA_U32 },
  149. [RDMA_NLDEV_ATTR_STAT_COUNTER] = { .type = NLA_NESTED },
  150. [RDMA_NLDEV_ATTR_STAT_COUNTER_ENTRY] = { .type = NLA_NESTED },
  151. [RDMA_NLDEV_ATTR_STAT_COUNTER_ID] = { .type = NLA_U32 },
  152. [RDMA_NLDEV_ATTR_STAT_HWCOUNTERS] = { .type = NLA_NESTED },
  153. [RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY] = { .type = NLA_NESTED },
  154. [RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY_NAME] = { .type = NLA_NUL_STRING },
  155. [RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY_VALUE] = { .type = NLA_U64 },
  156. [RDMA_NLDEV_ATTR_SYS_IMAGE_GUID] = { .type = NLA_U64 },
  157. [RDMA_NLDEV_ATTR_UVERBS_DRIVER_ID] = { .type = NLA_U32 },
  158. [RDMA_NLDEV_NET_NS_FD] = { .type = NLA_U32 },
  159. [RDMA_NLDEV_SYS_ATTR_NETNS_MODE] = { .type = NLA_U8 },
  160. [RDMA_NLDEV_SYS_ATTR_COPY_ON_FORK] = { .type = NLA_U8 },
  161. [RDMA_NLDEV_ATTR_STAT_HWCOUNTER_INDEX] = { .type = NLA_U32 },
  162. [RDMA_NLDEV_ATTR_STAT_HWCOUNTER_DYNAMIC] = { .type = NLA_U8 },
  163. [RDMA_NLDEV_SYS_ATTR_PRIVILEGED_QKEY_MODE] = { .type = NLA_U8 },
  164. [RDMA_NLDEV_ATTR_DRIVER_DETAILS] = { .type = NLA_U8 },
  165. [RDMA_NLDEV_ATTR_DEV_TYPE] = { .type = NLA_U8 },
  166. [RDMA_NLDEV_ATTR_PARENT_NAME] = { .type = NLA_NUL_STRING },
  167. [RDMA_NLDEV_ATTR_NAME_ASSIGN_TYPE] = { .type = NLA_U8 },
  168. [RDMA_NLDEV_ATTR_EVENT_TYPE] = { .type = NLA_U8 },
  169. [RDMA_NLDEV_ATTR_STAT_OPCOUNTER_ENABLED] = { .type = NLA_U8 },
  170. };
  171. static int put_driver_name_print_type(struct sk_buff *msg, const char *name,
  172. enum rdma_nldev_print_type print_type)
  173. {
  174. if (nla_put_string(msg, RDMA_NLDEV_ATTR_DRIVER_STRING, name))
  175. return -EMSGSIZE;
  176. if (print_type != RDMA_NLDEV_PRINT_TYPE_UNSPEC &&
  177. nla_put_u8(msg, RDMA_NLDEV_ATTR_DRIVER_PRINT_TYPE, print_type))
  178. return -EMSGSIZE;
  179. return 0;
  180. }
  181. static int _rdma_nl_put_driver_u32(struct sk_buff *msg, const char *name,
  182. enum rdma_nldev_print_type print_type,
  183. u32 value)
  184. {
  185. if (put_driver_name_print_type(msg, name, print_type))
  186. return -EMSGSIZE;
  187. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_DRIVER_U32, value))
  188. return -EMSGSIZE;
  189. return 0;
  190. }
  191. static int _rdma_nl_put_driver_u64(struct sk_buff *msg, const char *name,
  192. enum rdma_nldev_print_type print_type,
  193. u64 value)
  194. {
  195. if (put_driver_name_print_type(msg, name, print_type))
  196. return -EMSGSIZE;
  197. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_DRIVER_U64, value,
  198. RDMA_NLDEV_ATTR_PAD))
  199. return -EMSGSIZE;
  200. return 0;
  201. }
  202. int rdma_nl_put_driver_string(struct sk_buff *msg, const char *name,
  203. const char *str)
  204. {
  205. if (put_driver_name_print_type(msg, name,
  206. RDMA_NLDEV_PRINT_TYPE_UNSPEC))
  207. return -EMSGSIZE;
  208. if (nla_put_string(msg, RDMA_NLDEV_ATTR_DRIVER_STRING, str))
  209. return -EMSGSIZE;
  210. return 0;
  211. }
  212. EXPORT_SYMBOL(rdma_nl_put_driver_string);
  213. int rdma_nl_put_driver_u32(struct sk_buff *msg, const char *name, u32 value)
  214. {
  215. return _rdma_nl_put_driver_u32(msg, name, RDMA_NLDEV_PRINT_TYPE_UNSPEC,
  216. value);
  217. }
  218. EXPORT_SYMBOL(rdma_nl_put_driver_u32);
  219. int rdma_nl_put_driver_u32_hex(struct sk_buff *msg, const char *name,
  220. u32 value)
  221. {
  222. return _rdma_nl_put_driver_u32(msg, name, RDMA_NLDEV_PRINT_TYPE_HEX,
  223. value);
  224. }
  225. EXPORT_SYMBOL(rdma_nl_put_driver_u32_hex);
  226. int rdma_nl_put_driver_u64(struct sk_buff *msg, const char *name, u64 value)
  227. {
  228. return _rdma_nl_put_driver_u64(msg, name, RDMA_NLDEV_PRINT_TYPE_UNSPEC,
  229. value);
  230. }
  231. EXPORT_SYMBOL(rdma_nl_put_driver_u64);
  232. int rdma_nl_put_driver_u64_hex(struct sk_buff *msg, const char *name, u64 value)
  233. {
  234. return _rdma_nl_put_driver_u64(msg, name, RDMA_NLDEV_PRINT_TYPE_HEX,
  235. value);
  236. }
  237. EXPORT_SYMBOL(rdma_nl_put_driver_u64_hex);
  238. bool rdma_nl_get_privileged_qkey(void)
  239. {
  240. return privileged_qkey;
  241. }
  242. EXPORT_SYMBOL(rdma_nl_get_privileged_qkey);
  243. static int fill_nldev_handle(struct sk_buff *msg, struct ib_device *device)
  244. {
  245. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_DEV_INDEX, device->index))
  246. return -EMSGSIZE;
  247. if (nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_NAME,
  248. dev_name(&device->dev)))
  249. return -EMSGSIZE;
  250. return 0;
  251. }
  252. static int fill_dev_info(struct sk_buff *msg, struct ib_device *device)
  253. {
  254. char fw[IB_FW_VERSION_NAME_MAX];
  255. int ret = 0;
  256. u32 port;
  257. if (fill_nldev_handle(msg, device))
  258. return -EMSGSIZE;
  259. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, rdma_end_port(device)))
  260. return -EMSGSIZE;
  261. BUILD_BUG_ON(sizeof(device->attrs.device_cap_flags) != sizeof(u64));
  262. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_CAP_FLAGS,
  263. device->attrs.device_cap_flags,
  264. RDMA_NLDEV_ATTR_PAD))
  265. return -EMSGSIZE;
  266. ib_get_device_fw_str(device, fw);
  267. /* Device without FW has strlen(fw) = 0 */
  268. if (strlen(fw) && nla_put_string(msg, RDMA_NLDEV_ATTR_FW_VERSION, fw))
  269. return -EMSGSIZE;
  270. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_NODE_GUID,
  271. be64_to_cpu(device->node_guid),
  272. RDMA_NLDEV_ATTR_PAD))
  273. return -EMSGSIZE;
  274. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_SYS_IMAGE_GUID,
  275. be64_to_cpu(device->attrs.sys_image_guid),
  276. RDMA_NLDEV_ATTR_PAD))
  277. return -EMSGSIZE;
  278. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_DEV_NODE_TYPE, device->node_type))
  279. return -EMSGSIZE;
  280. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_DEV_DIM, device->use_cq_dim))
  281. return -EMSGSIZE;
  282. if (device->type &&
  283. nla_put_u8(msg, RDMA_NLDEV_ATTR_DEV_TYPE, device->type))
  284. return -EMSGSIZE;
  285. if (device->parent &&
  286. nla_put_string(msg, RDMA_NLDEV_ATTR_PARENT_NAME,
  287. dev_name(&device->parent->dev)))
  288. return -EMSGSIZE;
  289. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_NAME_ASSIGN_TYPE,
  290. device->name_assign_type))
  291. return -EMSGSIZE;
  292. /*
  293. * Link type is determined on first port and mlx4 device
  294. * which can potentially have two different link type for the same
  295. * IB device is considered as better to be avoided in the future,
  296. */
  297. port = rdma_start_port(device);
  298. if (rdma_cap_opa_mad(device, port))
  299. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_PROTOCOL, "opa");
  300. else if (rdma_protocol_ib(device, port))
  301. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_PROTOCOL, "ib");
  302. else if (rdma_protocol_iwarp(device, port))
  303. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_PROTOCOL, "iw");
  304. else if (rdma_protocol_roce(device, port))
  305. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_PROTOCOL, "roce");
  306. else if (rdma_protocol_usnic(device, port))
  307. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_PROTOCOL,
  308. "usnic");
  309. return ret;
  310. }
  311. static int fill_port_info(struct sk_buff *msg,
  312. struct ib_device *device, u32 port,
  313. const struct net *net)
  314. {
  315. struct net_device *netdev = NULL;
  316. struct ib_port_attr attr;
  317. int ret;
  318. u64 cap_flags = 0;
  319. if (fill_nldev_handle(msg, device))
  320. return -EMSGSIZE;
  321. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port))
  322. return -EMSGSIZE;
  323. ret = ib_query_port(device, port, &attr);
  324. if (ret)
  325. return ret;
  326. if (rdma_protocol_ib(device, port)) {
  327. BUILD_BUG_ON((sizeof(attr.port_cap_flags) +
  328. sizeof(attr.port_cap_flags2)) > sizeof(u64));
  329. cap_flags = attr.port_cap_flags |
  330. ((u64)attr.port_cap_flags2 << 32);
  331. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_CAP_FLAGS,
  332. cap_flags, RDMA_NLDEV_ATTR_PAD))
  333. return -EMSGSIZE;
  334. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_SUBNET_PREFIX,
  335. attr.subnet_prefix, RDMA_NLDEV_ATTR_PAD))
  336. return -EMSGSIZE;
  337. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_LID, attr.lid))
  338. return -EMSGSIZE;
  339. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_SM_LID, attr.sm_lid))
  340. return -EMSGSIZE;
  341. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_LMC, attr.lmc))
  342. return -EMSGSIZE;
  343. }
  344. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_PORT_STATE, attr.state))
  345. return -EMSGSIZE;
  346. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_PORT_PHYS_STATE, attr.phys_state))
  347. return -EMSGSIZE;
  348. netdev = ib_device_get_netdev(device, port);
  349. if (netdev && net_eq(dev_net(netdev), net)) {
  350. ret = nla_put_u32(msg,
  351. RDMA_NLDEV_ATTR_NDEV_INDEX, netdev->ifindex);
  352. if (ret)
  353. goto out;
  354. ret = nla_put_string(msg,
  355. RDMA_NLDEV_ATTR_NDEV_NAME, netdev->name);
  356. }
  357. out:
  358. dev_put(netdev);
  359. return ret;
  360. }
  361. static int fill_res_info_entry(struct sk_buff *msg,
  362. const char *name, u64 curr)
  363. {
  364. struct nlattr *entry_attr;
  365. entry_attr = nla_nest_start_noflag(msg,
  366. RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY);
  367. if (!entry_attr)
  368. return -EMSGSIZE;
  369. if (nla_put_string(msg, RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY_NAME, name))
  370. goto err;
  371. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_RES_SUMMARY_ENTRY_CURR, curr,
  372. RDMA_NLDEV_ATTR_PAD))
  373. goto err;
  374. nla_nest_end(msg, entry_attr);
  375. return 0;
  376. err:
  377. nla_nest_cancel(msg, entry_attr);
  378. return -EMSGSIZE;
  379. }
  380. static int fill_res_info(struct sk_buff *msg, struct ib_device *device,
  381. bool show_details)
  382. {
  383. static const char * const names[RDMA_RESTRACK_MAX] = {
  384. [RDMA_RESTRACK_PD] = "pd",
  385. [RDMA_RESTRACK_CQ] = "cq",
  386. [RDMA_RESTRACK_QP] = "qp",
  387. [RDMA_RESTRACK_CM_ID] = "cm_id",
  388. [RDMA_RESTRACK_MR] = "mr",
  389. [RDMA_RESTRACK_CTX] = "ctx",
  390. [RDMA_RESTRACK_SRQ] = "srq",
  391. };
  392. struct nlattr *table_attr;
  393. int ret, i, curr;
  394. if (fill_nldev_handle(msg, device))
  395. return -EMSGSIZE;
  396. table_attr = nla_nest_start_noflag(msg, RDMA_NLDEV_ATTR_RES_SUMMARY);
  397. if (!table_attr)
  398. return -EMSGSIZE;
  399. for (i = 0; i < RDMA_RESTRACK_MAX; i++) {
  400. if (!names[i])
  401. continue;
  402. curr = rdma_restrack_count(device, i, show_details);
  403. ret = fill_res_info_entry(msg, names[i], curr);
  404. if (ret)
  405. goto err;
  406. }
  407. nla_nest_end(msg, table_attr);
  408. return 0;
  409. err:
  410. nla_nest_cancel(msg, table_attr);
  411. return ret;
  412. }
  413. static int fill_res_name_pid(struct sk_buff *msg,
  414. struct rdma_restrack_entry *res)
  415. {
  416. int err = 0;
  417. /*
  418. * For user resources, user is should read /proc/PID/comm to get the
  419. * name of the task file.
  420. */
  421. if (rdma_is_kernel_res(res)) {
  422. err = nla_put_string(msg, RDMA_NLDEV_ATTR_RES_KERN_NAME,
  423. res->kern_name);
  424. } else {
  425. pid_t pid;
  426. pid = task_pid_vnr(res->task);
  427. /*
  428. * Task is dead and in zombie state.
  429. * There is no need to print PID anymore.
  430. */
  431. if (pid)
  432. /*
  433. * This part is racy, task can be killed and PID will
  434. * be zero right here but it is ok, next query won't
  435. * return PID. We don't promise real-time reflection
  436. * of SW objects.
  437. */
  438. err = nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PID, pid);
  439. }
  440. return err ? -EMSGSIZE : 0;
  441. }
  442. static int fill_res_qp_entry_query(struct sk_buff *msg,
  443. struct rdma_restrack_entry *res,
  444. struct ib_device *dev,
  445. struct ib_qp *qp)
  446. {
  447. struct ib_qp_init_attr qp_init_attr;
  448. struct ib_qp_attr qp_attr;
  449. int ret;
  450. ret = ib_query_qp(qp, &qp_attr, 0, &qp_init_attr);
  451. if (ret)
  452. return ret;
  453. if (qp->qp_type == IB_QPT_RC || qp->qp_type == IB_QPT_UC) {
  454. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_RQPN,
  455. qp_attr.dest_qp_num))
  456. goto err;
  457. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_RQ_PSN,
  458. qp_attr.rq_psn))
  459. goto err;
  460. }
  461. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_SQ_PSN, qp_attr.sq_psn))
  462. goto err;
  463. if (qp->qp_type == IB_QPT_RC || qp->qp_type == IB_QPT_UC ||
  464. qp->qp_type == IB_QPT_XRC_INI || qp->qp_type == IB_QPT_XRC_TGT) {
  465. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_PATH_MIG_STATE,
  466. qp_attr.path_mig_state))
  467. goto err;
  468. }
  469. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_TYPE, qp->qp_type))
  470. goto err;
  471. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_STATE, qp_attr.qp_state))
  472. goto err;
  473. if (dev->ops.fill_res_qp_entry)
  474. return dev->ops.fill_res_qp_entry(msg, qp);
  475. return 0;
  476. err: return -EMSGSIZE;
  477. }
  478. static int fill_res_qp_entry(struct sk_buff *msg, bool has_cap_net_admin,
  479. struct rdma_restrack_entry *res, uint32_t port)
  480. {
  481. struct ib_qp *qp = container_of(res, struct ib_qp, res);
  482. struct ib_device *dev = qp->device;
  483. int ret;
  484. if (port && port != qp->port)
  485. return -EAGAIN;
  486. /* In create_qp() port is not set yet */
  487. if (qp->port && nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, qp->port))
  488. return -EMSGSIZE;
  489. ret = nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, qp->qp_num);
  490. if (ret)
  491. return -EMSGSIZE;
  492. if (!rdma_is_kernel_res(res) &&
  493. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PDN, qp->pd->res.id))
  494. return -EMSGSIZE;
  495. ret = fill_res_name_pid(msg, res);
  496. if (ret)
  497. return -EMSGSIZE;
  498. return fill_res_qp_entry_query(msg, res, dev, qp);
  499. }
  500. static int fill_res_qp_raw_entry(struct sk_buff *msg, bool has_cap_net_admin,
  501. struct rdma_restrack_entry *res, uint32_t port)
  502. {
  503. struct ib_qp *qp = container_of(res, struct ib_qp, res);
  504. struct ib_device *dev = qp->device;
  505. if (port && port != qp->port)
  506. return -EAGAIN;
  507. if (!dev->ops.fill_res_qp_entry_raw)
  508. return -EINVAL;
  509. return dev->ops.fill_res_qp_entry_raw(msg, qp);
  510. }
  511. static int fill_res_cm_id_entry(struct sk_buff *msg, bool has_cap_net_admin,
  512. struct rdma_restrack_entry *res, uint32_t port)
  513. {
  514. struct rdma_id_private *id_priv =
  515. container_of(res, struct rdma_id_private, res);
  516. struct ib_device *dev = id_priv->id.device;
  517. struct rdma_cm_id *cm_id = &id_priv->id;
  518. if (port && port != cm_id->port_num)
  519. return -EAGAIN;
  520. if (cm_id->port_num &&
  521. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, cm_id->port_num))
  522. goto err;
  523. if (id_priv->qp_num) {
  524. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, id_priv->qp_num))
  525. goto err;
  526. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_TYPE, cm_id->qp_type))
  527. goto err;
  528. }
  529. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PS, cm_id->ps))
  530. goto err;
  531. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_STATE, id_priv->state))
  532. goto err;
  533. if (cm_id->route.addr.src_addr.ss_family &&
  534. nla_put(msg, RDMA_NLDEV_ATTR_RES_SRC_ADDR,
  535. sizeof(cm_id->route.addr.src_addr),
  536. &cm_id->route.addr.src_addr))
  537. goto err;
  538. if (cm_id->route.addr.dst_addr.ss_family &&
  539. nla_put(msg, RDMA_NLDEV_ATTR_RES_DST_ADDR,
  540. sizeof(cm_id->route.addr.dst_addr),
  541. &cm_id->route.addr.dst_addr))
  542. goto err;
  543. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CM_IDN, res->id))
  544. goto err;
  545. if (fill_res_name_pid(msg, res))
  546. goto err;
  547. if (dev->ops.fill_res_cm_id_entry)
  548. return dev->ops.fill_res_cm_id_entry(msg, cm_id);
  549. return 0;
  550. err: return -EMSGSIZE;
  551. }
  552. static int fill_res_cq_entry(struct sk_buff *msg, bool has_cap_net_admin,
  553. struct rdma_restrack_entry *res, uint32_t port)
  554. {
  555. struct ib_cq *cq = container_of(res, struct ib_cq, res);
  556. struct ib_device *dev = cq->device;
  557. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CQE, cq->cqe))
  558. return -EMSGSIZE;
  559. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_RES_USECNT,
  560. atomic_read(&cq->usecnt), RDMA_NLDEV_ATTR_PAD))
  561. return -EMSGSIZE;
  562. /* Poll context is only valid for kernel CQs */
  563. if (rdma_is_kernel_res(res) &&
  564. nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_POLL_CTX, cq->poll_ctx))
  565. return -EMSGSIZE;
  566. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_DEV_DIM, (cq->dim != NULL)))
  567. return -EMSGSIZE;
  568. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CQN, res->id))
  569. return -EMSGSIZE;
  570. if (!rdma_is_kernel_res(res) &&
  571. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CTXN,
  572. cq->uobject->uevent.uobject.context->res.id))
  573. return -EMSGSIZE;
  574. if (fill_res_name_pid(msg, res))
  575. return -EMSGSIZE;
  576. return (dev->ops.fill_res_cq_entry) ?
  577. dev->ops.fill_res_cq_entry(msg, cq) : 0;
  578. }
  579. static int fill_res_cq_raw_entry(struct sk_buff *msg, bool has_cap_net_admin,
  580. struct rdma_restrack_entry *res, uint32_t port)
  581. {
  582. struct ib_cq *cq = container_of(res, struct ib_cq, res);
  583. struct ib_device *dev = cq->device;
  584. if (!dev->ops.fill_res_cq_entry_raw)
  585. return -EINVAL;
  586. return dev->ops.fill_res_cq_entry_raw(msg, cq);
  587. }
  588. static int fill_res_mr_entry(struct sk_buff *msg, bool has_cap_net_admin,
  589. struct rdma_restrack_entry *res, uint32_t port)
  590. {
  591. struct ib_mr *mr = container_of(res, struct ib_mr, res);
  592. struct ib_device *dev = mr->pd->device;
  593. if (has_cap_net_admin) {
  594. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_RKEY, mr->rkey))
  595. return -EMSGSIZE;
  596. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LKEY, mr->lkey))
  597. return -EMSGSIZE;
  598. }
  599. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_RES_MRLEN, mr->length,
  600. RDMA_NLDEV_ATTR_PAD))
  601. return -EMSGSIZE;
  602. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_MRN, res->id))
  603. return -EMSGSIZE;
  604. if (!rdma_is_kernel_res(res) &&
  605. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PDN, mr->pd->res.id))
  606. return -EMSGSIZE;
  607. if (fill_res_name_pid(msg, res))
  608. return -EMSGSIZE;
  609. return (dev->ops.fill_res_mr_entry) ?
  610. dev->ops.fill_res_mr_entry(msg, mr) :
  611. 0;
  612. }
  613. static int fill_res_mr_raw_entry(struct sk_buff *msg, bool has_cap_net_admin,
  614. struct rdma_restrack_entry *res, uint32_t port)
  615. {
  616. struct ib_mr *mr = container_of(res, struct ib_mr, res);
  617. struct ib_device *dev = mr->pd->device;
  618. if (!dev->ops.fill_res_mr_entry_raw)
  619. return -EINVAL;
  620. return dev->ops.fill_res_mr_entry_raw(msg, mr);
  621. }
  622. static int fill_res_pd_entry(struct sk_buff *msg, bool has_cap_net_admin,
  623. struct rdma_restrack_entry *res, uint32_t port)
  624. {
  625. struct ib_pd *pd = container_of(res, struct ib_pd, res);
  626. if (has_cap_net_admin) {
  627. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LOCAL_DMA_LKEY,
  628. pd->local_dma_lkey))
  629. goto err;
  630. if ((pd->flags & IB_PD_UNSAFE_GLOBAL_RKEY) &&
  631. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_UNSAFE_GLOBAL_RKEY,
  632. pd->unsafe_global_rkey))
  633. goto err;
  634. }
  635. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_RES_USECNT,
  636. atomic_read(&pd->usecnt), RDMA_NLDEV_ATTR_PAD))
  637. goto err;
  638. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PDN, res->id))
  639. goto err;
  640. if (!rdma_is_kernel_res(res) &&
  641. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CTXN,
  642. pd->uobject->context->res.id))
  643. goto err;
  644. return fill_res_name_pid(msg, res);
  645. err: return -EMSGSIZE;
  646. }
  647. static int fill_res_ctx_entry(struct sk_buff *msg, bool has_cap_net_admin,
  648. struct rdma_restrack_entry *res, uint32_t port)
  649. {
  650. struct ib_ucontext *ctx = container_of(res, struct ib_ucontext, res);
  651. if (rdma_is_kernel_res(res))
  652. return 0;
  653. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CTXN, ctx->res.id))
  654. return -EMSGSIZE;
  655. return fill_res_name_pid(msg, res);
  656. }
  657. static int fill_res_range_qp_entry(struct sk_buff *msg, uint32_t min_range,
  658. uint32_t max_range)
  659. {
  660. struct nlattr *entry_attr;
  661. if (!min_range)
  662. return 0;
  663. entry_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_RES_QP_ENTRY);
  664. if (!entry_attr)
  665. return -EMSGSIZE;
  666. if (min_range == max_range) {
  667. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, min_range))
  668. goto err;
  669. } else {
  670. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_MIN_RANGE, min_range))
  671. goto err;
  672. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_MAX_RANGE, max_range))
  673. goto err;
  674. }
  675. nla_nest_end(msg, entry_attr);
  676. return 0;
  677. err:
  678. nla_nest_cancel(msg, entry_attr);
  679. return -EMSGSIZE;
  680. }
  681. static int fill_res_srq_qps(struct sk_buff *msg, struct ib_srq *srq)
  682. {
  683. uint32_t min_range = 0, prev = 0;
  684. struct rdma_restrack_entry *res;
  685. struct rdma_restrack_root *rt;
  686. struct nlattr *table_attr;
  687. struct ib_qp *qp = NULL;
  688. unsigned long id = 0;
  689. table_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_RES_QP);
  690. if (!table_attr)
  691. return -EMSGSIZE;
  692. rt = &srq->device->res[RDMA_RESTRACK_QP];
  693. xa_lock(&rt->xa);
  694. xa_for_each(&rt->xa, id, res) {
  695. if (!rdma_restrack_get(res))
  696. continue;
  697. qp = container_of(res, struct ib_qp, res);
  698. if (!qp->srq || (qp->srq->res.id != srq->res.id)) {
  699. rdma_restrack_put(res);
  700. continue;
  701. }
  702. if (qp->qp_num < prev)
  703. /* qp_num should be ascending */
  704. goto err_loop;
  705. if (min_range == 0) {
  706. min_range = qp->qp_num;
  707. } else if (qp->qp_num > (prev + 1)) {
  708. if (fill_res_range_qp_entry(msg, min_range, prev))
  709. goto err_loop;
  710. min_range = qp->qp_num;
  711. }
  712. prev = qp->qp_num;
  713. rdma_restrack_put(res);
  714. }
  715. xa_unlock(&rt->xa);
  716. if (fill_res_range_qp_entry(msg, min_range, prev))
  717. goto err;
  718. nla_nest_end(msg, table_attr);
  719. return 0;
  720. err_loop:
  721. rdma_restrack_put(res);
  722. xa_unlock(&rt->xa);
  723. err:
  724. nla_nest_cancel(msg, table_attr);
  725. return -EMSGSIZE;
  726. }
  727. static int fill_res_srq_entry(struct sk_buff *msg, bool has_cap_net_admin,
  728. struct rdma_restrack_entry *res, uint32_t port)
  729. {
  730. struct ib_srq *srq = container_of(res, struct ib_srq, res);
  731. struct ib_device *dev = srq->device;
  732. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_SRQN, srq->res.id))
  733. goto err;
  734. if (nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_TYPE, srq->srq_type))
  735. goto err;
  736. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_PDN, srq->pd->res.id))
  737. goto err;
  738. if (ib_srq_has_cq(srq->srq_type)) {
  739. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_CQN,
  740. srq->ext.cq->res.id))
  741. goto err;
  742. }
  743. if (fill_res_srq_qps(msg, srq))
  744. goto err;
  745. if (fill_res_name_pid(msg, res))
  746. goto err;
  747. if (dev->ops.fill_res_srq_entry)
  748. return dev->ops.fill_res_srq_entry(msg, srq);
  749. return 0;
  750. err:
  751. return -EMSGSIZE;
  752. }
  753. static int fill_res_srq_raw_entry(struct sk_buff *msg, bool has_cap_net_admin,
  754. struct rdma_restrack_entry *res, uint32_t port)
  755. {
  756. struct ib_srq *srq = container_of(res, struct ib_srq, res);
  757. struct ib_device *dev = srq->device;
  758. if (!dev->ops.fill_res_srq_entry_raw)
  759. return -EINVAL;
  760. return dev->ops.fill_res_srq_entry_raw(msg, srq);
  761. }
  762. static int fill_stat_counter_mode(struct sk_buff *msg,
  763. struct rdma_counter *counter)
  764. {
  765. struct rdma_counter_mode *m = &counter->mode;
  766. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_MODE, m->mode))
  767. return -EMSGSIZE;
  768. if (m->mode == RDMA_COUNTER_MODE_AUTO) {
  769. if ((m->mask & RDMA_COUNTER_MASK_QP_TYPE) &&
  770. nla_put_u8(msg, RDMA_NLDEV_ATTR_RES_TYPE, m->param.qp_type))
  771. return -EMSGSIZE;
  772. if ((m->mask & RDMA_COUNTER_MASK_PID) &&
  773. fill_res_name_pid(msg, &counter->res))
  774. return -EMSGSIZE;
  775. }
  776. return 0;
  777. }
  778. static int fill_stat_counter_qp_entry(struct sk_buff *msg, u32 qpn)
  779. {
  780. struct nlattr *entry_attr;
  781. entry_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_RES_QP_ENTRY);
  782. if (!entry_attr)
  783. return -EMSGSIZE;
  784. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, qpn))
  785. goto err;
  786. nla_nest_end(msg, entry_attr);
  787. return 0;
  788. err:
  789. nla_nest_cancel(msg, entry_attr);
  790. return -EMSGSIZE;
  791. }
  792. static int fill_stat_counter_qps(struct sk_buff *msg,
  793. struct rdma_counter *counter)
  794. {
  795. struct rdma_restrack_entry *res;
  796. struct rdma_restrack_root *rt;
  797. struct nlattr *table_attr;
  798. struct ib_qp *qp = NULL;
  799. unsigned long id = 0;
  800. int ret = 0;
  801. table_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_RES_QP);
  802. if (!table_attr)
  803. return -EMSGSIZE;
  804. rt = &counter->device->res[RDMA_RESTRACK_QP];
  805. xa_lock(&rt->xa);
  806. xa_for_each(&rt->xa, id, res) {
  807. qp = container_of(res, struct ib_qp, res);
  808. if (!qp->counter || (qp->counter->id != counter->id))
  809. continue;
  810. ret = fill_stat_counter_qp_entry(msg, qp->qp_num);
  811. if (ret)
  812. goto err;
  813. }
  814. xa_unlock(&rt->xa);
  815. nla_nest_end(msg, table_attr);
  816. return 0;
  817. err:
  818. xa_unlock(&rt->xa);
  819. nla_nest_cancel(msg, table_attr);
  820. return ret;
  821. }
  822. int rdma_nl_stat_hwcounter_entry(struct sk_buff *msg, const char *name,
  823. u64 value)
  824. {
  825. struct nlattr *entry_attr;
  826. entry_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY);
  827. if (!entry_attr)
  828. return -EMSGSIZE;
  829. if (nla_put_string(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY_NAME,
  830. name))
  831. goto err;
  832. if (nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY_VALUE,
  833. value, RDMA_NLDEV_ATTR_PAD))
  834. goto err;
  835. nla_nest_end(msg, entry_attr);
  836. return 0;
  837. err:
  838. nla_nest_cancel(msg, entry_attr);
  839. return -EMSGSIZE;
  840. }
  841. EXPORT_SYMBOL(rdma_nl_stat_hwcounter_entry);
  842. static int fill_stat_mr_entry(struct sk_buff *msg, bool has_cap_net_admin,
  843. struct rdma_restrack_entry *res, uint32_t port)
  844. {
  845. struct ib_mr *mr = container_of(res, struct ib_mr, res);
  846. struct ib_device *dev = mr->pd->device;
  847. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_MRN, res->id))
  848. goto err;
  849. if (dev->ops.fill_stat_mr_entry)
  850. return dev->ops.fill_stat_mr_entry(msg, mr);
  851. return 0;
  852. err:
  853. return -EMSGSIZE;
  854. }
  855. static int fill_stat_counter_hwcounters(struct sk_buff *msg,
  856. struct rdma_counter *counter)
  857. {
  858. struct rdma_hw_stats *st = counter->stats;
  859. struct nlattr *table_attr;
  860. int i;
  861. table_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTERS);
  862. if (!table_attr)
  863. return -EMSGSIZE;
  864. mutex_lock(&st->lock);
  865. for (i = 0; i < st->num_counters; i++) {
  866. if (test_bit(i, st->is_disabled))
  867. continue;
  868. if (rdma_nl_stat_hwcounter_entry(msg, st->descs[i].name,
  869. st->value[i]))
  870. goto err;
  871. }
  872. mutex_unlock(&st->lock);
  873. nla_nest_end(msg, table_attr);
  874. return 0;
  875. err:
  876. mutex_unlock(&st->lock);
  877. nla_nest_cancel(msg, table_attr);
  878. return -EMSGSIZE;
  879. }
  880. static int fill_res_counter_entry(struct sk_buff *msg, bool has_cap_net_admin,
  881. struct rdma_restrack_entry *res,
  882. uint32_t port)
  883. {
  884. struct rdma_counter *counter =
  885. container_of(res, struct rdma_counter, res);
  886. if (port && port != counter->port)
  887. return -EAGAIN;
  888. /* Dump it even query failed */
  889. rdma_counter_query_stats(counter);
  890. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, counter->port) ||
  891. nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_COUNTER_ID, counter->id) ||
  892. fill_stat_counter_mode(msg, counter) ||
  893. fill_stat_counter_qps(msg, counter) ||
  894. fill_stat_counter_hwcounters(msg, counter))
  895. return -EMSGSIZE;
  896. return 0;
  897. }
  898. static int nldev_get_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  899. struct netlink_ext_ack *extack)
  900. {
  901. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  902. struct ib_device *device;
  903. struct sk_buff *msg;
  904. u32 index;
  905. int err;
  906. err = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  907. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  908. if (err || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  909. return -EINVAL;
  910. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  911. device = ib_device_get_by_index(sock_net(skb->sk), index);
  912. if (!device)
  913. return -EINVAL;
  914. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  915. if (!msg) {
  916. err = -ENOMEM;
  917. goto err;
  918. }
  919. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  920. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_GET),
  921. 0, 0);
  922. if (!nlh) {
  923. err = -EMSGSIZE;
  924. goto err_free;
  925. }
  926. err = fill_dev_info(msg, device);
  927. if (err)
  928. goto err_free;
  929. nlmsg_end(msg, nlh);
  930. ib_device_put(device);
  931. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  932. err_free:
  933. nlmsg_free(msg);
  934. err:
  935. ib_device_put(device);
  936. return err;
  937. }
  938. static int nldev_set_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  939. struct netlink_ext_ack *extack)
  940. {
  941. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  942. struct ib_device *device;
  943. u32 index;
  944. int err;
  945. err = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  946. nldev_policy, extack);
  947. if (err || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  948. return -EINVAL;
  949. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  950. device = ib_device_get_by_index(sock_net(skb->sk), index);
  951. if (!device)
  952. return -EINVAL;
  953. if (tb[RDMA_NLDEV_ATTR_DEV_NAME]) {
  954. char name[IB_DEVICE_NAME_MAX] = {};
  955. nla_strscpy(name, tb[RDMA_NLDEV_ATTR_DEV_NAME],
  956. IB_DEVICE_NAME_MAX);
  957. if (strlen(name) == 0) {
  958. err = -EINVAL;
  959. goto done;
  960. }
  961. err = ib_device_rename(device, name);
  962. goto done;
  963. }
  964. if (tb[RDMA_NLDEV_NET_NS_FD]) {
  965. u32 ns_fd;
  966. ns_fd = nla_get_u32(tb[RDMA_NLDEV_NET_NS_FD]);
  967. err = ib_device_set_netns_put(skb, device, ns_fd);
  968. goto put_done;
  969. }
  970. if (tb[RDMA_NLDEV_ATTR_DEV_DIM]) {
  971. u8 use_dim;
  972. use_dim = nla_get_u8(tb[RDMA_NLDEV_ATTR_DEV_DIM]);
  973. err = ib_device_set_dim(device, use_dim);
  974. goto done;
  975. }
  976. done:
  977. ib_device_put(device);
  978. put_done:
  979. return err;
  980. }
  981. static int _nldev_get_dumpit(struct ib_device *device,
  982. struct sk_buff *skb,
  983. struct netlink_callback *cb,
  984. unsigned int idx)
  985. {
  986. int start = cb->args[0];
  987. struct nlmsghdr *nlh;
  988. if (idx < start)
  989. return 0;
  990. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
  991. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_GET),
  992. 0, NLM_F_MULTI);
  993. if (!nlh || fill_dev_info(skb, device)) {
  994. nlmsg_cancel(skb, nlh);
  995. goto out;
  996. }
  997. nlmsg_end(skb, nlh);
  998. idx++;
  999. out: cb->args[0] = idx;
  1000. return skb->len;
  1001. }
  1002. static int nldev_get_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
  1003. {
  1004. /*
  1005. * There is no need to take lock, because
  1006. * we are relying on ib_core's locking.
  1007. */
  1008. return ib_enum_all_devs(_nldev_get_dumpit, skb, cb);
  1009. }
  1010. static int nldev_port_get_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1011. struct netlink_ext_ack *extack)
  1012. {
  1013. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1014. struct ib_device *device;
  1015. struct sk_buff *msg;
  1016. u32 index;
  1017. u32 port;
  1018. int err;
  1019. err = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1020. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  1021. if (err ||
  1022. !tb[RDMA_NLDEV_ATTR_DEV_INDEX] ||
  1023. !tb[RDMA_NLDEV_ATTR_PORT_INDEX])
  1024. return -EINVAL;
  1025. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1026. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1027. if (!device)
  1028. return -EINVAL;
  1029. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1030. if (!rdma_is_port_valid(device, port)) {
  1031. err = -EINVAL;
  1032. goto err;
  1033. }
  1034. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1035. if (!msg) {
  1036. err = -ENOMEM;
  1037. goto err;
  1038. }
  1039. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1040. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_GET),
  1041. 0, 0);
  1042. if (!nlh) {
  1043. err = -EMSGSIZE;
  1044. goto err_free;
  1045. }
  1046. err = fill_port_info(msg, device, port, sock_net(skb->sk));
  1047. if (err)
  1048. goto err_free;
  1049. nlmsg_end(msg, nlh);
  1050. ib_device_put(device);
  1051. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1052. err_free:
  1053. nlmsg_free(msg);
  1054. err:
  1055. ib_device_put(device);
  1056. return err;
  1057. }
  1058. static int nldev_port_get_dumpit(struct sk_buff *skb,
  1059. struct netlink_callback *cb)
  1060. {
  1061. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1062. struct ib_device *device;
  1063. int start = cb->args[0];
  1064. struct nlmsghdr *nlh;
  1065. u32 idx = 0;
  1066. u32 ifindex;
  1067. int err;
  1068. unsigned int p;
  1069. err = __nlmsg_parse(cb->nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1070. nldev_policy, NL_VALIDATE_LIBERAL, NULL);
  1071. if (err || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  1072. return -EINVAL;
  1073. ifindex = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1074. device = ib_device_get_by_index(sock_net(skb->sk), ifindex);
  1075. if (!device)
  1076. return -EINVAL;
  1077. rdma_for_each_port (device, p) {
  1078. /*
  1079. * The dumpit function returns all information from specific
  1080. * index. This specific index is taken from the netlink
  1081. * messages request sent by user and it is available
  1082. * in cb->args[0].
  1083. *
  1084. * Usually, the user doesn't fill this field and it causes
  1085. * to return everything.
  1086. *
  1087. */
  1088. if (idx < start) {
  1089. idx++;
  1090. continue;
  1091. }
  1092. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid,
  1093. cb->nlh->nlmsg_seq,
  1094. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1095. RDMA_NLDEV_CMD_PORT_GET),
  1096. 0, NLM_F_MULTI);
  1097. if (!nlh || fill_port_info(skb, device, p, sock_net(skb->sk))) {
  1098. nlmsg_cancel(skb, nlh);
  1099. goto out;
  1100. }
  1101. idx++;
  1102. nlmsg_end(skb, nlh);
  1103. }
  1104. out:
  1105. ib_device_put(device);
  1106. cb->args[0] = idx;
  1107. return skb->len;
  1108. }
  1109. static int nldev_res_get_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1110. struct netlink_ext_ack *extack)
  1111. {
  1112. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1113. bool show_details = false;
  1114. struct ib_device *device;
  1115. struct sk_buff *msg;
  1116. u32 index;
  1117. int ret;
  1118. ret = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1119. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  1120. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  1121. return -EINVAL;
  1122. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1123. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1124. if (!device)
  1125. return -EINVAL;
  1126. if (tb[RDMA_NLDEV_ATTR_DRIVER_DETAILS])
  1127. show_details = nla_get_u8(tb[RDMA_NLDEV_ATTR_DRIVER_DETAILS]);
  1128. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1129. if (!msg) {
  1130. ret = -ENOMEM;
  1131. goto err;
  1132. }
  1133. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1134. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_RES_GET),
  1135. 0, 0);
  1136. if (!nlh) {
  1137. ret = -EMSGSIZE;
  1138. goto err_free;
  1139. }
  1140. ret = fill_res_info(msg, device, show_details);
  1141. if (ret)
  1142. goto err_free;
  1143. nlmsg_end(msg, nlh);
  1144. ib_device_put(device);
  1145. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1146. err_free:
  1147. nlmsg_free(msg);
  1148. err:
  1149. ib_device_put(device);
  1150. return ret;
  1151. }
  1152. static int _nldev_res_get_dumpit(struct ib_device *device,
  1153. struct sk_buff *skb,
  1154. struct netlink_callback *cb,
  1155. unsigned int idx)
  1156. {
  1157. int start = cb->args[0];
  1158. struct nlmsghdr *nlh;
  1159. if (idx < start)
  1160. return 0;
  1161. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
  1162. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_RES_GET),
  1163. 0, NLM_F_MULTI);
  1164. if (!nlh || fill_res_info(skb, device, false)) {
  1165. nlmsg_cancel(skb, nlh);
  1166. goto out;
  1167. }
  1168. nlmsg_end(skb, nlh);
  1169. idx++;
  1170. out:
  1171. cb->args[0] = idx;
  1172. return skb->len;
  1173. }
  1174. static int nldev_res_get_dumpit(struct sk_buff *skb,
  1175. struct netlink_callback *cb)
  1176. {
  1177. return ib_enum_all_devs(_nldev_res_get_dumpit, skb, cb);
  1178. }
  1179. struct nldev_fill_res_entry {
  1180. enum rdma_nldev_attr nldev_attr;
  1181. u8 flags;
  1182. u32 entry;
  1183. u32 id;
  1184. };
  1185. enum nldev_res_flags {
  1186. NLDEV_PER_DEV = 1 << 0,
  1187. };
  1188. static const struct nldev_fill_res_entry fill_entries[RDMA_RESTRACK_MAX] = {
  1189. [RDMA_RESTRACK_QP] = {
  1190. .nldev_attr = RDMA_NLDEV_ATTR_RES_QP,
  1191. .entry = RDMA_NLDEV_ATTR_RES_QP_ENTRY,
  1192. .id = RDMA_NLDEV_ATTR_RES_LQPN,
  1193. },
  1194. [RDMA_RESTRACK_CM_ID] = {
  1195. .nldev_attr = RDMA_NLDEV_ATTR_RES_CM_ID,
  1196. .entry = RDMA_NLDEV_ATTR_RES_CM_ID_ENTRY,
  1197. .id = RDMA_NLDEV_ATTR_RES_CM_IDN,
  1198. },
  1199. [RDMA_RESTRACK_CQ] = {
  1200. .nldev_attr = RDMA_NLDEV_ATTR_RES_CQ,
  1201. .flags = NLDEV_PER_DEV,
  1202. .entry = RDMA_NLDEV_ATTR_RES_CQ_ENTRY,
  1203. .id = RDMA_NLDEV_ATTR_RES_CQN,
  1204. },
  1205. [RDMA_RESTRACK_MR] = {
  1206. .nldev_attr = RDMA_NLDEV_ATTR_RES_MR,
  1207. .flags = NLDEV_PER_DEV,
  1208. .entry = RDMA_NLDEV_ATTR_RES_MR_ENTRY,
  1209. .id = RDMA_NLDEV_ATTR_RES_MRN,
  1210. },
  1211. [RDMA_RESTRACK_PD] = {
  1212. .nldev_attr = RDMA_NLDEV_ATTR_RES_PD,
  1213. .flags = NLDEV_PER_DEV,
  1214. .entry = RDMA_NLDEV_ATTR_RES_PD_ENTRY,
  1215. .id = RDMA_NLDEV_ATTR_RES_PDN,
  1216. },
  1217. [RDMA_RESTRACK_COUNTER] = {
  1218. .nldev_attr = RDMA_NLDEV_ATTR_STAT_COUNTER,
  1219. .entry = RDMA_NLDEV_ATTR_STAT_COUNTER_ENTRY,
  1220. .id = RDMA_NLDEV_ATTR_STAT_COUNTER_ID,
  1221. },
  1222. [RDMA_RESTRACK_CTX] = {
  1223. .nldev_attr = RDMA_NLDEV_ATTR_RES_CTX,
  1224. .flags = NLDEV_PER_DEV,
  1225. .entry = RDMA_NLDEV_ATTR_RES_CTX_ENTRY,
  1226. .id = RDMA_NLDEV_ATTR_RES_CTXN,
  1227. },
  1228. [RDMA_RESTRACK_SRQ] = {
  1229. .nldev_attr = RDMA_NLDEV_ATTR_RES_SRQ,
  1230. .flags = NLDEV_PER_DEV,
  1231. .entry = RDMA_NLDEV_ATTR_RES_SRQ_ENTRY,
  1232. .id = RDMA_NLDEV_ATTR_RES_SRQN,
  1233. },
  1234. };
  1235. static noinline_for_stack int
  1236. res_get_common_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1237. struct netlink_ext_ack *extack,
  1238. enum rdma_restrack_type res_type,
  1239. res_fill_func_t fill_func)
  1240. {
  1241. const struct nldev_fill_res_entry *fe = &fill_entries[res_type];
  1242. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1243. struct rdma_restrack_entry *res;
  1244. struct ib_device *device;
  1245. u32 index, id, port = 0;
  1246. bool has_cap_net_admin;
  1247. struct sk_buff *msg;
  1248. int ret;
  1249. ret = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1250. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  1251. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX] || !fe->id || !tb[fe->id])
  1252. return -EINVAL;
  1253. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1254. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1255. if (!device)
  1256. return -EINVAL;
  1257. if (tb[RDMA_NLDEV_ATTR_PORT_INDEX]) {
  1258. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1259. if (!rdma_is_port_valid(device, port)) {
  1260. ret = -EINVAL;
  1261. goto err;
  1262. }
  1263. }
  1264. if ((port && fe->flags & NLDEV_PER_DEV) ||
  1265. (!port && ~fe->flags & NLDEV_PER_DEV)) {
  1266. ret = -EINVAL;
  1267. goto err;
  1268. }
  1269. id = nla_get_u32(tb[fe->id]);
  1270. res = rdma_restrack_get_byid(device, res_type, id);
  1271. if (IS_ERR(res)) {
  1272. ret = PTR_ERR(res);
  1273. goto err;
  1274. }
  1275. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1276. if (!msg) {
  1277. ret = -ENOMEM;
  1278. goto err_get;
  1279. }
  1280. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1281. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1282. RDMA_NL_GET_OP(nlh->nlmsg_type)),
  1283. 0, 0);
  1284. if (!nlh || fill_nldev_handle(msg, device)) {
  1285. ret = -EMSGSIZE;
  1286. goto err_free;
  1287. }
  1288. has_cap_net_admin = netlink_capable(skb, CAP_NET_ADMIN);
  1289. ret = fill_func(msg, has_cap_net_admin, res, port);
  1290. if (ret)
  1291. goto err_free;
  1292. rdma_restrack_put(res);
  1293. nlmsg_end(msg, nlh);
  1294. ib_device_put(device);
  1295. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1296. err_free:
  1297. nlmsg_free(msg);
  1298. err_get:
  1299. rdma_restrack_put(res);
  1300. err:
  1301. ib_device_put(device);
  1302. return ret;
  1303. }
  1304. static int res_get_common_dumpit(struct sk_buff *skb,
  1305. struct netlink_callback *cb,
  1306. enum rdma_restrack_type res_type,
  1307. res_fill_func_t fill_func)
  1308. {
  1309. const struct nldev_fill_res_entry *fe = &fill_entries[res_type];
  1310. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1311. struct rdma_restrack_entry *res;
  1312. struct rdma_restrack_root *rt;
  1313. int err, ret = 0, idx = 0;
  1314. bool show_details = false;
  1315. struct nlattr *table_attr;
  1316. struct nlattr *entry_attr;
  1317. struct ib_device *device;
  1318. int start = cb->args[0];
  1319. bool has_cap_net_admin;
  1320. struct nlmsghdr *nlh;
  1321. unsigned long id;
  1322. u32 index, port = 0;
  1323. bool filled = false;
  1324. err = __nlmsg_parse(cb->nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1325. nldev_policy, NL_VALIDATE_LIBERAL, NULL);
  1326. /*
  1327. * Right now, we are expecting the device index to get res information,
  1328. * but it is possible to extend this code to return all devices in
  1329. * one shot by checking the existence of RDMA_NLDEV_ATTR_DEV_INDEX.
  1330. * if it doesn't exist, we will iterate over all devices.
  1331. *
  1332. * But it is not needed for now.
  1333. */
  1334. if (err || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  1335. return -EINVAL;
  1336. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1337. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1338. if (!device)
  1339. return -EINVAL;
  1340. if (tb[RDMA_NLDEV_ATTR_DRIVER_DETAILS])
  1341. show_details = nla_get_u8(tb[RDMA_NLDEV_ATTR_DRIVER_DETAILS]);
  1342. /*
  1343. * If no PORT_INDEX is supplied, we will return all QPs from that device
  1344. */
  1345. if (tb[RDMA_NLDEV_ATTR_PORT_INDEX]) {
  1346. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1347. if (!rdma_is_port_valid(device, port)) {
  1348. ret = -EINVAL;
  1349. goto err_index;
  1350. }
  1351. }
  1352. nlh = nlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
  1353. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1354. RDMA_NL_GET_OP(cb->nlh->nlmsg_type)),
  1355. 0, NLM_F_MULTI);
  1356. if (!nlh || fill_nldev_handle(skb, device)) {
  1357. ret = -EMSGSIZE;
  1358. goto err;
  1359. }
  1360. table_attr = nla_nest_start_noflag(skb, fe->nldev_attr);
  1361. if (!table_attr) {
  1362. ret = -EMSGSIZE;
  1363. goto err;
  1364. }
  1365. has_cap_net_admin = netlink_capable(cb->skb, CAP_NET_ADMIN);
  1366. rt = &device->res[res_type];
  1367. xa_lock(&rt->xa);
  1368. /*
  1369. * FIXME: if the skip ahead is something common this loop should
  1370. * use xas_for_each & xas_pause to optimize, we can have a lot of
  1371. * objects.
  1372. */
  1373. xa_for_each(&rt->xa, id, res) {
  1374. if (xa_get_mark(&rt->xa, res->id, RESTRACK_DD) && !show_details)
  1375. goto next;
  1376. if (idx < start || !rdma_restrack_get(res))
  1377. goto next;
  1378. xa_unlock(&rt->xa);
  1379. filled = true;
  1380. entry_attr = nla_nest_start_noflag(skb, fe->entry);
  1381. if (!entry_attr) {
  1382. ret = -EMSGSIZE;
  1383. rdma_restrack_put(res);
  1384. goto msg_full;
  1385. }
  1386. ret = fill_func(skb, has_cap_net_admin, res, port);
  1387. rdma_restrack_put(res);
  1388. if (ret) {
  1389. nla_nest_cancel(skb, entry_attr);
  1390. if (ret == -EMSGSIZE)
  1391. goto msg_full;
  1392. if (ret == -EAGAIN)
  1393. goto again;
  1394. goto res_err;
  1395. }
  1396. nla_nest_end(skb, entry_attr);
  1397. again: xa_lock(&rt->xa);
  1398. next: idx++;
  1399. }
  1400. xa_unlock(&rt->xa);
  1401. msg_full:
  1402. nla_nest_end(skb, table_attr);
  1403. nlmsg_end(skb, nlh);
  1404. cb->args[0] = idx;
  1405. /*
  1406. * No more entries to fill, cancel the message and
  1407. * return 0 to mark end of dumpit.
  1408. */
  1409. if (!filled)
  1410. goto err;
  1411. ib_device_put(device);
  1412. return skb->len;
  1413. res_err:
  1414. nla_nest_cancel(skb, table_attr);
  1415. err:
  1416. nlmsg_cancel(skb, nlh);
  1417. err_index:
  1418. ib_device_put(device);
  1419. return ret;
  1420. }
  1421. #define RES_GET_FUNCS(name, type) \
  1422. static int nldev_res_get_##name##_dumpit(struct sk_buff *skb, \
  1423. struct netlink_callback *cb) \
  1424. { \
  1425. return res_get_common_dumpit(skb, cb, type, \
  1426. fill_res_##name##_entry); \
  1427. } \
  1428. static int nldev_res_get_##name##_doit(struct sk_buff *skb, \
  1429. struct nlmsghdr *nlh, \
  1430. struct netlink_ext_ack *extack) \
  1431. { \
  1432. return res_get_common_doit(skb, nlh, extack, type, \
  1433. fill_res_##name##_entry); \
  1434. }
  1435. RES_GET_FUNCS(qp, RDMA_RESTRACK_QP);
  1436. RES_GET_FUNCS(qp_raw, RDMA_RESTRACK_QP);
  1437. RES_GET_FUNCS(cm_id, RDMA_RESTRACK_CM_ID);
  1438. RES_GET_FUNCS(cq, RDMA_RESTRACK_CQ);
  1439. RES_GET_FUNCS(cq_raw, RDMA_RESTRACK_CQ);
  1440. RES_GET_FUNCS(pd, RDMA_RESTRACK_PD);
  1441. RES_GET_FUNCS(mr, RDMA_RESTRACK_MR);
  1442. RES_GET_FUNCS(mr_raw, RDMA_RESTRACK_MR);
  1443. RES_GET_FUNCS(counter, RDMA_RESTRACK_COUNTER);
  1444. RES_GET_FUNCS(ctx, RDMA_RESTRACK_CTX);
  1445. RES_GET_FUNCS(srq, RDMA_RESTRACK_SRQ);
  1446. RES_GET_FUNCS(srq_raw, RDMA_RESTRACK_SRQ);
  1447. static LIST_HEAD(link_ops);
  1448. static DECLARE_RWSEM(link_ops_rwsem);
  1449. static const struct rdma_link_ops *link_ops_get(const char *type)
  1450. {
  1451. const struct rdma_link_ops *ops;
  1452. list_for_each_entry(ops, &link_ops, list) {
  1453. if (!strcmp(ops->type, type))
  1454. goto out;
  1455. }
  1456. ops = NULL;
  1457. out:
  1458. return ops;
  1459. }
  1460. void rdma_link_register(struct rdma_link_ops *ops)
  1461. {
  1462. down_write(&link_ops_rwsem);
  1463. if (WARN_ON_ONCE(link_ops_get(ops->type)))
  1464. goto out;
  1465. list_add(&ops->list, &link_ops);
  1466. out:
  1467. up_write(&link_ops_rwsem);
  1468. }
  1469. EXPORT_SYMBOL(rdma_link_register);
  1470. void rdma_link_unregister(struct rdma_link_ops *ops)
  1471. {
  1472. down_write(&link_ops_rwsem);
  1473. list_del(&ops->list);
  1474. up_write(&link_ops_rwsem);
  1475. }
  1476. EXPORT_SYMBOL(rdma_link_unregister);
  1477. static int nldev_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
  1478. struct netlink_ext_ack *extack)
  1479. {
  1480. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1481. char ibdev_name[IB_DEVICE_NAME_MAX];
  1482. const struct rdma_link_ops *ops;
  1483. char ndev_name[IFNAMSIZ];
  1484. struct net_device *ndev;
  1485. char type[IFNAMSIZ];
  1486. int err;
  1487. err = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1488. nldev_policy, extack);
  1489. if (err || !tb[RDMA_NLDEV_ATTR_DEV_NAME] ||
  1490. !tb[RDMA_NLDEV_ATTR_LINK_TYPE] || !tb[RDMA_NLDEV_ATTR_NDEV_NAME])
  1491. return -EINVAL;
  1492. nla_strscpy(ibdev_name, tb[RDMA_NLDEV_ATTR_DEV_NAME],
  1493. sizeof(ibdev_name));
  1494. if (strchr(ibdev_name, '%') || strlen(ibdev_name) == 0)
  1495. return -EINVAL;
  1496. nla_strscpy(type, tb[RDMA_NLDEV_ATTR_LINK_TYPE], sizeof(type));
  1497. nla_strscpy(ndev_name, tb[RDMA_NLDEV_ATTR_NDEV_NAME],
  1498. sizeof(ndev_name));
  1499. ndev = dev_get_by_name(sock_net(skb->sk), ndev_name);
  1500. if (!ndev)
  1501. return -ENODEV;
  1502. down_read(&link_ops_rwsem);
  1503. ops = link_ops_get(type);
  1504. #ifdef CONFIG_MODULES
  1505. if (!ops) {
  1506. up_read(&link_ops_rwsem);
  1507. request_module("rdma-link-%s", type);
  1508. down_read(&link_ops_rwsem);
  1509. ops = link_ops_get(type);
  1510. }
  1511. #endif
  1512. err = ops ? ops->newlink(ibdev_name, ndev) : -EINVAL;
  1513. up_read(&link_ops_rwsem);
  1514. dev_put(ndev);
  1515. return err;
  1516. }
  1517. static int nldev_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
  1518. struct netlink_ext_ack *extack)
  1519. {
  1520. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1521. struct ib_device *device;
  1522. u32 index;
  1523. int err;
  1524. err = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1525. nldev_policy, extack);
  1526. if (err || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  1527. return -EINVAL;
  1528. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1529. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1530. if (!device)
  1531. return -EINVAL;
  1532. if (!(device->attrs.kernel_cap_flags & IBK_ALLOW_USER_UNREG)) {
  1533. ib_device_put(device);
  1534. return -EINVAL;
  1535. }
  1536. ib_unregister_device_and_put(device);
  1537. return 0;
  1538. }
  1539. static int nldev_get_chardev(struct sk_buff *skb, struct nlmsghdr *nlh,
  1540. struct netlink_ext_ack *extack)
  1541. {
  1542. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1543. char client_name[RDMA_NLDEV_ATTR_CHARDEV_TYPE_SIZE];
  1544. struct ib_client_nl_info data = {};
  1545. struct ib_device *ibdev = NULL;
  1546. struct sk_buff *msg;
  1547. u32 index;
  1548. int err;
  1549. err = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1, nldev_policy,
  1550. NL_VALIDATE_LIBERAL, extack);
  1551. if (err || !tb[RDMA_NLDEV_ATTR_CHARDEV_TYPE])
  1552. return -EINVAL;
  1553. nla_strscpy(client_name, tb[RDMA_NLDEV_ATTR_CHARDEV_TYPE],
  1554. sizeof(client_name));
  1555. if (tb[RDMA_NLDEV_ATTR_DEV_INDEX]) {
  1556. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1557. ibdev = ib_device_get_by_index(sock_net(skb->sk), index);
  1558. if (!ibdev)
  1559. return -EINVAL;
  1560. if (tb[RDMA_NLDEV_ATTR_PORT_INDEX]) {
  1561. data.port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1562. if (!rdma_is_port_valid(ibdev, data.port)) {
  1563. err = -EINVAL;
  1564. goto out_put;
  1565. }
  1566. } else {
  1567. data.port = -1;
  1568. }
  1569. } else if (tb[RDMA_NLDEV_ATTR_PORT_INDEX]) {
  1570. return -EINVAL;
  1571. }
  1572. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1573. if (!msg) {
  1574. err = -ENOMEM;
  1575. goto out_put;
  1576. }
  1577. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1578. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1579. RDMA_NLDEV_CMD_GET_CHARDEV),
  1580. 0, 0);
  1581. if (!nlh) {
  1582. err = -EMSGSIZE;
  1583. goto out_nlmsg;
  1584. }
  1585. data.nl_msg = msg;
  1586. err = ib_get_client_nl_info(ibdev, client_name, &data);
  1587. if (err)
  1588. goto out_nlmsg;
  1589. err = nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_CHARDEV,
  1590. huge_encode_dev(data.cdev->devt),
  1591. RDMA_NLDEV_ATTR_PAD);
  1592. if (err)
  1593. goto out_data;
  1594. err = nla_put_u64_64bit(msg, RDMA_NLDEV_ATTR_CHARDEV_ABI, data.abi,
  1595. RDMA_NLDEV_ATTR_PAD);
  1596. if (err)
  1597. goto out_data;
  1598. if (nla_put_string(msg, RDMA_NLDEV_ATTR_CHARDEV_NAME,
  1599. dev_name(data.cdev))) {
  1600. err = -EMSGSIZE;
  1601. goto out_data;
  1602. }
  1603. nlmsg_end(msg, nlh);
  1604. put_device(data.cdev);
  1605. if (ibdev)
  1606. ib_device_put(ibdev);
  1607. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1608. out_data:
  1609. put_device(data.cdev);
  1610. out_nlmsg:
  1611. nlmsg_free(msg);
  1612. out_put:
  1613. if (ibdev)
  1614. ib_device_put(ibdev);
  1615. return err;
  1616. }
  1617. static int nldev_sys_get_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1618. struct netlink_ext_ack *extack)
  1619. {
  1620. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1621. struct sk_buff *msg;
  1622. int err;
  1623. err = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1624. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  1625. if (err)
  1626. return err;
  1627. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1628. if (!msg)
  1629. return -ENOMEM;
  1630. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1631. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1632. RDMA_NLDEV_CMD_SYS_GET),
  1633. 0, 0);
  1634. if (!nlh) {
  1635. nlmsg_free(msg);
  1636. return -EMSGSIZE;
  1637. }
  1638. err = nla_put_u8(msg, RDMA_NLDEV_SYS_ATTR_NETNS_MODE,
  1639. (u8)ib_devices_shared_netns);
  1640. if (err) {
  1641. nlmsg_free(msg);
  1642. return err;
  1643. }
  1644. err = nla_put_u8(msg, RDMA_NLDEV_SYS_ATTR_PRIVILEGED_QKEY_MODE,
  1645. (u8)privileged_qkey);
  1646. if (err) {
  1647. nlmsg_free(msg);
  1648. return err;
  1649. }
  1650. err = nla_put_u8(msg, RDMA_NLDEV_SYS_ATTR_MONITOR_MODE, 1);
  1651. if (err) {
  1652. nlmsg_free(msg);
  1653. return err;
  1654. }
  1655. /*
  1656. * Copy-on-fork is supported.
  1657. * See commits:
  1658. * 70e806e4e645 ("mm: Do early cow for pinned pages during fork() for ptes")
  1659. * 4eae4efa2c29 ("hugetlb: do early cow when page pinned on src mm")
  1660. * for more details. Don't backport this without them.
  1661. *
  1662. * Return value ignored on purpose, assume copy-on-fork is not
  1663. * supported in case of failure.
  1664. */
  1665. nla_put_u8(msg, RDMA_NLDEV_SYS_ATTR_COPY_ON_FORK, 1);
  1666. nlmsg_end(msg, nlh);
  1667. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1668. }
  1669. static int nldev_set_sys_set_netns_doit(struct nlattr *tb[])
  1670. {
  1671. u8 enable;
  1672. int err;
  1673. enable = nla_get_u8(tb[RDMA_NLDEV_SYS_ATTR_NETNS_MODE]);
  1674. /* Only 0 and 1 are supported */
  1675. if (enable > 1)
  1676. return -EINVAL;
  1677. err = rdma_compatdev_set(enable);
  1678. return err;
  1679. }
  1680. static int nldev_set_sys_set_pqkey_doit(struct nlattr *tb[])
  1681. {
  1682. u8 enable;
  1683. enable = nla_get_u8(tb[RDMA_NLDEV_SYS_ATTR_PRIVILEGED_QKEY_MODE]);
  1684. /* Only 0 and 1 are supported */
  1685. if (enable > 1)
  1686. return -EINVAL;
  1687. privileged_qkey = enable;
  1688. return 0;
  1689. }
  1690. static int nldev_set_sys_set_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1691. struct netlink_ext_ack *extack)
  1692. {
  1693. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1694. int err;
  1695. err = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1696. nldev_policy, extack);
  1697. if (err)
  1698. return -EINVAL;
  1699. if (tb[RDMA_NLDEV_SYS_ATTR_NETNS_MODE])
  1700. return nldev_set_sys_set_netns_doit(tb);
  1701. if (tb[RDMA_NLDEV_SYS_ATTR_PRIVILEGED_QKEY_MODE])
  1702. return nldev_set_sys_set_pqkey_doit(tb);
  1703. return -EINVAL;
  1704. }
  1705. static int nldev_stat_set_mode_doit(struct sk_buff *msg,
  1706. struct netlink_ext_ack *extack,
  1707. struct nlattr *tb[],
  1708. struct ib_device *device, u32 port)
  1709. {
  1710. u32 mode, mask = 0, qpn, cntn = 0;
  1711. bool opcnt = false;
  1712. int ret;
  1713. /* Currently only counter for QP is supported */
  1714. if (!tb[RDMA_NLDEV_ATTR_STAT_RES] ||
  1715. nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_RES]) != RDMA_NLDEV_ATTR_RES_QP)
  1716. return -EINVAL;
  1717. if (tb[RDMA_NLDEV_ATTR_STAT_OPCOUNTER_ENABLED])
  1718. opcnt = !!nla_get_u8(
  1719. tb[RDMA_NLDEV_ATTR_STAT_OPCOUNTER_ENABLED]);
  1720. mode = nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_MODE]);
  1721. if (mode == RDMA_COUNTER_MODE_AUTO) {
  1722. if (tb[RDMA_NLDEV_ATTR_STAT_AUTO_MODE_MASK])
  1723. mask = nla_get_u32(
  1724. tb[RDMA_NLDEV_ATTR_STAT_AUTO_MODE_MASK]);
  1725. return rdma_counter_set_auto_mode(device, port, mask, opcnt,
  1726. extack);
  1727. }
  1728. if (!tb[RDMA_NLDEV_ATTR_RES_LQPN])
  1729. return -EINVAL;
  1730. qpn = nla_get_u32(tb[RDMA_NLDEV_ATTR_RES_LQPN]);
  1731. if (tb[RDMA_NLDEV_ATTR_STAT_COUNTER_ID]) {
  1732. cntn = nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_COUNTER_ID]);
  1733. ret = rdma_counter_bind_qpn(device, port, qpn, cntn);
  1734. if (ret)
  1735. return ret;
  1736. } else {
  1737. ret = rdma_counter_bind_qpn_alloc(device, port, qpn, &cntn);
  1738. if (ret)
  1739. return ret;
  1740. }
  1741. if (nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_COUNTER_ID, cntn) ||
  1742. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, qpn)) {
  1743. ret = -EMSGSIZE;
  1744. goto err_fill;
  1745. }
  1746. return 0;
  1747. err_fill:
  1748. rdma_counter_unbind_qpn(device, port, qpn, cntn);
  1749. return ret;
  1750. }
  1751. static int nldev_stat_set_counter_dynamic_doit(struct nlattr *tb[],
  1752. struct ib_device *device,
  1753. u32 port)
  1754. {
  1755. struct rdma_hw_stats *stats;
  1756. struct nlattr *entry_attr;
  1757. unsigned long *target;
  1758. int rem, i, ret = 0;
  1759. u32 index;
  1760. stats = ib_get_hw_stats_port(device, port);
  1761. if (!stats)
  1762. return -EINVAL;
  1763. target = kcalloc(BITS_TO_LONGS(stats->num_counters),
  1764. sizeof(*stats->is_disabled), GFP_KERNEL);
  1765. if (!target)
  1766. return -ENOMEM;
  1767. nla_for_each_nested(entry_attr, tb[RDMA_NLDEV_ATTR_STAT_HWCOUNTERS],
  1768. rem) {
  1769. index = nla_get_u32(entry_attr);
  1770. if ((index >= stats->num_counters) ||
  1771. !(stats->descs[index].flags & IB_STAT_FLAG_OPTIONAL)) {
  1772. ret = -EINVAL;
  1773. goto out;
  1774. }
  1775. set_bit(index, target);
  1776. }
  1777. for (i = 0; i < stats->num_counters; i++) {
  1778. if (!(stats->descs[i].flags & IB_STAT_FLAG_OPTIONAL))
  1779. continue;
  1780. ret = rdma_counter_modify(device, port, i, test_bit(i, target));
  1781. if (ret)
  1782. goto out;
  1783. }
  1784. out:
  1785. kfree(target);
  1786. return ret;
  1787. }
  1788. static int nldev_stat_set_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1789. struct netlink_ext_ack *extack)
  1790. {
  1791. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1792. struct ib_device *device;
  1793. struct sk_buff *msg;
  1794. u32 index, port;
  1795. int ret;
  1796. ret = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1, nldev_policy,
  1797. extack);
  1798. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX] ||
  1799. !tb[RDMA_NLDEV_ATTR_PORT_INDEX])
  1800. return -EINVAL;
  1801. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1802. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1803. if (!device)
  1804. return -EINVAL;
  1805. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1806. if (!rdma_is_port_valid(device, port)) {
  1807. ret = -EINVAL;
  1808. goto err_put_device;
  1809. }
  1810. if (!tb[RDMA_NLDEV_ATTR_STAT_MODE] &&
  1811. !tb[RDMA_NLDEV_ATTR_STAT_HWCOUNTERS]) {
  1812. ret = -EINVAL;
  1813. goto err_put_device;
  1814. }
  1815. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1816. if (!msg) {
  1817. ret = -ENOMEM;
  1818. goto err_put_device;
  1819. }
  1820. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1821. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1822. RDMA_NLDEV_CMD_STAT_SET),
  1823. 0, 0);
  1824. if (!nlh || fill_nldev_handle(msg, device) ||
  1825. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port)) {
  1826. ret = -EMSGSIZE;
  1827. goto err_free_msg;
  1828. }
  1829. if (tb[RDMA_NLDEV_ATTR_STAT_MODE]) {
  1830. ret = nldev_stat_set_mode_doit(msg, extack, tb, device, port);
  1831. if (ret)
  1832. goto err_free_msg;
  1833. }
  1834. if (tb[RDMA_NLDEV_ATTR_STAT_HWCOUNTERS]) {
  1835. ret = nldev_stat_set_counter_dynamic_doit(tb, device, port);
  1836. if (ret)
  1837. goto err_free_msg;
  1838. }
  1839. nlmsg_end(msg, nlh);
  1840. ib_device_put(device);
  1841. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1842. err_free_msg:
  1843. nlmsg_free(msg);
  1844. err_put_device:
  1845. ib_device_put(device);
  1846. return ret;
  1847. }
  1848. static int nldev_stat_del_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  1849. struct netlink_ext_ack *extack)
  1850. {
  1851. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  1852. struct ib_device *device;
  1853. struct sk_buff *msg;
  1854. u32 index, port, qpn, cntn;
  1855. int ret;
  1856. ret = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  1857. nldev_policy, extack);
  1858. if (ret || !tb[RDMA_NLDEV_ATTR_STAT_RES] ||
  1859. !tb[RDMA_NLDEV_ATTR_DEV_INDEX] || !tb[RDMA_NLDEV_ATTR_PORT_INDEX] ||
  1860. !tb[RDMA_NLDEV_ATTR_STAT_COUNTER_ID] ||
  1861. !tb[RDMA_NLDEV_ATTR_RES_LQPN])
  1862. return -EINVAL;
  1863. if (nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_RES]) != RDMA_NLDEV_ATTR_RES_QP)
  1864. return -EINVAL;
  1865. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1866. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1867. if (!device)
  1868. return -EINVAL;
  1869. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1870. if (!rdma_is_port_valid(device, port)) {
  1871. ret = -EINVAL;
  1872. goto err;
  1873. }
  1874. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1875. if (!msg) {
  1876. ret = -ENOMEM;
  1877. goto err;
  1878. }
  1879. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1880. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1881. RDMA_NLDEV_CMD_STAT_SET),
  1882. 0, 0);
  1883. if (!nlh) {
  1884. ret = -EMSGSIZE;
  1885. goto err_fill;
  1886. }
  1887. cntn = nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_COUNTER_ID]);
  1888. qpn = nla_get_u32(tb[RDMA_NLDEV_ATTR_RES_LQPN]);
  1889. if (fill_nldev_handle(msg, device) ||
  1890. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port) ||
  1891. nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_COUNTER_ID, cntn) ||
  1892. nla_put_u32(msg, RDMA_NLDEV_ATTR_RES_LQPN, qpn)) {
  1893. ret = -EMSGSIZE;
  1894. goto err_fill;
  1895. }
  1896. ret = rdma_counter_unbind_qpn(device, port, qpn, cntn);
  1897. if (ret)
  1898. goto err_fill;
  1899. nlmsg_end(msg, nlh);
  1900. ib_device_put(device);
  1901. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1902. err_fill:
  1903. nlmsg_free(msg);
  1904. err:
  1905. ib_device_put(device);
  1906. return ret;
  1907. }
  1908. static noinline_for_stack int
  1909. stat_get_doit_default_counter(struct sk_buff *skb, struct nlmsghdr *nlh,
  1910. struct netlink_ext_ack *extack,
  1911. struct nlattr *tb[])
  1912. {
  1913. struct rdma_hw_stats *stats;
  1914. struct nlattr *table_attr;
  1915. struct ib_device *device;
  1916. int ret, num_cnts, i;
  1917. struct sk_buff *msg;
  1918. u32 index, port;
  1919. u64 v;
  1920. if (!tb[RDMA_NLDEV_ATTR_DEV_INDEX] || !tb[RDMA_NLDEV_ATTR_PORT_INDEX])
  1921. return -EINVAL;
  1922. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  1923. device = ib_device_get_by_index(sock_net(skb->sk), index);
  1924. if (!device)
  1925. return -EINVAL;
  1926. if (!device->ops.alloc_hw_port_stats || !device->ops.get_hw_stats) {
  1927. ret = -EINVAL;
  1928. goto err;
  1929. }
  1930. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  1931. stats = ib_get_hw_stats_port(device, port);
  1932. if (!stats) {
  1933. ret = -EINVAL;
  1934. goto err;
  1935. }
  1936. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  1937. if (!msg) {
  1938. ret = -ENOMEM;
  1939. goto err;
  1940. }
  1941. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  1942. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  1943. RDMA_NLDEV_CMD_STAT_GET),
  1944. 0, 0);
  1945. if (!nlh || fill_nldev_handle(msg, device) ||
  1946. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port)) {
  1947. ret = -EMSGSIZE;
  1948. goto err_msg;
  1949. }
  1950. mutex_lock(&stats->lock);
  1951. num_cnts = device->ops.get_hw_stats(device, stats, port, 0);
  1952. if (num_cnts < 0) {
  1953. ret = -EINVAL;
  1954. goto err_stats;
  1955. }
  1956. table_attr = nla_nest_start(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTERS);
  1957. if (!table_attr) {
  1958. ret = -EMSGSIZE;
  1959. goto err_stats;
  1960. }
  1961. for (i = 0; i < num_cnts; i++) {
  1962. if (test_bit(i, stats->is_disabled))
  1963. continue;
  1964. v = stats->value[i] +
  1965. rdma_counter_get_hwstat_value(device, port, i);
  1966. if (rdma_nl_stat_hwcounter_entry(msg,
  1967. stats->descs[i].name, v)) {
  1968. ret = -EMSGSIZE;
  1969. goto err_table;
  1970. }
  1971. }
  1972. nla_nest_end(msg, table_attr);
  1973. mutex_unlock(&stats->lock);
  1974. nlmsg_end(msg, nlh);
  1975. ib_device_put(device);
  1976. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  1977. err_table:
  1978. nla_nest_cancel(msg, table_attr);
  1979. err_stats:
  1980. mutex_unlock(&stats->lock);
  1981. err_msg:
  1982. nlmsg_free(msg);
  1983. err:
  1984. ib_device_put(device);
  1985. return ret;
  1986. }
  1987. static noinline_for_stack int
  1988. stat_get_doit_qp(struct sk_buff *skb, struct nlmsghdr *nlh,
  1989. struct netlink_ext_ack *extack, struct nlattr *tb[])
  1990. {
  1991. static enum rdma_nl_counter_mode mode;
  1992. static enum rdma_nl_counter_mask mask;
  1993. struct ib_device *device;
  1994. struct sk_buff *msg;
  1995. u32 index, port;
  1996. bool opcnt;
  1997. int ret;
  1998. if (tb[RDMA_NLDEV_ATTR_STAT_COUNTER_ID])
  1999. return nldev_res_get_counter_doit(skb, nlh, extack);
  2000. if (!tb[RDMA_NLDEV_ATTR_STAT_MODE] ||
  2001. !tb[RDMA_NLDEV_ATTR_DEV_INDEX] || !tb[RDMA_NLDEV_ATTR_PORT_INDEX])
  2002. return -EINVAL;
  2003. index = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  2004. device = ib_device_get_by_index(sock_net(skb->sk), index);
  2005. if (!device)
  2006. return -EINVAL;
  2007. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  2008. if (!rdma_is_port_valid(device, port)) {
  2009. ret = -EINVAL;
  2010. goto err;
  2011. }
  2012. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  2013. if (!msg) {
  2014. ret = -ENOMEM;
  2015. goto err;
  2016. }
  2017. nlh = nlmsg_put(msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  2018. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV,
  2019. RDMA_NLDEV_CMD_STAT_GET),
  2020. 0, 0);
  2021. if (!nlh) {
  2022. ret = -EMSGSIZE;
  2023. goto err_msg;
  2024. }
  2025. ret = rdma_counter_get_mode(device, port, &mode, &mask, &opcnt);
  2026. if (ret)
  2027. goto err_msg;
  2028. if (fill_nldev_handle(msg, device) ||
  2029. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port) ||
  2030. nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_MODE, mode)) {
  2031. ret = -EMSGSIZE;
  2032. goto err_msg;
  2033. }
  2034. if ((mode == RDMA_COUNTER_MODE_AUTO) &&
  2035. nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_AUTO_MODE_MASK, mask)) {
  2036. ret = -EMSGSIZE;
  2037. goto err_msg;
  2038. }
  2039. if ((mode == RDMA_COUNTER_MODE_AUTO) &&
  2040. nla_put_u8(msg, RDMA_NLDEV_ATTR_STAT_OPCOUNTER_ENABLED, opcnt)) {
  2041. ret = -EMSGSIZE;
  2042. goto err_msg;
  2043. }
  2044. nlmsg_end(msg, nlh);
  2045. ib_device_put(device);
  2046. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  2047. err_msg:
  2048. nlmsg_free(msg);
  2049. err:
  2050. ib_device_put(device);
  2051. return ret;
  2052. }
  2053. static int nldev_stat_get_doit(struct sk_buff *skb, struct nlmsghdr *nlh,
  2054. struct netlink_ext_ack *extack)
  2055. {
  2056. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  2057. int ret;
  2058. ret = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  2059. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  2060. if (ret)
  2061. return -EINVAL;
  2062. if (!tb[RDMA_NLDEV_ATTR_STAT_RES])
  2063. return stat_get_doit_default_counter(skb, nlh, extack, tb);
  2064. switch (nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_RES])) {
  2065. case RDMA_NLDEV_ATTR_RES_QP:
  2066. ret = stat_get_doit_qp(skb, nlh, extack, tb);
  2067. break;
  2068. case RDMA_NLDEV_ATTR_RES_MR:
  2069. ret = res_get_common_doit(skb, nlh, extack, RDMA_RESTRACK_MR,
  2070. fill_stat_mr_entry);
  2071. break;
  2072. default:
  2073. ret = -EINVAL;
  2074. break;
  2075. }
  2076. return ret;
  2077. }
  2078. static int nldev_stat_get_dumpit(struct sk_buff *skb,
  2079. struct netlink_callback *cb)
  2080. {
  2081. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  2082. int ret;
  2083. ret = __nlmsg_parse(cb->nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  2084. nldev_policy, NL_VALIDATE_LIBERAL, NULL);
  2085. if (ret || !tb[RDMA_NLDEV_ATTR_STAT_RES])
  2086. return -EINVAL;
  2087. switch (nla_get_u32(tb[RDMA_NLDEV_ATTR_STAT_RES])) {
  2088. case RDMA_NLDEV_ATTR_RES_QP:
  2089. ret = nldev_res_get_counter_dumpit(skb, cb);
  2090. break;
  2091. case RDMA_NLDEV_ATTR_RES_MR:
  2092. ret = res_get_common_dumpit(skb, cb, RDMA_RESTRACK_MR,
  2093. fill_stat_mr_entry);
  2094. break;
  2095. default:
  2096. ret = -EINVAL;
  2097. break;
  2098. }
  2099. return ret;
  2100. }
  2101. static int nldev_stat_get_counter_status_doit(struct sk_buff *skb,
  2102. struct nlmsghdr *nlh,
  2103. struct netlink_ext_ack *extack)
  2104. {
  2105. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX], *table, *entry;
  2106. struct rdma_hw_stats *stats;
  2107. struct ib_device *device;
  2108. struct sk_buff *msg;
  2109. u32 devid, port;
  2110. int ret, i;
  2111. ret = __nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  2112. nldev_policy, NL_VALIDATE_LIBERAL, extack);
  2113. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX] ||
  2114. !tb[RDMA_NLDEV_ATTR_PORT_INDEX])
  2115. return -EINVAL;
  2116. devid = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  2117. device = ib_device_get_by_index(sock_net(skb->sk), devid);
  2118. if (!device)
  2119. return -EINVAL;
  2120. port = nla_get_u32(tb[RDMA_NLDEV_ATTR_PORT_INDEX]);
  2121. if (!rdma_is_port_valid(device, port)) {
  2122. ret = -EINVAL;
  2123. goto err;
  2124. }
  2125. stats = ib_get_hw_stats_port(device, port);
  2126. if (!stats) {
  2127. ret = -EINVAL;
  2128. goto err;
  2129. }
  2130. msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  2131. if (!msg) {
  2132. ret = -ENOMEM;
  2133. goto err;
  2134. }
  2135. nlh = nlmsg_put(
  2136. msg, NETLINK_CB(skb).portid, nlh->nlmsg_seq,
  2137. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_STAT_GET_STATUS),
  2138. 0, 0);
  2139. ret = -EMSGSIZE;
  2140. if (!nlh || fill_nldev_handle(msg, device) ||
  2141. nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port))
  2142. goto err_msg;
  2143. table = nla_nest_start(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTERS);
  2144. if (!table)
  2145. goto err_msg;
  2146. mutex_lock(&stats->lock);
  2147. for (i = 0; i < stats->num_counters; i++) {
  2148. entry = nla_nest_start(msg,
  2149. RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY);
  2150. if (!entry)
  2151. goto err_msg_table;
  2152. if (nla_put_string(msg,
  2153. RDMA_NLDEV_ATTR_STAT_HWCOUNTER_ENTRY_NAME,
  2154. stats->descs[i].name) ||
  2155. nla_put_u32(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTER_INDEX, i))
  2156. goto err_msg_entry;
  2157. if ((stats->descs[i].flags & IB_STAT_FLAG_OPTIONAL) &&
  2158. (nla_put_u8(msg, RDMA_NLDEV_ATTR_STAT_HWCOUNTER_DYNAMIC,
  2159. !test_bit(i, stats->is_disabled))))
  2160. goto err_msg_entry;
  2161. nla_nest_end(msg, entry);
  2162. }
  2163. mutex_unlock(&stats->lock);
  2164. nla_nest_end(msg, table);
  2165. nlmsg_end(msg, nlh);
  2166. ib_device_put(device);
  2167. return rdma_nl_unicast(sock_net(skb->sk), msg, NETLINK_CB(skb).portid);
  2168. err_msg_entry:
  2169. nla_nest_cancel(msg, entry);
  2170. err_msg_table:
  2171. mutex_unlock(&stats->lock);
  2172. nla_nest_cancel(msg, table);
  2173. err_msg:
  2174. nlmsg_free(msg);
  2175. err:
  2176. ib_device_put(device);
  2177. return ret;
  2178. }
  2179. static int nldev_newdev(struct sk_buff *skb, struct nlmsghdr *nlh,
  2180. struct netlink_ext_ack *extack)
  2181. {
  2182. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  2183. enum rdma_nl_dev_type type;
  2184. struct ib_device *parent;
  2185. char name[IFNAMSIZ] = {};
  2186. u32 parentid;
  2187. int ret;
  2188. ret = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  2189. nldev_policy, extack);
  2190. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX] ||
  2191. !tb[RDMA_NLDEV_ATTR_DEV_NAME] || !tb[RDMA_NLDEV_ATTR_DEV_TYPE])
  2192. return -EINVAL;
  2193. nla_strscpy(name, tb[RDMA_NLDEV_ATTR_DEV_NAME], sizeof(name));
  2194. type = nla_get_u8(tb[RDMA_NLDEV_ATTR_DEV_TYPE]);
  2195. parentid = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  2196. parent = ib_device_get_by_index(sock_net(skb->sk), parentid);
  2197. if (!parent)
  2198. return -EINVAL;
  2199. ret = ib_add_sub_device(parent, type, name);
  2200. ib_device_put(parent);
  2201. return ret;
  2202. }
  2203. static int nldev_deldev(struct sk_buff *skb, struct nlmsghdr *nlh,
  2204. struct netlink_ext_ack *extack)
  2205. {
  2206. struct nlattr *tb[RDMA_NLDEV_ATTR_MAX];
  2207. struct ib_device *device;
  2208. u32 devid;
  2209. int ret;
  2210. ret = nlmsg_parse(nlh, 0, tb, RDMA_NLDEV_ATTR_MAX - 1,
  2211. nldev_policy, extack);
  2212. if (ret || !tb[RDMA_NLDEV_ATTR_DEV_INDEX])
  2213. return -EINVAL;
  2214. devid = nla_get_u32(tb[RDMA_NLDEV_ATTR_DEV_INDEX]);
  2215. device = ib_device_get_by_index(sock_net(skb->sk), devid);
  2216. if (!device)
  2217. return -EINVAL;
  2218. return ib_del_sub_device_and_put(device);
  2219. }
  2220. static const struct rdma_nl_cbs nldev_cb_table[RDMA_NLDEV_NUM_OPS] = {
  2221. [RDMA_NLDEV_CMD_GET] = {
  2222. .doit = nldev_get_doit,
  2223. .dump = nldev_get_dumpit,
  2224. },
  2225. [RDMA_NLDEV_CMD_GET_CHARDEV] = {
  2226. .doit = nldev_get_chardev,
  2227. },
  2228. [RDMA_NLDEV_CMD_SET] = {
  2229. .doit = nldev_set_doit,
  2230. .flags = RDMA_NL_ADMIN_PERM,
  2231. },
  2232. [RDMA_NLDEV_CMD_NEWLINK] = {
  2233. .doit = nldev_newlink,
  2234. .flags = RDMA_NL_ADMIN_PERM,
  2235. },
  2236. [RDMA_NLDEV_CMD_DELLINK] = {
  2237. .doit = nldev_dellink,
  2238. .flags = RDMA_NL_ADMIN_PERM,
  2239. },
  2240. [RDMA_NLDEV_CMD_PORT_GET] = {
  2241. .doit = nldev_port_get_doit,
  2242. .dump = nldev_port_get_dumpit,
  2243. },
  2244. [RDMA_NLDEV_CMD_RES_GET] = {
  2245. .doit = nldev_res_get_doit,
  2246. .dump = nldev_res_get_dumpit,
  2247. },
  2248. [RDMA_NLDEV_CMD_RES_QP_GET] = {
  2249. .doit = nldev_res_get_qp_doit,
  2250. .dump = nldev_res_get_qp_dumpit,
  2251. },
  2252. [RDMA_NLDEV_CMD_RES_CM_ID_GET] = {
  2253. .doit = nldev_res_get_cm_id_doit,
  2254. .dump = nldev_res_get_cm_id_dumpit,
  2255. },
  2256. [RDMA_NLDEV_CMD_RES_CQ_GET] = {
  2257. .doit = nldev_res_get_cq_doit,
  2258. .dump = nldev_res_get_cq_dumpit,
  2259. },
  2260. [RDMA_NLDEV_CMD_RES_MR_GET] = {
  2261. .doit = nldev_res_get_mr_doit,
  2262. .dump = nldev_res_get_mr_dumpit,
  2263. },
  2264. [RDMA_NLDEV_CMD_RES_PD_GET] = {
  2265. .doit = nldev_res_get_pd_doit,
  2266. .dump = nldev_res_get_pd_dumpit,
  2267. },
  2268. [RDMA_NLDEV_CMD_RES_CTX_GET] = {
  2269. .doit = nldev_res_get_ctx_doit,
  2270. .dump = nldev_res_get_ctx_dumpit,
  2271. },
  2272. [RDMA_NLDEV_CMD_RES_SRQ_GET] = {
  2273. .doit = nldev_res_get_srq_doit,
  2274. .dump = nldev_res_get_srq_dumpit,
  2275. },
  2276. [RDMA_NLDEV_CMD_SYS_GET] = {
  2277. .doit = nldev_sys_get_doit,
  2278. },
  2279. [RDMA_NLDEV_CMD_SYS_SET] = {
  2280. .doit = nldev_set_sys_set_doit,
  2281. .flags = RDMA_NL_ADMIN_PERM,
  2282. },
  2283. [RDMA_NLDEV_CMD_STAT_SET] = {
  2284. .doit = nldev_stat_set_doit,
  2285. .flags = RDMA_NL_ADMIN_PERM,
  2286. },
  2287. [RDMA_NLDEV_CMD_STAT_GET] = {
  2288. .doit = nldev_stat_get_doit,
  2289. .dump = nldev_stat_get_dumpit,
  2290. },
  2291. [RDMA_NLDEV_CMD_STAT_DEL] = {
  2292. .doit = nldev_stat_del_doit,
  2293. .flags = RDMA_NL_ADMIN_PERM,
  2294. },
  2295. [RDMA_NLDEV_CMD_RES_QP_GET_RAW] = {
  2296. .doit = nldev_res_get_qp_raw_doit,
  2297. .dump = nldev_res_get_qp_raw_dumpit,
  2298. .flags = RDMA_NL_ADMIN_PERM,
  2299. },
  2300. [RDMA_NLDEV_CMD_RES_CQ_GET_RAW] = {
  2301. .doit = nldev_res_get_cq_raw_doit,
  2302. .dump = nldev_res_get_cq_raw_dumpit,
  2303. .flags = RDMA_NL_ADMIN_PERM,
  2304. },
  2305. [RDMA_NLDEV_CMD_RES_MR_GET_RAW] = {
  2306. .doit = nldev_res_get_mr_raw_doit,
  2307. .dump = nldev_res_get_mr_raw_dumpit,
  2308. .flags = RDMA_NL_ADMIN_PERM,
  2309. },
  2310. [RDMA_NLDEV_CMD_RES_SRQ_GET_RAW] = {
  2311. .doit = nldev_res_get_srq_raw_doit,
  2312. .dump = nldev_res_get_srq_raw_dumpit,
  2313. .flags = RDMA_NL_ADMIN_PERM,
  2314. },
  2315. [RDMA_NLDEV_CMD_STAT_GET_STATUS] = {
  2316. .doit = nldev_stat_get_counter_status_doit,
  2317. },
  2318. [RDMA_NLDEV_CMD_NEWDEV] = {
  2319. .doit = nldev_newdev,
  2320. .flags = RDMA_NL_ADMIN_PERM,
  2321. },
  2322. [RDMA_NLDEV_CMD_DELDEV] = {
  2323. .doit = nldev_deldev,
  2324. .flags = RDMA_NL_ADMIN_PERM,
  2325. },
  2326. };
  2327. static int fill_mon_netdev_rename(struct sk_buff *msg,
  2328. struct ib_device *device, u32 port,
  2329. const struct net *net)
  2330. {
  2331. struct net_device *netdev = ib_device_get_netdev(device, port);
  2332. int ret = 0;
  2333. if (!netdev || !net_eq(dev_net(netdev), net))
  2334. goto out;
  2335. ret = nla_put_u32(msg, RDMA_NLDEV_ATTR_NDEV_INDEX, netdev->ifindex);
  2336. if (ret)
  2337. goto out;
  2338. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_NDEV_NAME, netdev->name);
  2339. out:
  2340. dev_put(netdev);
  2341. return ret;
  2342. }
  2343. static int fill_mon_netdev_association(struct sk_buff *msg,
  2344. struct ib_device *device, u32 port,
  2345. const struct net *net)
  2346. {
  2347. struct net_device *netdev = ib_device_get_netdev(device, port);
  2348. int ret = 0;
  2349. if (netdev && !net_eq(dev_net(netdev), net))
  2350. goto out;
  2351. ret = nla_put_u32(msg, RDMA_NLDEV_ATTR_DEV_INDEX, device->index);
  2352. if (ret)
  2353. goto out;
  2354. ret = nla_put_string(msg, RDMA_NLDEV_ATTR_DEV_NAME,
  2355. dev_name(&device->dev));
  2356. if (ret)
  2357. goto out;
  2358. ret = nla_put_u32(msg, RDMA_NLDEV_ATTR_PORT_INDEX, port);
  2359. if (ret)
  2360. goto out;
  2361. if (netdev) {
  2362. ret = nla_put_u32(msg,
  2363. RDMA_NLDEV_ATTR_NDEV_INDEX, netdev->ifindex);
  2364. if (ret)
  2365. goto out;
  2366. ret = nla_put_string(msg,
  2367. RDMA_NLDEV_ATTR_NDEV_NAME, netdev->name);
  2368. }
  2369. out:
  2370. dev_put(netdev);
  2371. return ret;
  2372. }
  2373. static void rdma_nl_notify_err_msg(struct ib_device *device, u32 port_num,
  2374. enum rdma_nl_notify_event_type type)
  2375. {
  2376. struct net_device *netdev;
  2377. switch (type) {
  2378. case RDMA_REGISTER_EVENT:
  2379. dev_warn_ratelimited(&device->dev,
  2380. "Failed to send RDMA monitor register device event\n");
  2381. break;
  2382. case RDMA_UNREGISTER_EVENT:
  2383. dev_warn_ratelimited(&device->dev,
  2384. "Failed to send RDMA monitor unregister device event\n");
  2385. break;
  2386. case RDMA_NETDEV_ATTACH_EVENT:
  2387. netdev = ib_device_get_netdev(device, port_num);
  2388. dev_warn_ratelimited(&device->dev,
  2389. "Failed to send RDMA monitor netdev attach event: port %d netdev %d\n",
  2390. port_num, netdev->ifindex);
  2391. dev_put(netdev);
  2392. break;
  2393. case RDMA_NETDEV_DETACH_EVENT:
  2394. dev_warn_ratelimited(&device->dev,
  2395. "Failed to send RDMA monitor netdev detach event: port %d\n",
  2396. port_num);
  2397. break;
  2398. case RDMA_RENAME_EVENT:
  2399. dev_warn_ratelimited(&device->dev,
  2400. "Failed to send RDMA monitor rename device event\n");
  2401. break;
  2402. case RDMA_NETDEV_RENAME_EVENT:
  2403. netdev = ib_device_get_netdev(device, port_num);
  2404. dev_warn_ratelimited(&device->dev,
  2405. "Failed to send RDMA monitor netdev rename event: port %d netdev %d\n",
  2406. port_num, netdev->ifindex);
  2407. dev_put(netdev);
  2408. break;
  2409. default:
  2410. break;
  2411. }
  2412. }
  2413. int rdma_nl_notify_event(struct ib_device *device, u32 port_num,
  2414. enum rdma_nl_notify_event_type type)
  2415. {
  2416. struct sk_buff *skb;
  2417. int ret = -EMSGSIZE;
  2418. struct net *net;
  2419. void *nlh;
  2420. net = read_pnet(&device->coredev.rdma_net);
  2421. if (!net)
  2422. return -EINVAL;
  2423. skb = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
  2424. if (!skb)
  2425. return -ENOMEM;
  2426. nlh = nlmsg_put(skb, 0, 0,
  2427. RDMA_NL_GET_TYPE(RDMA_NL_NLDEV, RDMA_NLDEV_CMD_MONITOR),
  2428. 0, 0);
  2429. if (!nlh)
  2430. goto err_free;
  2431. switch (type) {
  2432. case RDMA_REGISTER_EVENT:
  2433. case RDMA_UNREGISTER_EVENT:
  2434. case RDMA_RENAME_EVENT:
  2435. ret = fill_nldev_handle(skb, device);
  2436. if (ret)
  2437. goto err_free;
  2438. break;
  2439. case RDMA_NETDEV_ATTACH_EVENT:
  2440. case RDMA_NETDEV_DETACH_EVENT:
  2441. ret = fill_mon_netdev_association(skb, device, port_num, net);
  2442. if (ret)
  2443. goto err_free;
  2444. break;
  2445. case RDMA_NETDEV_RENAME_EVENT:
  2446. ret = fill_mon_netdev_rename(skb, device, port_num, net);
  2447. if (ret)
  2448. goto err_free;
  2449. break;
  2450. default:
  2451. break;
  2452. }
  2453. ret = nla_put_u8(skb, RDMA_NLDEV_ATTR_EVENT_TYPE, type);
  2454. if (ret)
  2455. goto err_free;
  2456. nlmsg_end(skb, nlh);
  2457. ret = rdma_nl_multicast(net, skb, RDMA_NL_GROUP_NOTIFY, GFP_KERNEL);
  2458. if (ret && ret != -ESRCH) {
  2459. skb = NULL; /* skb is freed in the netlink send-op handling */
  2460. goto err_free;
  2461. }
  2462. return 0;
  2463. err_free:
  2464. rdma_nl_notify_err_msg(device, port_num, type);
  2465. nlmsg_free(skb);
  2466. return ret;
  2467. }
  2468. void __init nldev_init(void)
  2469. {
  2470. rdma_nl_register(RDMA_NL_NLDEV, nldev_cb_table);
  2471. }
  2472. void nldev_exit(void)
  2473. {
  2474. rdma_nl_unregister(RDMA_NL_NLDEV);
  2475. }
  2476. MODULE_ALIAS_RDMA_NETLINK(RDMA_NL_NLDEV, 5);