ib_verbs.h 110 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889
  1. /*
  2. * Copyright (c) 2004 Mellanox Technologies Ltd. All rights reserved.
  3. * Copyright (c) 2004 Infinicon Corporation. All rights reserved.
  4. * Copyright (c) 2004 Intel Corporation. All rights reserved.
  5. * Copyright (c) 2004 Topspin Corporation. All rights reserved.
  6. * Copyright (c) 2004 Voltaire Corporation. All rights reserved.
  7. * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
  8. * Copyright (c) 2005, 2006, 2007 Cisco Systems. All rights reserved.
  9. *
  10. * This software is available to you under a choice of one of two
  11. * licenses. You may choose to be licensed under the terms of the GNU
  12. * General Public License (GPL) Version 2, available from the file
  13. * COPYING in the main directory of this source tree, or the
  14. * OpenIB.org BSD license below:
  15. *
  16. * Redistribution and use in source and binary forms, with or
  17. * without modification, are permitted provided that the following
  18. * conditions are met:
  19. *
  20. * - Redistributions of source code must retain the above
  21. * copyright notice, this list of conditions and the following
  22. * disclaimer.
  23. *
  24. * - Redistributions in binary form must reproduce the above
  25. * copyright notice, this list of conditions and the following
  26. * disclaimer in the documentation and/or other materials
  27. * provided with the distribution.
  28. *
  29. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  30. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  31. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  32. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  33. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  34. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  35. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  36. * SOFTWARE.
  37. */
  38. #if !defined(IB_VERBS_H)
  39. #define IB_VERBS_H
  40. #include <linux/types.h>
  41. #include <linux/device.h>
  42. #include <linux/mm.h>
  43. #include <linux/dma-mapping.h>
  44. #include <linux/kref.h>
  45. #include <linux/list.h>
  46. #include <linux/rwsem.h>
  47. #include <linux/scatterlist.h>
  48. #include <linux/workqueue.h>
  49. #include <linux/socket.h>
  50. #include <linux/irq_poll.h>
  51. #include <uapi/linux/if_ether.h>
  52. #include <net/ipv6.h>
  53. #include <net/ip.h>
  54. #include <linux/string.h>
  55. #include <linux/slab.h>
  56. #include <linux/netdevice.h>
  57. #include <linux/if_link.h>
  58. #include <linux/atomic.h>
  59. #include <linux/mmu_notifier.h>
  60. #include <linux/uaccess.h>
  61. #include <linux/cgroup_rdma.h>
  62. #include <uapi/rdma/ib_user_verbs.h>
  63. #include <rdma/restrack.h>
  /* Length limit for a firmware version name; aliased to ETHTOOL_FWVERS_LEN. */
  64. #define IB_FW_VERSION_NAME_MAX ETHTOOL_FWVERS_LEN
  /*
   * Workqueues that are only declared here; the definitions live elsewhere.
   * NOTE(review): ib_comp_wq is presumably for completion work - confirm.
   */
  65. extern struct workqueue_struct *ib_wq;
  66. extern struct workqueue_struct *ib_comp_wq;
  /*
   * 16-byte GID. The same storage can be read as raw bytes or as two
   * big-endian 64-bit halves: the subnet prefix first, then the interface id.
   */
  67. union ib_gid {
  68. u8 raw[16];
  69. struct {
  70. __be64 subnet_prefix;
  71. __be64 interface_id;
  72. } global;
  73. };
  /*
   * Declared here, defined elsewhere.
   * NOTE(review): presumably the all-zero GID - confirm at the definition.
   */
  74. extern union ib_gid zgid;
  /*
   * GID types. IB_GID_TYPE_IB and IB_GID_TYPE_ROCE share the value 0.
   * IB_GID_TYPE_SIZE follows the last real type, so it equals the number of
   * distinct type values (2).
   */
  75. enum ib_gid_type {
  76. /* If link layer is Ethernet, this is RoCE V1 */
  77. IB_GID_TYPE_IB = 0,
  78. IB_GID_TYPE_ROCE = 0,
  79. IB_GID_TYPE_ROCE_UDP_ENCAP = 1,
  80. IB_GID_TYPE_SIZE
  81. };
  /* UDP destination port number for RoCE v2, going by the macro name. */
  82. #define ROCE_V2_UDP_DPORT 4791
  /* Attributes kept alongside a GID: its type and a net_device pointer. */
  83. struct ib_gid_attr {
  84. enum ib_gid_type gid_type;
  85. struct net_device *ndev;
  86. };
  /*
   * Node types. Numbering starts at 1 and each later entry takes the next
   * consecutive value (RDMA_NODE_USNIC_UDP is 6).
   */
  87. enum rdma_node_type {
  88. /* IB values map to NodeInfo:NodeType. */
  89. RDMA_NODE_IB_CA = 1,
  90. RDMA_NODE_IB_SWITCH,
  91. RDMA_NODE_IB_ROUTER,
  92. RDMA_NODE_RNIC,
  93. RDMA_NODE_USNIC,
  94. RDMA_NODE_USNIC_UDP,
  95. };
  /* Well-known SA GUID constant: bit 57 set, OR-ed with the value 2. */
  96. enum {
  97. /* set the local administered indication */
  98. IB_SA_WELL_KNOWN_GUID = BIT_ULL(57) | 2,
  99. };
  /* Transport types, numbered consecutively from 0. */
  100. enum rdma_transport_type {
  101. RDMA_TRANSPORT_IB,
  102. RDMA_TRANSPORT_IWARP,
  103. RDMA_TRANSPORT_USNIC,
  104. RDMA_TRANSPORT_USNIC_UDP
  105. };
  /* Protocol types, numbered consecutively from 0. */
  106. enum rdma_protocol_type {
  107. RDMA_PROTOCOL_IB,
  108. RDMA_PROTOCOL_IBOE,
  109. RDMA_PROTOCOL_IWARP,
  110. RDMA_PROTOCOL_USNIC_UDP
  111. };
  /*
   * Takes a node type and returns a transport type. Prototype only; the
   * definition is not part of this header. Declared __attribute_const__.
   */
  112. __attribute_const__ enum rdma_transport_type
  113. rdma_node_get_transport(enum rdma_node_type node_type);
  /*
   * Network types. RDMA_NETWORK_ROCE_V1 is an alias of RDMA_NETWORK_IB
   * (both 0); RDMA_NETWORK_IPV4 and RDMA_NETWORK_IPV6 follow as 1 and 2.
   */
  114. enum rdma_network_type {
  115. RDMA_NETWORK_IB,
  116. RDMA_NETWORK_ROCE_V1 = RDMA_NETWORK_IB,
  117. RDMA_NETWORK_IPV4,
  118. RDMA_NETWORK_IPV6
  119. };
  120. static inline enum ib_gid_type ib_network_to_gid_type(enum rdma_network_type network_type)
  121. {
  122. if (network_type == RDMA_NETWORK_IPV4 ||
  123. network_type == RDMA_NETWORK_IPV6)
  124. return IB_GID_TYPE_ROCE_UDP_ENCAP;
  125. /* IB_GID_TYPE_IB same as RDMA_NETWORK_ROCE_V1 */
  126. return IB_GID_TYPE_IB;
  127. }
  128. static inline enum rdma_network_type ib_gid_to_network_type(enum ib_gid_type gid_type,
  129. union ib_gid *gid)
  130. {
  131. if (gid_type == IB_GID_TYPE_IB)
  132. return RDMA_NETWORK_IB;
  133. if (ipv6_addr_v4mapped((struct in6_addr *)gid))
  134. return RDMA_NETWORK_IPV4;
  135. else
  136. return RDMA_NETWORK_IPV6;
  137. }
  /* Link layer kinds, numbered consecutively from 0 (UNSPECIFIED is 0). */
  138. enum rdma_link_layer {
  139. IB_LINK_LAYER_UNSPECIFIED,
  140. IB_LINK_LAYER_INFINIBAND,
  141. IB_LINK_LAYER_ETHERNET,
  142. };
  /*
   * Device capability bits, one bit per flag. Bits 9 and 16 are retired (see
   * the notes in place) and bit 28 is not assigned. Flags from bit 31 upward
   * are written with 1ULL because they do not fit in a plain int shift; the
   * device_cap_flags field of struct ib_device_attr is a u64 accordingly.
   */
  143. enum ib_device_cap_flags {
  144. IB_DEVICE_RESIZE_MAX_WR = (1 << 0),
  145. IB_DEVICE_BAD_PKEY_CNTR = (1 << 1),
  146. IB_DEVICE_BAD_QKEY_CNTR = (1 << 2),
  147. IB_DEVICE_RAW_MULTI = (1 << 3),
  148. IB_DEVICE_AUTO_PATH_MIG = (1 << 4),
  149. IB_DEVICE_CHANGE_PHY_PORT = (1 << 5),
  150. IB_DEVICE_UD_AV_PORT_ENFORCE = (1 << 6),
  151. IB_DEVICE_CURR_QP_STATE_MOD = (1 << 7),
  152. IB_DEVICE_SHUTDOWN_PORT = (1 << 8),
  153. /* Not in use, former INIT_TYPE = (1 << 9),*/
  154. IB_DEVICE_PORT_ACTIVE_EVENT = (1 << 10),
  155. IB_DEVICE_SYS_IMAGE_GUID = (1 << 11),
  156. IB_DEVICE_RC_RNR_NAK_GEN = (1 << 12),
  157. IB_DEVICE_SRQ_RESIZE = (1 << 13),
  158. IB_DEVICE_N_NOTIFY_CQ = (1 << 14),
  159. /*
  160. * This device supports a per-device lkey or stag that can be
  161. * used without performing a memory registration for the local
  162. * memory. Note that ULPs should never check this flag, but
  163. * instead use the local_dma_lkey flag in the ib_pd structure,
  164. * which will always contain a usable lkey.
  165. */
  166. IB_DEVICE_LOCAL_DMA_LKEY = (1 << 15),
  167. /* Reserved, old SEND_W_INV = (1 << 16),*/
  168. IB_DEVICE_MEM_WINDOW = (1 << 17),
  169. /*
  170. * Devices should set IB_DEVICE_UD_IP_CSUM if they support
  171. * insertion of UDP and TCP checksum on outgoing UD IPoIB
  172. * messages and can verify the validity of checksum for
  173. * incoming messages. Setting this flag implies that the
  174. * IPoIB driver may set NETIF_F_IP_CSUM for datagram mode.
  175. */
  176. IB_DEVICE_UD_IP_CSUM = (1 << 18),
  177. IB_DEVICE_UD_TSO = (1 << 19),
  178. IB_DEVICE_XRC = (1 << 20),
  179. /*
  180. * This device supports the IB "base memory management extension",
  181. * which includes support for fast registrations (IB_WR_REG_MR,
  182. * IB_WR_LOCAL_INV and IB_WR_SEND_WITH_INV verbs). This flag should
  183. * also be set by any iWarp device which must support FRs to comply
  184. * to the iWarp verbs spec. iWarp devices also support the
  185. * IB_WR_RDMA_READ_WITH_INV verb for RDMA READs that invalidate the
  186. * stag.
  187. */
  188. IB_DEVICE_MEM_MGT_EXTENSIONS = (1 << 21),
  189. IB_DEVICE_BLOCK_MULTICAST_LOOPBACK = (1 << 22),
  190. IB_DEVICE_MEM_WINDOW_TYPE_2A = (1 << 23),
  191. IB_DEVICE_MEM_WINDOW_TYPE_2B = (1 << 24),
  192. IB_DEVICE_RC_IP_CSUM = (1 << 25),
  193. /* Deprecated. Please use IB_RAW_PACKET_CAP_IP_CSUM. */
  194. IB_DEVICE_RAW_IP_CSUM = (1 << 26),
  195. /*
  196. * Devices should set IB_DEVICE_CROSS_CHANNEL if they
  197. * support execution of WQEs that involve synchronization
  198. * of I/O operations with single completion queue managed
  199. * by hardware.
  200. */
  201. IB_DEVICE_CROSS_CHANNEL = (1 << 27),
  202. IB_DEVICE_MANAGED_FLOW_STEERING = (1 << 29),
  203. IB_DEVICE_SIGNATURE_HANDOVER = (1 << 30),
  204. IB_DEVICE_ON_DEMAND_PAGING = (1ULL << 31),
  205. IB_DEVICE_SG_GAPS_REG = (1ULL << 32),
  206. IB_DEVICE_VIRTUAL_FUNCTION = (1ULL << 33),
  207. /* Deprecated. Please use IB_RAW_PACKET_CAP_SCATTER_FCS. */
  208. IB_DEVICE_RAW_SCATTER_FCS = (1ULL << 34),
  209. IB_DEVICE_RDMA_NETDEV_OPA_VNIC = (1ULL << 35),
  210. /* The device supports padding incoming writes to cacheline. */
  211. IB_DEVICE_PCI_WRITE_END_PADDING = (1ULL << 36),
  212. };
  /* Signature protection capability bits: T10-DIF types 1-3 on bits 0-2. */
  213. enum ib_signature_prot_cap {
  214. IB_PROT_T10DIF_TYPE_1 = 1,
  215. IB_PROT_T10DIF_TYPE_2 = 1 << 1,
  216. IB_PROT_T10DIF_TYPE_3 = 1 << 2,
  217. };
  /* Signature guard capability bits: CRC on bit 0, checksum on bit 1. */
  218. enum ib_signature_guard_cap {
  219. IB_GUARD_T10DIF_CRC = 1,
  220. IB_GUARD_T10DIF_CSUM = 1 << 1,
  221. };
  /* Atomic capability levels, numbered from 0 (IB_ATOMIC_NONE is 0). */
  222. enum ib_atomic_cap {
  223. IB_ATOMIC_NONE,
  224. IB_ATOMIC_HCA,
  225. IB_ATOMIC_GLOB
  226. };
  /*
   * General ODP capability bits.
   * NOTE(review): presumably stored in ib_odp_caps.general_caps - confirm.
   */
  227. enum ib_odp_general_cap_bits {
  228. IB_ODP_SUPPORT = 1 << 0,
  229. IB_ODP_SUPPORT_IMPLICIT = 1 << 1,
  230. };
  /*
   * Per-operation ODP capability bits (send, receive, write, read, atomic).
   * NOTE(review): presumably used in the per-transport fields of
   * struct ib_odp_caps - confirm.
   */
  231. enum ib_odp_transport_cap_bits {
  232. IB_ODP_SUPPORT_SEND = 1 << 0,
  233. IB_ODP_SUPPORT_RECV = 1 << 1,
  234. IB_ODP_SUPPORT_WRITE = 1 << 2,
  235. IB_ODP_SUPPORT_READ = 1 << 3,
  236. IB_ODP_SUPPORT_ATOMIC = 1 << 4,
  237. };
  /*
   * ODP capabilities: one 64-bit general mask plus a 32-bit mask for each of
   * the rc, uc and ud transports.
   */
  238. struct ib_odp_caps {
  239. uint64_t general_caps;
  240. struct {
  241. uint32_t rc_odp_caps;
  242. uint32_t uc_odp_caps;
  243. uint32_t ud_odp_caps;
  244. } per_transport_caps;
  245. };
  /*
   * RSS capabilities: the supported QP types and the limits on receive-WQ
   * indirection tables (how many, and how large each may be).
   */
  246. struct ib_rss_caps {
  247. /* Corresponding bit will be set if qp type from
  248. * 'enum ib_qp_type' is supported, e.g.
  249. * supported_qpts |= 1 << IB_QPT_UD
  250. */
  251. u32 supported_qpts;
  252. u32 max_rwq_indirection_tables;
  253. u32 max_rwq_indirection_table_size;
  254. };
  /* Tag-matching capability bits; these go in the flags field of struct ib_tm_caps. */
  255. enum ib_tm_cap_flags {
  256. /* Support tag matching on RC transport */
  257. IB_TM_CAP_RC = 1 << 0,
  258. };
  /* Tag-matching limits and capability flags; each field is described in place. */
  259. struct ib_tm_caps {
  260. /* Max size of RNDV header */
  261. u32 max_rndv_hdr_size;
  262. /* Max number of entries in tag matching list */
  263. u32 max_num_tags;
  264. /* From enum ib_tm_cap_flags */
  265. u32 flags;
  266. /* Max number of outstanding list operations */
  267. u32 max_ops;
  268. /* Max number of SGE in tag matching entry */
  269. u32 max_sge;
  270. };
  /*
   * Parameters for setting up a CQ: entry count, completion vector and flags.
   * NOTE(review): the accepted flag values are not visible here - confirm.
   */
  271. struct ib_cq_init_attr {
  272. unsigned int cqe;
  273. int comp_vector;
  274. u32 flags;
  275. };
  /* CQ attribute mask bits; only the moderation bit (bit 0) is defined. */
  276. enum ib_cq_attr_mask {
  277. IB_CQ_MODERATE = 1 << 0,
  278. };
  /* CQ moderation limits: maximum count and maximum period, 16 bits each. */
  279. struct ib_cq_caps {
  280. u16 max_cq_moderation_count;
  281. u16 max_cq_moderation_period;
  282. };
  /*
   * Device-wide attributes and resource limits. Most max_* fields are plain
   * ints. device_cap_flags is 64 bits wide, which enum ib_device_cap_flags
   * needs because it defines bits up to bit 36. The trailing members embed
   * the ODP, RSS, tag-matching and CQ capability structures.
   */
  283. struct ib_device_attr {
  284. u64 fw_ver;
  285. __be64 sys_image_guid;
  286. u64 max_mr_size;
  287. u64 page_size_cap;
  288. u32 vendor_id;
  289. u32 vendor_part_id;
  290. u32 hw_ver;
  291. int max_qp;
  292. int max_qp_wr;
  293. u64 device_cap_flags;
  294. int max_sge;
  295. int max_sge_rd;
  296. int max_cq;
  297. int max_cqe;
  298. int max_mr;
  299. int max_pd;
  300. int max_qp_rd_atom;
  301. int max_ee_rd_atom;
  302. int max_res_rd_atom;
  303. int max_qp_init_rd_atom;
  304. int max_ee_init_rd_atom;
  305. enum ib_atomic_cap atomic_cap;
  306. enum ib_atomic_cap masked_atomic_cap;
  307. int max_ee;
  308. int max_rdd;
  309. int max_mw;
  310. int max_raw_ipv6_qp;
  311. int max_raw_ethy_qp;
  312. int max_mcast_grp;
  313. int max_mcast_qp_attach;
  314. int max_total_mcast_qp_attach;
  315. int max_ah;
  316. int max_fmr;
  317. int max_map_per_fmr;
  318. int max_srq;
  319. int max_srq_wr;
  320. int max_srq_sge;
  321. unsigned int max_fast_reg_page_list_len;
  322. u16 max_pkeys;
  323. u8 local_ca_ack_delay;
  324. int sig_prot_cap;
  325. int sig_guard_cap;
  326. struct ib_odp_caps odp_caps;
  327. uint64_t timestamp_mask;
  328. uint64_t hca_core_clock; /* in KHZ */
  329. struct ib_rss_caps rss_caps;
  330. u32 max_wq_type_rq;
  331. u32 raw_packet_caps; /* Use ib_raw_packet_caps enum */
  332. struct ib_tm_caps tm_caps;
  333. struct ib_cq_caps cq_caps;
  334. };
  /*
   * MTU codes 1..5 for 256, 512, 1024, 2048 and 4096 bytes. Each step doubles
   * the size, so the byte value is 128 << code.
   */
  335. enum ib_mtu {
  336. IB_MTU_256 = 1,
  337. IB_MTU_512 = 2,
  338. IB_MTU_1024 = 3,
  339. IB_MTU_2048 = 4,
  340. IB_MTU_4096 = 5
  341. };
  342. static inline int ib_mtu_enum_to_int(enum ib_mtu mtu)
  343. {
  344. switch (mtu) {
  345. case IB_MTU_256: return 256;
  346. case IB_MTU_512: return 512;
  347. case IB_MTU_1024: return 1024;
  348. case IB_MTU_2048: return 2048;
  349. case IB_MTU_4096: return 4096;
  350. default: return -1;
  351. }
  352. }
  353. static inline enum ib_mtu ib_mtu_int_to_enum(int mtu)
  354. {
  355. if (mtu >= 4096)
  356. return IB_MTU_4096;
  357. else if (mtu >= 2048)
  358. return IB_MTU_2048;
  359. else if (mtu >= 1024)
  360. return IB_MTU_1024;
  361. else if (mtu >= 512)
  362. return IB_MTU_512;
  363. else
  364. return IB_MTU_256;
  365. }
  /* Port states, explicitly numbered 0 (IB_PORT_NOP) through 5. */
  366. enum ib_port_state {
  367. IB_PORT_NOP = 0,
  368. IB_PORT_DOWN = 1,
  369. IB_PORT_INIT = 2,
  370. IB_PORT_ARMED = 3,
  371. IB_PORT_ACTIVE = 4,
  372. IB_PORT_ACTIVE_DEFER = 5
  373. };
  /*
   * Port capability bits, one bit per flag. Bits 0, 13 and 15 have no flag
   * defined here; the highest bit in use is 26.
   */
  374. enum ib_port_cap_flags {
  375. IB_PORT_SM = 1 << 1,
  376. IB_PORT_NOTICE_SUP = 1 << 2,
  377. IB_PORT_TRAP_SUP = 1 << 3,
  378. IB_PORT_OPT_IPD_SUP = 1 << 4,
  379. IB_PORT_AUTO_MIGR_SUP = 1 << 5,
  380. IB_PORT_SL_MAP_SUP = 1 << 6,
  381. IB_PORT_MKEY_NVRAM = 1 << 7,
  382. IB_PORT_PKEY_NVRAM = 1 << 8,
  383. IB_PORT_LED_INFO_SUP = 1 << 9,
  384. IB_PORT_SM_DISABLED = 1 << 10,
  385. IB_PORT_SYS_IMAGE_GUID_SUP = 1 << 11,
  386. IB_PORT_PKEY_SW_EXT_PORT_TRAP_SUP = 1 << 12,
  387. IB_PORT_EXTENDED_SPEEDS_SUP = 1 << 14,
  388. IB_PORT_CM_SUP = 1 << 16,
  389. IB_PORT_SNMP_TUNNEL_SUP = 1 << 17,
  390. IB_PORT_REINIT_SUP = 1 << 18,
  391. IB_PORT_DEVICE_MGMT_SUP = 1 << 19,
  392. IB_PORT_VENDOR_CLASS_SUP = 1 << 20,
  393. IB_PORT_DR_NOTICE_SUP = 1 << 21,
  394. IB_PORT_CAP_MASK_NOTICE_SUP = 1 << 22,
  395. IB_PORT_BOOT_MGMT_SUP = 1 << 23,
  396. IB_PORT_LINK_LATENCY_SUP = 1 << 24,
  397. IB_PORT_CLIENT_REG_SUP = 1 << 25,
  398. IB_PORT_IP_BASED_GIDS = 1 << 26,
  399. };
  /*
   * Port width codes. The codes are single bits (1, 2, 4, 8) and are not the
   * lane counts themselves; ib_width_enum_to_int() does that conversion.
   */
  400. enum ib_port_width {
  401. IB_WIDTH_1X = 1,
  402. IB_WIDTH_4X = 2,
  403. IB_WIDTH_8X = 4,
  404. IB_WIDTH_12X = 8
  405. };
  406. static inline int ib_width_enum_to_int(enum ib_port_width width)
  407. {
  408. switch (width) {
  409. case IB_WIDTH_1X: return 1;
  410. case IB_WIDTH_4X: return 4;
  411. case IB_WIDTH_8X: return 8;
  412. case IB_WIDTH_12X: return 12;
  413. default: return -1;
  414. }
  415. }
  /* Port speed codes; each code is a distinct single bit, from 1 up to 64. */
  416. enum ib_port_speed {
  417. IB_SPEED_SDR = 1,
  418. IB_SPEED_DDR = 2,
  419. IB_SPEED_QDR = 4,
  420. IB_SPEED_FDR10 = 8,
  421. IB_SPEED_FDR = 16,
  422. IB_SPEED_EDR = 32,
  423. IB_SPEED_HDR = 64
  424. };
  425. /**
  426. * struct rdma_hw_stats
  427. * @timestamp - Used by the core code to track when the last update was
  428. * @lifespan - Used by the core code to determine how old the counters
  429. * should be before being updated again. Stored in jiffies, defaults
  430. * to 10 milliseconds, drivers can override the default by specifying
  431. * their own value during their allocation routine.
  432. * @names - Array of pointers to static names used for the counters in
  433. * directory.
  434. * @num_counters - How many hardware counters there are. If names is
  435. * shorter than this number, a kernel oops will result. Driver authors
  436. * are encouraged to leave BUILD_BUG_ON(ARRAY_SIZE(@names) < num_counters)
  437. * in their code to prevent this.
  438. * @value - Array of u64 counters that are accessed by the sysfs code and
  439. * filled in by the drivers get_stats routine
  440. */
  441. struct rdma_hw_stats {
  442. unsigned long timestamp;
  443. unsigned long lifespan;
  444. const char * const *names;
  445. int num_counters;
  /* Flexible array member: storage for it is allocated together with the struct. */
  446. u64 value[];
  447. };
  /* Default counter lifespan; the struct rdma_hw_stats comment gives it as 10 milliseconds. */
  448. #define RDMA_HW_STATS_DEFAULT_LIFESPAN 10
  449. /**
  450. * rdma_alloc_hw_stats_struct - Helper function to allocate dynamic struct
  451. * for drivers.
  452. * @names - Array of static const char *
  453. * @num_counters - How many elements in array
  454. * @lifespan - How many milliseconds between updates
  455. */
  456. static inline struct rdma_hw_stats *rdma_alloc_hw_stats_struct(
  457. const char * const *names, int num_counters,
  458. unsigned long lifespan)
  459. {
  460. struct rdma_hw_stats *stats;
  461. stats = kzalloc(sizeof(*stats) + num_counters * sizeof(u64),
  462. GFP_KERNEL);
  463. if (!stats)
  464. return NULL;
  465. stats->names = names;
  466. stats->num_counters = num_counters;
  467. stats->lifespan = msecs_to_jiffies(lifespan);
  468. return stats;
  469. }
  470. /* Define bits for the various functionality this port needs to be supported by
  471. * the core.
  472. */
  473. /* Management 0x00000FFF */
  474. #define RDMA_CORE_CAP_IB_MAD 0x00000001
  475. #define RDMA_CORE_CAP_IB_SMI 0x00000002
  476. #define RDMA_CORE_CAP_IB_CM 0x00000004
  477. #define RDMA_CORE_CAP_IW_CM 0x00000008
  478. #define RDMA_CORE_CAP_IB_SA 0x00000010
  479. #define RDMA_CORE_CAP_OPA_MAD 0x00000020
  480. /* Address format 0x000FF000 */
  481. #define RDMA_CORE_CAP_AF_IB 0x00001000
  482. #define RDMA_CORE_CAP_ETH_AH 0x00002000
  483. #define RDMA_CORE_CAP_OPA_AH 0x00004000
  484. /* Protocol 0xFFF00000 */
  485. #define RDMA_CORE_CAP_PROT_IB 0x00100000
  486. #define RDMA_CORE_CAP_PROT_ROCE 0x00200000
  487. #define RDMA_CORE_CAP_PROT_IWARP 0x00400000
  488. #define RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP 0x00800000
  489. #define RDMA_CORE_CAP_PROT_RAW_PACKET 0x01000000
  490. #define RDMA_CORE_CAP_PROT_USNIC 0x02000000
  /*
   * Composite per-port capability sets. Each one ORs a single protocol bit
   * with the management and address-format bits that go with that port type.
   * The two RoCE sets differ only in the protocol bit, and the OPA set is the
   * IB set plus RDMA_CORE_CAP_OPA_MAD.
   */
  491. #define RDMA_CORE_PORT_IBA_IB (RDMA_CORE_CAP_PROT_IB \
  492. | RDMA_CORE_CAP_IB_MAD \
  493. | RDMA_CORE_CAP_IB_SMI \
  494. | RDMA_CORE_CAP_IB_CM \
  495. | RDMA_CORE_CAP_IB_SA \
  496. | RDMA_CORE_CAP_AF_IB)
  497. #define RDMA_CORE_PORT_IBA_ROCE (RDMA_CORE_CAP_PROT_ROCE \
  498. | RDMA_CORE_CAP_IB_MAD \
  499. | RDMA_CORE_CAP_IB_CM \
  500. | RDMA_CORE_CAP_AF_IB \
  501. | RDMA_CORE_CAP_ETH_AH)
  502. #define RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP \
  503. (RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP \
  504. | RDMA_CORE_CAP_IB_MAD \
  505. | RDMA_CORE_CAP_IB_CM \
  506. | RDMA_CORE_CAP_AF_IB \
  507. | RDMA_CORE_CAP_ETH_AH)
  508. #define RDMA_CORE_PORT_IWARP (RDMA_CORE_CAP_PROT_IWARP \
  509. | RDMA_CORE_CAP_IW_CM)
  510. #define RDMA_CORE_PORT_INTEL_OPA (RDMA_CORE_PORT_IBA_IB \
  511. | RDMA_CORE_CAP_OPA_MAD)
  512. #define RDMA_CORE_PORT_RAW_PACKET (RDMA_CORE_CAP_PROT_RAW_PACKET)
  513. #define RDMA_CORE_PORT_USNIC (RDMA_CORE_CAP_PROT_USNIC)
  514. struct ib_port_attr {
  515. u64 subnet_prefix;
  516. enum ib_port_state state;
  517. enum ib_mtu max_mtu;
  518. enum ib_mtu active_mtu;
  519. int gid_tbl_len;
  520. u32 port_cap_flags;
  521. u32 max_msg_sz;
  522. u32 bad_pkey_cntr;
  523. u32 qkey_viol_cntr;
  524. u16 pkey_tbl_len;
  525. u32 sm_lid;
  526. u32 lid;
  527. u8 lmc;
  528. u8 max_vl_num;
  529. u8 sm_sl;
  530. u8 subnet_timeout;
  531. u8 init_type_reply;
  532. u8 active_width;
  533. u8 active_speed;
  534. u8 phys_state;
  535. bool grh_required;
  536. };
  537. enum ib_device_modify_flags {
  538. IB_DEVICE_MODIFY_SYS_IMAGE_GUID = 1 << 0,
  539. IB_DEVICE_MODIFY_NODE_DESC = 1 << 1
  540. };
  541. #define IB_DEVICE_NODE_DESC_MAX 64
  542. struct ib_device_modify {
  543. u64 sys_image_guid;
  544. char node_desc[IB_DEVICE_NODE_DESC_MAX];
  545. };
  546. enum ib_port_modify_flags {
  547. IB_PORT_SHUTDOWN = 1,
  548. IB_PORT_INIT_TYPE = (1<<2),
  549. IB_PORT_RESET_QKEY_CNTR = (1<<3),
  550. IB_PORT_OPA_MASK_CHG = (1<<4)
  551. };
  552. struct ib_port_modify {
  553. u32 set_port_cap_mask;
  554. u32 clr_port_cap_mask;
  555. u8 init_type;
  556. };
  /*
   * Asynchronous event codes. The numeric values are written out explicitly;
   * they are the same values the compiler assigns to an unnumbered list.
   */
  enum ib_event_type {
      IB_EVENT_CQ_ERR                 = 0,
      IB_EVENT_QP_FATAL               = 1,
      IB_EVENT_QP_REQ_ERR             = 2,
      IB_EVENT_QP_ACCESS_ERR          = 3,
      IB_EVENT_COMM_EST               = 4,
      IB_EVENT_SQ_DRAINED             = 5,
      IB_EVENT_PATH_MIG               = 6,
      IB_EVENT_PATH_MIG_ERR           = 7,
      IB_EVENT_DEVICE_FATAL           = 8,
      IB_EVENT_PORT_ACTIVE            = 9,
      IB_EVENT_PORT_ERR               = 10,
      IB_EVENT_LID_CHANGE             = 11,
      IB_EVENT_PKEY_CHANGE            = 12,
      IB_EVENT_SM_CHANGE              = 13,
      IB_EVENT_SRQ_ERR                = 14,
      IB_EVENT_SRQ_LIMIT_REACHED      = 15,
      IB_EVENT_QP_LAST_WQE_REACHED    = 16,
      IB_EVENT_CLIENT_REREGISTER      = 17,
      IB_EVENT_GID_CHANGE             = 18,
      IB_EVENT_WQ_FATAL               = 19,
  };
  579. const char *__attribute_const__ ib_event_msg(enum ib_event_type event);
  580. struct ib_event {
  581. struct ib_device *device;
  582. union {
  583. struct ib_cq *cq;
  584. struct ib_qp *qp;
  585. struct ib_srq *srq;
  586. struct ib_wq *wq;
  587. u8 port_num;
  588. } element;
  589. enum ib_event_type event;
  590. };
  591. struct ib_event_handler {
  592. struct ib_device *device;
  593. void (*handler)(struct ib_event_handler *, struct ib_event *);
  594. struct list_head list;
  595. };
  596. #define INIT_IB_EVENT_HANDLER(_ptr, _device, _handler) \
  597. do { \
  598. (_ptr)->device = _device; \
  599. (_ptr)->handler = _handler; \
  600. INIT_LIST_HEAD(&(_ptr)->list); \
  601. } while (0)
  602. struct ib_global_route {
  603. union ib_gid dgid;
  604. u32 flow_label;
  605. u8 sgid_index;
  606. u8 hop_limit;
  607. u8 traffic_class;
  608. };
  609. struct ib_grh {
  610. __be32 version_tclass_flow;
  611. __be16 paylen;
  612. u8 next_hdr;
  613. u8 hop_limit;
  614. union ib_gid sgid;
  615. union ib_gid dgid;
  616. };
  617. union rdma_network_hdr {
  618. struct ib_grh ibgrh;
  619. struct {
  620. /* The IB spec states that if it's IPv4, the header
  621. * is located in the last 20 bytes of the header.
  622. */
  623. u8 reserved[20];
  624. struct iphdr roce4grh;
  625. };
  626. };
  /* Mask covering the low 24 bits. */
  #define IB_QPN_MASK 0xFFFFFF

  /* Multicast QP number: all 24 bits set. */
  enum {
      IB_MULTICAST_QPN = 0xffffff
  };

  /* LID constants, already converted to big-endian 16-bit form. */
  #define IB_LID_PERMISSIVE       cpu_to_be16(0xFFFF)
  #define IB_MULTICAST_LID_BASE   cpu_to_be16(0xC000)

  /* Address handle flags. */
  enum ib_ah_flags {
      IB_AH_GRH = 1
  };
  /*
   * Link rate codes. The numeric values are NOT ordered by speed (for
   * example 5 Gbps is 5 while 10 Gbps is 3), so never compare them
   * numerically; use ib_rate_to_mult() or ib_rate_to_mbps() instead.
   */
  enum ib_rate {
      IB_RATE_PORT_CURRENT    = 0,
      IB_RATE_2_5_GBPS        = 2,
      IB_RATE_5_GBPS          = 5,
      IB_RATE_10_GBPS         = 3,
      IB_RATE_20_GBPS         = 6,
      IB_RATE_30_GBPS         = 4,
      IB_RATE_40_GBPS         = 7,
      IB_RATE_60_GBPS         = 8,
      IB_RATE_80_GBPS         = 9,
      IB_RATE_120_GBPS        = 10,
      IB_RATE_14_GBPS         = 11,
      IB_RATE_56_GBPS         = 12,
      IB_RATE_112_GBPS        = 13,
      IB_RATE_168_GBPS        = 14,
      IB_RATE_25_GBPS         = 15,
      IB_RATE_100_GBPS        = 16,
      IB_RATE_200_GBPS        = 17,
      IB_RATE_300_GBPS        = 18
  };
  656. /**
  657. * ib_rate_to_mult - Convert the IB rate enum to a multiple of the
  658. * base rate of 2.5 Gbit/sec. For example, IB_RATE_5_GBPS will be
  659. * converted to 2, since 5 Gbit/sec is 2 * 2.5 Gbit/sec.
  660. * @rate: rate to convert.
  661. */
  662. __attribute_const__ int ib_rate_to_mult(enum ib_rate rate);
  663. /**
  664. * ib_rate_to_mbps - Convert the IB rate enum to Mbps.
  665. * For example, IB_RATE_2_5_GBPS will be converted to 2500.
  666. * @rate: rate to convert.
  667. */
  668. __attribute_const__ int ib_rate_to_mbps(enum ib_rate rate);
  /**
   * enum ib_mr_type - memory region type
   * @IB_MR_TYPE_MEM_REG:   memory region used for normal registration
   * @IB_MR_TYPE_SIGNATURE: memory region used for signature operations
   *                        (data-integrity capable regions)
   * @IB_MR_TYPE_SG_GAPS:   memory region capable of registering arbitrary
   *                        sg lists (without the normal mr constraints -
   *                        see ib_map_mr_sg)
   */
  enum ib_mr_type {
      IB_MR_TYPE_MEM_REG,
      IB_MR_TYPE_SIGNATURE,
      IB_MR_TYPE_SG_GAPS,
  };
  /**
   * enum ib_signature_type - signature types
   * @IB_SIG_TYPE_NONE:    Unprotected.
   * @IB_SIG_TYPE_T10_DIF: Type T10-DIF
   */
  enum ib_signature_type {
      IB_SIG_TYPE_NONE,
      IB_SIG_TYPE_T10_DIF,
  };

  /**
   * enum ib_t10_dif_bg_type - signature T10-DIF block-guard types
   * @IB_T10DIF_CRC:  Corresponds to T10-PI mandated CRC checksum rules.
   * @IB_T10DIF_CSUM: Corresponds to IP checksum rules.
   */
  enum ib_t10_dif_bg_type {
      IB_T10DIF_CRC,
      IB_T10DIF_CSUM
  };
  704. /**
  705. * struct ib_t10_dif_domain - Parameters specific for T10-DIF
  706. * domain.
  707. * @bg_type: T10-DIF block guard type (CRC|CSUM)
  708. * @pi_interval: protection information interval.
  709. * @bg: seed of guard computation.
  710. * @app_tag: application tag of guard block
  711. * @ref_tag: initial guard block reference tag.
  712. * @ref_remap: Indicate wethear the reftag increments each block
  713. * @app_escape: Indicate to skip block check if apptag=0xffff
  714. * @ref_escape: Indicate to skip block check if reftag=0xffffffff
  715. * @apptag_check_mask: check bitmask of application tag.
  716. */
  717. struct ib_t10_dif_domain {
  718. enum ib_t10_dif_bg_type bg_type;
  719. u16 pi_interval;
  720. u16 bg;
  721. u16 app_tag;
  722. u32 ref_tag;
  723. bool ref_remap;
  724. bool app_escape;
  725. bool ref_escape;
  726. u16 apptag_check_mask;
  727. };
  728. /**
  729. * struct ib_sig_domain - Parameters for signature domain
  730. * @sig_type: specific signauture type
  731. * @sig: union of all signature domain attributes that may
  732. * be used to set domain layout.
  733. */
  734. struct ib_sig_domain {
  735. enum ib_signature_type sig_type;
  736. union {
  737. struct ib_t10_dif_domain dif;
  738. } sig;
  739. };
  740. /**
  741. * struct ib_sig_attrs - Parameters for signature handover operation
  742. * @check_mask: bitmask for signature byte check (8 bytes)
  743. * @mem: memory domain layout desciptor.
  744. * @wire: wire domain layout desciptor.
  745. */
  746. struct ib_sig_attrs {
  747. u8 check_mask;
  748. struct ib_sig_domain mem;
  749. struct ib_sig_domain wire;
  750. };
  751. enum ib_sig_err_type {
  752. IB_SIG_BAD_GUARD,
  753. IB_SIG_BAD_REFTAG,
  754. IB_SIG_BAD_APPTAG,
  755. };
  756. /**
  757. * struct ib_sig_err - signature error descriptor
  758. */
  759. struct ib_sig_err {
  760. enum ib_sig_err_type err_type;
  761. u32 expected;
  762. u32 actual;
  763. u64 sig_err_offset;
  764. u32 key;
  765. };
  766. enum ib_mr_status_check {
  767. IB_MR_CHECK_SIG_STATUS = 1,
  768. };
  769. /**
  770. * struct ib_mr_status - Memory region status container
  771. *
  772. * @fail_status: Bitmask of MR checks status. For each
  773. * failed check a corresponding status bit is set.
  774. * @sig_err: Additional info for IB_MR_CEHCK_SIG_STATUS
  775. * failure.
  776. */
  777. struct ib_mr_status {
  778. u32 fail_status;
  779. struct ib_sig_err sig_err;
  780. };
  781. /**
  782. * mult_to_ib_rate - Convert a multiple of 2.5 Gbit/sec to an IB rate
  783. * enum.
  784. * @mult: multiple to convert.
  785. */
  786. __attribute_const__ enum ib_rate mult_to_ib_rate(int mult);
  /*
   * Selects which member of the anonymous union in struct rdma_ah_attr
   * (ib, roce or opa) applies.
   */
  enum rdma_ah_attr_type {
      RDMA_AH_ATTR_TYPE_UNDEFINED = 0,
      RDMA_AH_ATTR_TYPE_IB        = 1,
      RDMA_AH_ATTR_TYPE_ROCE      = 2,
      RDMA_AH_ATTR_TYPE_OPA       = 3,
  };
  793. struct ib_ah_attr {
  794. u16 dlid;
  795. u8 src_path_bits;
  796. };
  797. struct roce_ah_attr {
  798. u8 dmac[ETH_ALEN];
  799. };
  800. struct opa_ah_attr {
  801. u32 dlid;
  802. u8 src_path_bits;
  803. bool make_grd;
  804. };
  805. struct rdma_ah_attr {
  806. struct ib_global_route grh;
  807. u8 sl;
  808. u8 static_rate;
  809. u8 port_num;
  810. u8 ah_flags;
  811. enum rdma_ah_attr_type type;
  812. union {
  813. struct ib_ah_attr ib;
  814. struct roce_ah_attr roce;
  815. struct opa_ah_attr opa;
  816. };
  817. };
  /*
   * Work completion status codes; IB_WC_SUCCESS is zero. Values are written
   * out explicitly and equal the implicit sequential numbering.
   */
  enum ib_wc_status {
      IB_WC_SUCCESS               = 0,
      IB_WC_LOC_LEN_ERR           = 1,
      IB_WC_LOC_QP_OP_ERR         = 2,
      IB_WC_LOC_EEC_OP_ERR        = 3,
      IB_WC_LOC_PROT_ERR          = 4,
      IB_WC_WR_FLUSH_ERR          = 5,
      IB_WC_MW_BIND_ERR           = 6,
      IB_WC_BAD_RESP_ERR          = 7,
      IB_WC_LOC_ACCESS_ERR        = 8,
      IB_WC_REM_INV_REQ_ERR       = 9,
      IB_WC_REM_ACCESS_ERR        = 10,
      IB_WC_REM_OP_ERR            = 11,
      IB_WC_RETRY_EXC_ERR         = 12,
      IB_WC_RNR_RETRY_EXC_ERR     = 13,
      IB_WC_LOC_RDD_VIOL_ERR      = 14,
      IB_WC_REM_INV_RD_REQ_ERR    = 15,
      IB_WC_REM_ABORT_ERR         = 16,
      IB_WC_INV_EECN_ERR          = 17,
      IB_WC_INV_EEC_STATE_ERR     = 18,
      IB_WC_FATAL_ERR             = 19,
      IB_WC_RESP_TIMEOUT_ERR      = 20,
      IB_WC_GENERAL_ERR           = 21
  };
  842. const char *__attribute_const__ ib_wc_status_msg(enum ib_wc_status status);
  /* Work completion opcodes. */
  enum ib_wc_opcode {
      IB_WC_SEND              = 0,
      IB_WC_RDMA_WRITE        = 1,
      IB_WC_RDMA_READ         = 2,
      IB_WC_COMP_SWAP         = 3,
      IB_WC_FETCH_ADD         = 4,
      IB_WC_LSO               = 5,
      IB_WC_LOCAL_INV         = 6,
      IB_WC_REG_MR            = 7,
      IB_WC_MASKED_COMP_SWAP  = 8,
      IB_WC_MASKED_FETCH_ADD  = 9,
      /*
       * IB_WC_RECV is given its own bit so consumers can tell that a
       * completion is a receive by testing (opcode & IB_WC_RECV).
       */
      IB_WC_RECV              = (1 << 7),
      IB_WC_RECV_RDMA_WITH_IMM
  };
  /* Bit flags stored in ib_wc.wc_flags. */
  enum ib_wc_flags {
      IB_WC_GRH                   = 1 << 0,
      IB_WC_WITH_IMM              = 1 << 1,
      IB_WC_WITH_INVALIDATE       = 1 << 2,
      IB_WC_IP_CSUM_OK            = 1 << 3,
      IB_WC_WITH_SMAC             = 1 << 4,
      IB_WC_WITH_VLAN             = 1 << 5,
      IB_WC_WITH_NETWORK_HDR_TYPE = 1 << 6,
  };
  870. struct ib_wc {
  871. union {
  872. u64 wr_id;
  873. struct ib_cqe *wr_cqe;
  874. };
  875. enum ib_wc_status status;
  876. enum ib_wc_opcode opcode;
  877. u32 vendor_err;
  878. u32 byte_len;
  879. struct ib_qp *qp;
  880. union {
  881. __be32 imm_data;
  882. u32 invalidate_rkey;
  883. } ex;
  884. u32 src_qp;
  885. u32 slid;
  886. int wc_flags;
  887. u16 pkey_index;
  888. u8 sl;
  889. u8 dlid_path_bits;
  890. u8 port_num; /* valid only for DR SMPs on switches */
  891. u8 smac[ETH_ALEN];
  892. u16 vlan_id;
  893. u8 network_hdr_type;
  894. };
  /*
   * CQ notification request flags. IB_CQ_SOLICITED_MASK is the OR of the
   * two notification-type bits.
   */
  enum ib_cq_notify_flags {
      IB_CQ_SOLICITED             = (1 << 0),
      IB_CQ_NEXT_COMP             = (1 << 1),
      IB_CQ_SOLICITED_MASK        = (IB_CQ_SOLICITED | IB_CQ_NEXT_COMP),
      IB_CQ_REPORT_MISSED_EVENTS  = (1 << 2),
  };
  /* Shared receive queue types. */
  enum ib_srq_type {
      IB_SRQT_BASIC,
      IB_SRQT_XRC,
      IB_SRQT_TM,
  };

  /*
   * ib_srq_has_cq - tell whether an SRQ type has a CQ.
   * @srq_type: SRQ type to test.
   *
   * Return: true for IB_SRQT_XRC and IB_SRQT_TM, false for anything else.
   */
  static inline bool ib_srq_has_cq(enum ib_srq_type srq_type)
  {
      switch (srq_type) {
      case IB_SRQT_XRC:
      case IB_SRQT_TM:
          return true;
      default:
          return false;
      }
  }
  911. enum ib_srq_attr_mask {
  912. IB_SRQ_MAX_WR = 1 << 0,
  913. IB_SRQ_LIMIT = 1 << 1,
  914. };
  915. struct ib_srq_attr {
  916. u32 max_wr;
  917. u32 max_sge;
  918. u32 srq_limit;
  919. };
  920. struct ib_srq_init_attr {
  921. void (*event_handler)(struct ib_event *, void *);
  922. void *srq_context;
  923. struct ib_srq_attr attr;
  924. enum ib_srq_type srq_type;
  925. struct {
  926. struct ib_cq *cq;
  927. union {
  928. struct {
  929. struct ib_xrcd *xrcd;
  930. } xrc;
  931. struct {
  932. u32 max_num_tags;
  933. } tag_matching;
  934. };
  935. } ext;
  936. };
  937. struct ib_qp_cap {
  938. u32 max_send_wr;
  939. u32 max_recv_wr;
  940. u32 max_send_sge;
  941. u32 max_recv_sge;
  942. u32 max_inline_data;
  943. /*
  944. * Maximum number of rdma_rw_ctx structures in flight at a time.
  945. * ib_create_qp() will calculate the right amount of neededed WRs
  946. * and MRs based on this.
  947. */
  948. u32 max_rdma_ctxs;
  949. };
  /* Send queue signaling type. */
  enum ib_sig_type {
      IB_SIGNAL_ALL_WR,
      IB_SIGNAL_REQ_WR
  };

  /* Queue pair types. */
  enum ib_qp_type {
      /*
       * IB_QPT_SMI and IB_QPT_GSI have to be the first two entries
       * here (and in that order) since the MAD layer uses them as
       * indices into a 2-entry table.
       */
      IB_QPT_SMI,
      IB_QPT_GSI,

      IB_QPT_RC,
      IB_QPT_UC,
      IB_QPT_UD,
      IB_QPT_RAW_IPV6,
      IB_QPT_RAW_ETHERTYPE,
      /* value 7 is not assigned */
      IB_QPT_RAW_PACKET = 8,
      IB_QPT_XRC_INI = 9,
      IB_QPT_XRC_TGT,
      IB_QPT_MAX,
      IB_QPT_DRIVER = 0xFF,
      /*
       * Reserve a range for qp types internal to the low level driver.
       * These qp types will not be visible at the IB core layer, so the
       * IB_QPT_MAX usages should not be affected in the core layer
       */
      IB_QPT_RESERVED1 = 0x1000,
      IB_QPT_RESERVED2,
      IB_QPT_RESERVED3,
      IB_QPT_RESERVED4,
      IB_QPT_RESERVED5,
      IB_QPT_RESERVED6,
      IB_QPT_RESERVED7,
      IB_QPT_RESERVED8,
      IB_QPT_RESERVED9,
      IB_QPT_RESERVED10,
  };
  /* QP creation flags; bit 7 is currently free. */
  enum ib_qp_create_flags {
      IB_QP_CREATE_IPOIB_UD_LSO               = 1 << 0,
      IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK   = 1 << 1,
      IB_QP_CREATE_CROSS_CHANNEL              = 1 << 2,
      IB_QP_CREATE_MANAGED_SEND               = 1 << 3,
      IB_QP_CREATE_MANAGED_RECV               = 1 << 4,
      IB_QP_CREATE_NETIF_QP                   = 1 << 5,
      IB_QP_CREATE_SIGNATURE_EN               = 1 << 6,
      /* FREE                                 = 1 << 7, */
      IB_QP_CREATE_SCATTER_FCS                = 1 << 8,
      IB_QP_CREATE_CVLAN_STRIPPING            = 1 << 9,
      IB_QP_CREATE_SOURCE_QPN                 = 1 << 10,
      IB_QP_CREATE_PCI_WRITE_END_PADDING      = 1 << 11,

      /* reserve bits 26-31 for low level drivers' internal use */
      IB_QP_CREATE_RESERVED_START             = 1 << 26,
      IB_QP_CREATE_RESERVED_END               = 1 << 31,
  };
  1004. /*
  1005. * Note: users may not call ib_close_qp or ib_destroy_qp from the event_handler
  1006. * callback to destroy the passed in QP.
  1007. */
  1008. struct ib_qp_init_attr {
  1009. void (*event_handler)(struct ib_event *, void *);
  1010. void *qp_context;
  1011. struct ib_cq *send_cq;
  1012. struct ib_cq *recv_cq;
  1013. struct ib_srq *srq;
  1014. struct ib_xrcd *xrcd; /* XRC TGT QPs only */
  1015. struct ib_qp_cap cap;
  1016. enum ib_sig_type sq_sig_type;
  1017. enum ib_qp_type qp_type;
  1018. enum ib_qp_create_flags create_flags;
  1019. /*
  1020. * Only needed for special QP types, or when using the RW API.
  1021. */
  1022. u8 port_num;
  1023. struct ib_rwq_ind_table *rwq_ind_tbl;
  1024. u32 source_qpn;
  1025. };
  1026. struct ib_qp_open_attr {
  1027. void (*event_handler)(struct ib_event *, void *);
  1028. void *qp_context;
  1029. u32 qp_num;
  1030. enum ib_qp_type qp_type;
  1031. };
  /*
   * RNR timer codes (0..31). The name suffix encodes the delay as
   * <integer>_<hundredths>, e.g. IB_RNR_TIMER_000_01 is 0.01.
   * NOTE(review): the unit is presumably milliseconds per the IB spec -
   * confirm there. Code 0 is the longest delay, not the shortest.
   */
  enum ib_rnr_timeout {
      IB_RNR_TIMER_655_36 = 0,
      IB_RNR_TIMER_000_01 = 1,
      IB_RNR_TIMER_000_02 = 2,
      IB_RNR_TIMER_000_03 = 3,
      IB_RNR_TIMER_000_04 = 4,
      IB_RNR_TIMER_000_06 = 5,
      IB_RNR_TIMER_000_08 = 6,
      IB_RNR_TIMER_000_12 = 7,
      IB_RNR_TIMER_000_16 = 8,
      IB_RNR_TIMER_000_24 = 9,
      IB_RNR_TIMER_000_32 = 10,
      IB_RNR_TIMER_000_48 = 11,
      IB_RNR_TIMER_000_64 = 12,
      IB_RNR_TIMER_000_96 = 13,
      IB_RNR_TIMER_001_28 = 14,
      IB_RNR_TIMER_001_92 = 15,
      IB_RNR_TIMER_002_56 = 16,
      IB_RNR_TIMER_003_84 = 17,
      IB_RNR_TIMER_005_12 = 18,
      IB_RNR_TIMER_007_68 = 19,
      IB_RNR_TIMER_010_24 = 20,
      IB_RNR_TIMER_015_36 = 21,
      IB_RNR_TIMER_020_48 = 22,
      IB_RNR_TIMER_030_72 = 23,
      IB_RNR_TIMER_040_96 = 24,
      IB_RNR_TIMER_061_44 = 25,
      IB_RNR_TIMER_081_92 = 26,
      IB_RNR_TIMER_122_88 = 27,
      IB_RNR_TIMER_163_84 = 28,
      IB_RNR_TIMER_245_76 = 29,
      IB_RNR_TIMER_327_68 = 30,
      IB_RNR_TIMER_491_52 = 31
  };
  /*
   * QP attribute mask bits.
   * NOTE(review): presumably each bit marks the matching field(s) of
   * struct ib_qp_attr as valid in a modify/query call - confirm in the core.
   */
  enum ib_qp_attr_mask {
      IB_QP_STATE                 = 1 << 0,
      IB_QP_CUR_STATE             = 1 << 1,
      IB_QP_EN_SQD_ASYNC_NOTIFY   = 1 << 2,
      IB_QP_ACCESS_FLAGS          = 1 << 3,
      IB_QP_PKEY_INDEX            = 1 << 4,
      IB_QP_PORT                  = 1 << 5,
      IB_QP_QKEY                  = 1 << 6,
      IB_QP_AV                    = 1 << 7,
      IB_QP_PATH_MTU              = 1 << 8,
      IB_QP_TIMEOUT               = 1 << 9,
      IB_QP_RETRY_CNT             = 1 << 10,
      IB_QP_RNR_RETRY             = 1 << 11,
      IB_QP_RQ_PSN                = 1 << 12,
      IB_QP_MAX_QP_RD_ATOMIC      = 1 << 13,
      IB_QP_ALT_PATH              = 1 << 14,
      IB_QP_MIN_RNR_TIMER         = 1 << 15,
      IB_QP_SQ_PSN                = 1 << 16,
      IB_QP_MAX_DEST_RD_ATOMIC    = 1 << 17,
      IB_QP_PATH_MIG_STATE        = 1 << 18,
      IB_QP_CAP                   = 1 << 19,
      IB_QP_DEST_QPN              = 1 << 20,
      IB_QP_RESERVED1             = 1 << 21,
      IB_QP_RESERVED2             = 1 << 22,
      IB_QP_RESERVED3             = 1 << 23,
      IB_QP_RESERVED4             = 1 << 24,
      IB_QP_RATE_LIMIT            = 1 << 25,
  };
  /* Queue pair states. */
  enum ib_qp_state {
      IB_QPS_RESET    = 0,
      IB_QPS_INIT     = 1,
      IB_QPS_RTR      = 2,
      IB_QPS_RTS      = 3,
      IB_QPS_SQD      = 4,
      IB_QPS_SQE      = 5,
      IB_QPS_ERR      = 6
  };

  /* Path migration states. */
  enum ib_mig_state {
      IB_MIG_MIGRATED = 0,
      IB_MIG_REARM    = 1,
      IB_MIG_ARMED    = 2
  };

  /* Memory window types; numbering starts at 1. */
  enum ib_mw_type {
      IB_MW_TYPE_1 = 1,
      IB_MW_TYPE_2 = 2
  };
  1112. struct ib_qp_attr {
  1113. enum ib_qp_state qp_state;
  1114. enum ib_qp_state cur_qp_state;
  1115. enum ib_mtu path_mtu;
  1116. enum ib_mig_state path_mig_state;
  1117. u32 qkey;
  1118. u32 rq_psn;
  1119. u32 sq_psn;
  1120. u32 dest_qp_num;
  1121. int qp_access_flags;
  1122. struct ib_qp_cap cap;
  1123. struct rdma_ah_attr ah_attr;
  1124. struct rdma_ah_attr alt_ah_attr;
  1125. u16 pkey_index;
  1126. u16 alt_pkey_index;
  1127. u8 en_sqd_async_notify;
  1128. u8 sq_draining;
  1129. u8 max_rd_atomic;
  1130. u8 max_dest_rd_atomic;
  1131. u8 min_rnr_timer;
  1132. u8 port_num;
  1133. u8 timeout;
  1134. u8 retry_cnt;
  1135. u8 rnr_retry;
  1136. u8 alt_port_num;
  1137. u8 alt_timeout;
  1138. u32 rate_limit;
  1139. };
  /* Work request opcodes. */
  enum ib_wr_opcode {
      IB_WR_RDMA_WRITE                    = 0,
      IB_WR_RDMA_WRITE_WITH_IMM           = 1,
      IB_WR_SEND                          = 2,
      IB_WR_SEND_WITH_IMM                 = 3,
      IB_WR_RDMA_READ                     = 4,
      IB_WR_ATOMIC_CMP_AND_SWP            = 5,
      IB_WR_ATOMIC_FETCH_AND_ADD          = 6,
      IB_WR_LSO                           = 7,
      IB_WR_SEND_WITH_INV                 = 8,
      IB_WR_RDMA_READ_WITH_INV            = 9,
      IB_WR_LOCAL_INV                     = 10,
      IB_WR_REG_MR                        = 11,
      IB_WR_MASKED_ATOMIC_CMP_AND_SWP     = 12,
      IB_WR_MASKED_ATOMIC_FETCH_AND_ADD   = 13,
      IB_WR_REG_SIG_MR                    = 14,

      /*
       * reserve values for low level drivers' internal use.
       * These values will not be used at all in the ib core layer.
       */
      IB_WR_RESERVED1 = 0xf0,
      IB_WR_RESERVED2,
      IB_WR_RESERVED3,
      IB_WR_RESERVED4,
      IB_WR_RESERVED5,
      IB_WR_RESERVED6,
      IB_WR_RESERVED7,
      IB_WR_RESERVED8,
      IB_WR_RESERVED9,
      IB_WR_RESERVED10,
  };
  /* Send work request flags. */
  enum ib_send_flags {
      IB_SEND_FENCE           = 1 << 0,
      IB_SEND_SIGNALED        = 1 << 1,
      IB_SEND_SOLICITED       = 1 << 2,
      IB_SEND_INLINE          = 1 << 3,
      IB_SEND_IP_CSUM         = 1 << 4,

      /* reserve bits 26-31 for low level drivers' internal use */
      IB_SEND_RESERVED_START  = 1 << 26,
      IB_SEND_RESERVED_END    = 1 << 31,
  };
  1180. struct ib_sge {
  1181. u64 addr;
  1182. u32 length;
  1183. u32 lkey;
  1184. };
  1185. struct ib_cqe {
  1186. void (*done)(struct ib_cq *cq, struct ib_wc *wc);
  1187. };
  1188. struct ib_send_wr {
  1189. struct ib_send_wr *next;
  1190. union {
  1191. u64 wr_id;
  1192. struct ib_cqe *wr_cqe;
  1193. };
  1194. struct ib_sge *sg_list;
  1195. int num_sge;
  1196. enum ib_wr_opcode opcode;
  1197. int send_flags;
  1198. union {
  1199. __be32 imm_data;
  1200. u32 invalidate_rkey;
  1201. } ex;
  1202. };
  1203. struct ib_rdma_wr {
  1204. struct ib_send_wr wr;
  1205. u64 remote_addr;
  1206. u32 rkey;
  1207. };
  1208. static inline struct ib_rdma_wr *rdma_wr(struct ib_send_wr *wr)
  1209. {
  1210. return container_of(wr, struct ib_rdma_wr, wr);
  1211. }
  1212. struct ib_atomic_wr {
  1213. struct ib_send_wr wr;
  1214. u64 remote_addr;
  1215. u64 compare_add;
  1216. u64 swap;
  1217. u64 compare_add_mask;
  1218. u64 swap_mask;
  1219. u32 rkey;
  1220. };
  1221. static inline struct ib_atomic_wr *atomic_wr(struct ib_send_wr *wr)
  1222. {
  1223. return container_of(wr, struct ib_atomic_wr, wr);
  1224. }
  1225. struct ib_ud_wr {
  1226. struct ib_send_wr wr;
  1227. struct ib_ah *ah;
  1228. void *header;
  1229. int hlen;
  1230. int mss;
  1231. u32 remote_qpn;
  1232. u32 remote_qkey;
  1233. u16 pkey_index; /* valid for GSI only */
  1234. u8 port_num; /* valid for DR SMPs on switch only */
  1235. };
  1236. static inline struct ib_ud_wr *ud_wr(struct ib_send_wr *wr)
  1237. {
  1238. return container_of(wr, struct ib_ud_wr, wr);
  1239. }
  1240. struct ib_reg_wr {
  1241. struct ib_send_wr wr;
  1242. struct ib_mr *mr;
  1243. u32 key;
  1244. int access;
  1245. };
  1246. static inline struct ib_reg_wr *reg_wr(struct ib_send_wr *wr)
  1247. {
  1248. return container_of(wr, struct ib_reg_wr, wr);
  1249. }
  1250. struct ib_sig_handover_wr {
  1251. struct ib_send_wr wr;
  1252. struct ib_sig_attrs *sig_attrs;
  1253. struct ib_mr *sig_mr;
  1254. int access_flags;
  1255. struct ib_sge *prot;
  1256. };
  1257. static inline struct ib_sig_handover_wr *sig_handover_wr(struct ib_send_wr *wr)
  1258. {
  1259. return container_of(wr, struct ib_sig_handover_wr, wr);
  1260. }
  1261. struct ib_recv_wr {
  1262. struct ib_recv_wr *next;
  1263. union {
  1264. u64 wr_id;
  1265. struct ib_cqe *wr_cqe;
  1266. };
  1267. struct ib_sge *sg_list;
  1268. int num_sge;
  1269. };
  /* Memory access flags. */
  enum ib_access_flags {
      IB_ACCESS_LOCAL_WRITE   = 1 << 0,
      IB_ACCESS_REMOTE_WRITE  = 1 << 1,
      IB_ACCESS_REMOTE_READ   = 1 << 2,
      IB_ACCESS_REMOTE_ATOMIC = 1 << 3,
      IB_ACCESS_MW_BIND       = 1 << 4,
      IB_ZERO_BASED           = 1 << 5,
      IB_ACCESS_ON_DEMAND     = 1 << 6,
      IB_ACCESS_HUGETLB       = 1 << 7,
  };
  /*
   * XXX: these are apparently used for ->rereg_user_mr, no idea why they
   * are hidden here instead of a uapi header!
   *
   * IB_MR_REREG_SUPPORTED is the mask of every flag up to and including
   * IB_MR_REREG_ACCESS.
   */
  enum ib_mr_rereg_flags {
      IB_MR_REREG_TRANS       = 1 << 0,
      IB_MR_REREG_PD          = 1 << 1,
      IB_MR_REREG_ACCESS      = 1 << 2,
      IB_MR_REREG_SUPPORTED   = ((IB_MR_REREG_ACCESS << 1) - 1)
  };
  1290. struct ib_fmr_attr {
  1291. int max_pages;
  1292. int max_maps;
  1293. u8 page_shift;
  1294. };
  1295. struct ib_umem;
  /* Why a uobject is being removed. */
  enum rdma_remove_reason {
      /* Userspace requested uobject deletion. Call could fail */
      RDMA_REMOVE_DESTROY,
      /* Context deletion. This call should delete the actual object itself */
      RDMA_REMOVE_CLOSE,
      /*
       * Driver is being hot-unplugged. This call should delete the actual
       * object itself
       */
      RDMA_REMOVE_DRIVER_REMOVE,
      /* Context is being cleaned-up, but commit was just completed */
      RDMA_REMOVE_DURING_CLEANUP,
  };
  /*
   * struct ib_rdmacg_object - rdma cgroup ownership record.
   *
   * The structure has no members unless CONFIG_CGROUP_RDMA is enabled.
   */
  struct ib_rdmacg_object {
  #ifdef CONFIG_CGROUP_RDMA
      struct rdma_cgroup  *cg;    /* owner rdma cgroup */
  #endif
  };
  1311. struct ib_ucontext {
  1312. struct ib_device *device;
  1313. struct ib_uverbs_file *ufile;
  1314. int closing;
  1315. /* locking the uobjects_list */
  1316. struct mutex uobjects_lock;
  1317. struct list_head uobjects;
  1318. /* protects cleanup process from other actions */
  1319. struct rw_semaphore cleanup_rwsem;
  1320. enum rdma_remove_reason cleanup_reason;
  1321. struct pid *tgid;
  1322. #ifdef CONFIG_INFINIBAND_ON_DEMAND_PAGING
  1323. struct rb_root_cached umem_tree;
  1324. /*
  1325. * Protects .umem_rbroot and tree, as well as odp_mrs_count and
  1326. * mmu notifiers registration.
  1327. */
  1328. struct rw_semaphore umem_rwsem;
  1329. void (*invalidate_range)(struct ib_umem *umem,
  1330. unsigned long start, unsigned long end);
  1331. struct mmu_notifier mn;
  1332. atomic_t notifier_count;
  1333. /* A list of umems that don't have private mmu notifier counters yet. */
  1334. struct list_head no_private_counters;
  1335. int odp_mrs_count;
  1336. #endif
  1337. struct ib_rdmacg_object cg_obj;
  1338. };
  1339. struct ib_uobject {
  1340. u64 user_handle; /* handle given to us by userspace */
  1341. struct ib_ucontext *context; /* associated user context */
  1342. void *object; /* containing object */
  1343. struct list_head list; /* link to context's list */
  1344. struct ib_rdmacg_object cg_obj; /* rdmacg object */
  1345. int id; /* index into kernel idr */
  1346. struct kref ref;
  1347. atomic_t usecnt; /* protects exclusive access */
  1348. struct rcu_head rcu; /* kfree_rcu() overhead */
  1349. const struct uverbs_obj_type *type;
  1350. };
  1351. struct ib_uobject_file {
  1352. struct ib_uobject uobj;
  1353. /* ufile contains the lock between context release and file close */
  1354. struct ib_uverbs_file *ufile;
  1355. };
  1356. struct ib_udata {
  1357. const void __user *inbuf;
  1358. void __user *outbuf;
  1359. size_t inlen;
  1360. size_t outlen;
  1361. };
  1362. struct ib_pd {
  1363. u32 local_dma_lkey;
  1364. u32 flags;
  1365. struct ib_device *device;
  1366. struct ib_uobject *uobject;
  1367. atomic_t usecnt; /* count all resources */
  1368. u32 unsafe_global_rkey;
  1369. /*
  1370. * Implementation details of the RDMA core, don't use in drivers:
  1371. */
  1372. struct ib_mr *__internal_mr;
  1373. struct rdma_restrack_entry res;
  1374. };
  1375. struct ib_xrcd {
  1376. struct ib_device *device;
  1377. atomic_t usecnt; /* count all exposed resources */
  1378. struct inode *inode;
  1379. struct mutex tgt_qp_mutex;
  1380. struct list_head tgt_qp_list;
  1381. /*
  1382. * Implementation details of the RDMA core, don't use in drivers:
  1383. */
  1384. struct rdma_restrack_entry res;
  1385. };
  1386. struct ib_ah {
  1387. struct ib_device *device;
  1388. struct ib_pd *pd;
  1389. struct ib_uobject *uobject;
  1390. enum rdma_ah_attr_type type;
  1391. };
  /* Completion callback type: receives the CQ and a context pointer. */
  typedef void (*ib_comp_handler)(struct ib_cq *cq, void *cq_context);

  /* Where a CQ is polled from. */
  enum ib_poll_context {
      IB_POLL_DIRECT      = 0,    /* caller context, no hw completions */
      IB_POLL_SOFTIRQ     = 1,    /* poll from softirq context */
      IB_POLL_WORKQUEUE   = 2,    /* poll from workqueue */
  };
  1398. struct ib_cq {
  1399. struct ib_device *device;
  1400. struct ib_uobject *uobject;
  1401. ib_comp_handler comp_handler;
  1402. void (*event_handler)(struct ib_event *, void *);
  1403. void *cq_context;
  1404. int cqe;
  1405. atomic_t usecnt; /* count number of work queues */
  1406. enum ib_poll_context poll_ctx;
  1407. struct ib_wc *wc;
  1408. union {
  1409. struct irq_poll iop;
  1410. struct work_struct work;
  1411. };
  1412. /*
  1413. * Implementation details of the RDMA core, don't use in drivers:
  1414. */
  1415. struct rdma_restrack_entry res;
  1416. };
  1417. struct ib_srq {
  1418. struct ib_device *device;
  1419. struct ib_pd *pd;
  1420. struct ib_uobject *uobject;
  1421. void (*event_handler)(struct ib_event *, void *);
  1422. void *srq_context;
  1423. enum ib_srq_type srq_type;
  1424. atomic_t usecnt;
  1425. struct {
  1426. struct ib_cq *cq;
  1427. union {
  1428. struct {
  1429. struct ib_xrcd *xrcd;
  1430. u32 srq_num;
  1431. } xrc;
  1432. };
  1433. } ext;
  1434. };
  /* Raw packet capability bits. */
  enum ib_raw_packet_caps {
      /*
       * Strip cvlan from incoming packet and report it in the matching work
       * completion is supported.
       */
      IB_RAW_PACKET_CAP_CVLAN_STRIPPING   = 1 << 0,
      /*
       * Scatter FCS field of an incoming packet to host memory is supported.
       */
      IB_RAW_PACKET_CAP_SCATTER_FCS       = 1 << 1,
      /* Checksum offloads are supported (for both send and receive). */
      IB_RAW_PACKET_CAP_IP_CSUM           = 1 << 2,
      /*
       * When a packet is received for an RQ with no receive WQEs, the
       * packet processing is delayed.
       */
      IB_RAW_PACKET_CAP_DELAY_DROP        = 1 << 3,
  };

  /* Work queue types; only a receive queue is defined. */
  enum ib_wq_type {
      IB_WQT_RQ
  };

  /* Work queue states. */
  enum ib_wq_state {
      IB_WQS_RESET,
      IB_WQS_RDY,
      IB_WQS_ERR
  };
  1458. struct ib_wq {
  1459. struct ib_device *device;
  1460. struct ib_uobject *uobject;
  1461. void *wq_context;
  1462. void (*event_handler)(struct ib_event *, void *);
  1463. struct ib_pd *pd;
  1464. struct ib_cq *cq;
  1465. u32 wq_num;
  1466. enum ib_wq_state state;
  1467. enum ib_wq_type wq_type;
  1468. atomic_t usecnt;
  1469. };
  1470. enum ib_wq_flags {
  1471. IB_WQ_FLAGS_CVLAN_STRIPPING = 1 << 0,
  1472. IB_WQ_FLAGS_SCATTER_FCS = 1 << 1,
  1473. IB_WQ_FLAGS_DELAY_DROP = 1 << 2,
  1474. IB_WQ_FLAGS_PCI_WRITE_END_PADDING = 1 << 3,
  1475. };
  1476. struct ib_wq_init_attr {
  1477. void *wq_context;
  1478. enum ib_wq_type wq_type;
  1479. u32 max_wr;
  1480. u32 max_sge;
  1481. struct ib_cq *cq;
  1482. void (*event_handler)(struct ib_event *, void *);
  1483. u32 create_flags; /* Use enum ib_wq_flags */
  1484. };
  1485. enum ib_wq_attr_mask {
  1486. IB_WQ_STATE = 1 << 0,
  1487. IB_WQ_CUR_STATE = 1 << 1,
  1488. IB_WQ_FLAGS = 1 << 2,
  1489. };
  1490. struct ib_wq_attr {
  1491. enum ib_wq_state wq_state;
  1492. enum ib_wq_state curr_wq_state;
  1493. u32 flags; /* Use enum ib_wq_flags */
  1494. u32 flags_mask; /* Use enum ib_wq_flags */
  1495. };
  1496. struct ib_rwq_ind_table {
  1497. struct ib_device *device;
  1498. struct ib_uobject *uobject;
  1499. atomic_t usecnt;
  1500. u32 ind_tbl_num;
  1501. u32 log_ind_tbl_size;
  1502. struct ib_wq **ind_tbl;
  1503. };
  1504. struct ib_rwq_ind_table_init_attr {
  1505. u32 log_ind_tbl_size;
  1506. /* Each entry is a pointer to Receive Work Queue */
  1507. struct ib_wq **ind_tbl;
  1508. };
  /* State of a struct ib_port_pkey entry. */
  enum port_pkey_state {
      IB_PORT_PKEY_NOT_VALID  = 0,
      IB_PORT_PKEY_VALID      = 1,
      IB_PORT_PKEY_LISTED     = 2,
  };
  1514. struct ib_qp_security;
  1515. struct ib_port_pkey {
  1516. enum port_pkey_state state;
  1517. u16 pkey_index;
  1518. u8 port_num;
  1519. struct list_head qp_list;
  1520. struct list_head to_error_list;
  1521. struct ib_qp_security *sec;
  1522. };
  1523. struct ib_ports_pkeys {
  1524. struct ib_port_pkey main;
  1525. struct ib_port_pkey alt;
  1526. };
  1527. struct ib_qp_security {
  1528. struct ib_qp *qp;
  1529. struct ib_device *dev;
  1530. /* Hold this mutex when changing port and pkey settings. */
  1531. struct mutex mutex;
  1532. struct ib_ports_pkeys *ports_pkeys;
  1533. /* A list of all open shared QP handles. Required to enforce security
  1534. * properly for all users of a shared QP.
  1535. */
  1536. struct list_head shared_qp_list;
  1537. void *security;
  1538. bool destroying;
  1539. atomic_t error_list_count;
  1540. struct completion error_complete;
  1541. int error_comps_pending;
  1542. };
  1543. /*
  1544. * @max_write_sge: Maximum SGE elements per RDMA WRITE request.
  1545. * @max_read_sge: Maximum SGE elements per RDMA READ request.
  1546. */
  1547. struct ib_qp {
  1548. struct ib_device *device;
  1549. struct ib_pd *pd;
  1550. struct ib_cq *send_cq;
  1551. struct ib_cq *recv_cq;
  1552. spinlock_t mr_lock;
  1553. int mrs_used;
  1554. struct list_head rdma_mrs;
  1555. struct list_head sig_mrs;
  1556. struct ib_srq *srq;
  1557. struct ib_xrcd *xrcd; /* XRC TGT QPs only */
  1558. struct list_head xrcd_list;
  1559. /* count times opened, mcast attaches, flow attaches */
  1560. atomic_t usecnt;
  1561. struct list_head open_list;
  1562. struct ib_qp *real_qp;
  1563. struct ib_uobject *uobject;
  1564. void (*event_handler)(struct ib_event *, void *);
  1565. void *qp_context;
  1566. u32 qp_num;
  1567. u32 max_write_sge;
  1568. u32 max_read_sge;
  1569. enum ib_qp_type qp_type;
  1570. struct ib_rwq_ind_table *rwq_ind_tbl;
  1571. struct ib_qp_security *qp_sec;
  1572. u8 port;
  1573. /*
  1574. * Implementation details of the RDMA core, don't use in drivers:
  1575. */
  1576. struct rdma_restrack_entry res;
  1577. };
  1578. struct ib_mr {
  1579. struct ib_device *device;
  1580. struct ib_pd *pd;
  1581. u32 lkey;
  1582. u32 rkey;
  1583. u64 iova;
  1584. u64 length;
  1585. unsigned int page_size;
  1586. bool need_inval;
  1587. union {
  1588. struct ib_uobject *uobject; /* user */
  1589. struct list_head qp_entry; /* FR */
  1590. };
  1591. };
  1592. struct ib_mw {
  1593. struct ib_device *device;
  1594. struct ib_pd *pd;
  1595. struct ib_uobject *uobject;
  1596. u32 rkey;
  1597. enum ib_mw_type type;
  1598. };
  1599. struct ib_fmr {
  1600. struct ib_device *device;
  1601. struct ib_pd *pd;
  1602. struct list_head list;
  1603. u32 lkey;
  1604. u32 rkey;
  1605. };
  /* Steering options supported for a flow rule. */
  enum ib_flow_attr_type {
      /* Steer according to the rule specifications. */
      IB_FLOW_ATTR_NORMAL      = 0x0,
      /*
       * Default unicast and multicast rule: receive all Eth traffic
       * which isn't steered to any QP.
       */
      IB_FLOW_ATTR_ALL_DEFAULT = 0x1,
      /*
       * Default multicast rule: receive all Eth multicast traffic
       * which isn't steered to any QP.
       */
      IB_FLOW_ATTR_MC_DEFAULT  = 0x2,
      /* Sniffer rule: receive all port traffic. */
      IB_FLOW_ATTR_SNIFFER     = 0x3
  };
  /* Header types (and actions) that a steering spec can describe. */
  enum ib_flow_spec_type {
      /* L2 headers */
      IB_FLOW_SPEC_ETH          = 0x20,
      IB_FLOW_SPEC_IB           = 0x22,
      /* L3 headers */
      IB_FLOW_SPEC_IPV4         = 0x30,
      IB_FLOW_SPEC_IPV6         = 0x31,
      /* L4 headers */
      IB_FLOW_SPEC_TCP          = 0x40,
      IB_FLOW_SPEC_UDP          = 0x41,
      IB_FLOW_SPEC_VXLAN_TUNNEL = 0x50,
      IB_FLOW_SPEC_INNER        = 0x100,
      /* Actions */
      IB_FLOW_SPEC_ACTION_TAG   = 0x1000,
      IB_FLOW_SPEC_ACTION_DROP  = 0x1001,
  };

  /* Covers the high nibble of the low byte, where the L2/L3/L4 values above differ. */
  #define IB_FLOW_SPEC_LAYER_MASK 0xF0
  #define IB_FLOW_SPEC_SUPPORT_LAYERS 8
  /*
   * The priority of a flow steering rule is determined by its domain:
   * a lower domain value means a higher priority.
   */
  enum ib_flow_domain {
      IB_FLOW_DOMAIN_USER,
      IB_FLOW_DOMAIN_ETHTOOL,
      IB_FLOW_DOMAIN_RFS,
      IB_FLOW_DOMAIN_NIC,
      IB_FLOW_DOMAIN_NUM    /* Must be last */
  };
  /* Flag bits for flow rules. */
  enum ib_flow_flags {
      /* Continue match, no steal. */
      IB_FLOW_ATTR_FLAGS_DONT_TRAP = 1UL << 1,
      /* Must be last. */
      IB_FLOW_ATTR_FLAGS_RESERVED  = 1UL << 2
  };
  1654. struct ib_flow_eth_filter {
  1655. u8 dst_mac[6];
  1656. u8 src_mac[6];
  1657. __be16 ether_type;
  1658. __be16 vlan_tag;
  1659. /* Must be last */
  1660. u8 real_sz[0];
  1661. };
  1662. struct ib_flow_spec_eth {
  1663. u32 type;
  1664. u16 size;
  1665. struct ib_flow_eth_filter val;
  1666. struct ib_flow_eth_filter mask;
  1667. };
  1668. struct ib_flow_ib_filter {
  1669. __be16 dlid;
  1670. __u8 sl;
  1671. /* Must be last */
  1672. u8 real_sz[0];
  1673. };
  1674. struct ib_flow_spec_ib {
  1675. u32 type;
  1676. u16 size;
  1677. struct ib_flow_ib_filter val;
  1678. struct ib_flow_ib_filter mask;
  1679. };
  /* IPv4 header flags. */
  enum ib_ipv4_flags {
      /* Don't enable packet fragmentation. */
      IB_IPV4_DONT_FRAG = 0x2,
      /* Set on every fragment of a fragmented packet except the last. */
      IB_IPV4_MORE_FRAG = 0x4
  };
  1686. struct ib_flow_ipv4_filter {
  1687. __be32 src_ip;
  1688. __be32 dst_ip;
  1689. u8 proto;
  1690. u8 tos;
  1691. u8 ttl;
  1692. u8 flags;
  1693. /* Must be last */
  1694. u8 real_sz[0];
  1695. };
  1696. struct ib_flow_spec_ipv4 {
  1697. u32 type;
  1698. u16 size;
  1699. struct ib_flow_ipv4_filter val;
  1700. struct ib_flow_ipv4_filter mask;
  1701. };
  1702. struct ib_flow_ipv6_filter {
  1703. u8 src_ip[16];
  1704. u8 dst_ip[16];
  1705. __be32 flow_label;
  1706. u8 next_hdr;
  1707. u8 traffic_class;
  1708. u8 hop_limit;
  1709. /* Must be last */
  1710. u8 real_sz[0];
  1711. };
  1712. struct ib_flow_spec_ipv6 {
  1713. u32 type;
  1714. u16 size;
  1715. struct ib_flow_ipv6_filter val;
  1716. struct ib_flow_ipv6_filter mask;
  1717. };
  1718. struct ib_flow_tcp_udp_filter {
  1719. __be16 dst_port;
  1720. __be16 src_port;
  1721. /* Must be last */
  1722. u8 real_sz[0];
  1723. };
  1724. struct ib_flow_spec_tcp_udp {
  1725. u32 type;
  1726. u16 size;
  1727. struct ib_flow_tcp_udp_filter val;
  1728. struct ib_flow_tcp_udp_filter mask;
  1729. };
  1730. struct ib_flow_tunnel_filter {
  1731. __be32 tunnel_id;
  1732. u8 real_sz[0];
  1733. };
  1734. /* ib_flow_spec_tunnel describes the Vxlan tunnel
  1735. * the tunnel_id from val has the vni value
  1736. */
  1737. struct ib_flow_spec_tunnel {
  1738. u32 type;
  1739. u16 size;
  1740. struct ib_flow_tunnel_filter val;
  1741. struct ib_flow_tunnel_filter mask;
  1742. };
  1743. struct ib_flow_spec_action_tag {
  1744. enum ib_flow_spec_type type;
  1745. u16 size;
  1746. u32 tag_id;
  1747. };
  1748. struct ib_flow_spec_action_drop {
  1749. enum ib_flow_spec_type type;
  1750. u16 size;
  1751. };
  1752. union ib_flow_spec {
  1753. struct {
  1754. u32 type;
  1755. u16 size;
  1756. };
  1757. struct ib_flow_spec_eth eth;
  1758. struct ib_flow_spec_ib ib;
  1759. struct ib_flow_spec_ipv4 ipv4;
  1760. struct ib_flow_spec_tcp_udp tcp_udp;
  1761. struct ib_flow_spec_ipv6 ipv6;
  1762. struct ib_flow_spec_tunnel tunnel;
  1763. struct ib_flow_spec_action_tag flow_tag;
  1764. struct ib_flow_spec_action_drop drop;
  1765. };
  1766. struct ib_flow_attr {
  1767. enum ib_flow_attr_type type;
  1768. u16 size;
  1769. u16 priority;
  1770. u32 flags;
  1771. u8 num_of_specs;
  1772. u8 port;
  1773. /* Following are the optional layers according to user request
  1774. * struct ib_flow_spec_xxx
  1775. * struct ib_flow_spec_yyy
  1776. */
  1777. };
  /* Flow object; create_flow() returns one and destroy_flow() takes one. */
  struct ib_flow {
      struct ib_qp *qp;
      struct ib_uobject *uobject;
  };
  /* Forward declarations; only pointers to these types are used below. */
  struct ib_mad_hdr;
  struct ib_grh;

  /* Flag bits; IB_MAD_IGNORE_ALL is the OR of the two individual flags. */
  enum ib_process_mad_flags {
      IB_MAD_IGNORE_MKEY = 1,
      IB_MAD_IGNORE_BKEY = 2,
      IB_MAD_IGNORE_ALL  = IB_MAD_IGNORE_MKEY | IB_MAD_IGNORE_BKEY
  };
  /* Result bits for MAD processing. */
  enum ib_mad_result {
      /* Failure (!SUCCESS is the important flag). */
      IB_MAD_RESULT_FAILURE  = 0,
      /* MAD was successfully processed. */
      IB_MAD_RESULT_SUCCESS  = 1 << 0,
      /* A reply packet needs to be sent. */
      IB_MAD_RESULT_REPLY    = 1 << 1,
      /* Packet consumed: stop processing. */
      IB_MAD_RESULT_CONSUMED = 1 << 2
  };
  1795. struct ib_port_cache {
  1796. u64 subnet_prefix;
  1797. struct ib_pkey_cache *pkey;
  1798. struct ib_gid_table *gid;
  1799. u8 lmc;
  1800. enum ib_port_state port_state;
  1801. };
  1802. struct ib_cache {
  1803. rwlock_t lock;
  1804. struct ib_event_handler event_handler;
  1805. struct ib_port_cache *ports;
  1806. };
  1807. struct iw_cm_verbs;
  1808. struct ib_port_immutable {
  1809. int pkey_tbl_len;
  1810. int gid_tbl_len;
  1811. u32 core_cap_flags;
  1812. u32 max_mad_size;
  1813. };
  /* RDMA netdev type: selects the protocol type. */
  enum rdma_netdev_t {
      RDMA_NETDEV_OPA_VNIC,
      RDMA_NETDEV_IPOIB,
  };
  1819. /**
  1820. * struct rdma_netdev - rdma netdev
  1821. * For cases where netstack interfacing is required.
  1822. */
  1823. struct rdma_netdev {
  1824. void *clnt_priv;
  1825. struct ib_device *hca;
  1826. u8 port_num;
  1827. /* cleanup function must be specified */
  1828. void (*free_rdma_netdev)(struct net_device *netdev);
  1829. /* control functions */
  1830. void (*set_id)(struct net_device *netdev, int id);
  1831. /* send packet */
  1832. int (*send)(struct net_device *dev, struct sk_buff *skb,
  1833. struct ib_ah *address, u32 dqpn);
  1834. /* multicast */
  1835. int (*attach_mcast)(struct net_device *dev, struct ib_device *hca,
  1836. union ib_gid *gid, u16 mlid,
  1837. int set_qkey, u32 qkey);
  1838. int (*detach_mcast)(struct net_device *dev, struct ib_device *hca,
  1839. union ib_gid *gid, u16 mlid);
  1840. };
  1841. struct ib_port_pkey_list {
  1842. /* Lock to hold while modifying the list. */
  1843. spinlock_t list_lock;
  1844. struct list_head pkey_list;
  1845. };
  1846. struct ib_device {
  1847. /* Do not access @dma_device directly from ULP nor from HW drivers. */
  1848. struct device *dma_device;
  1849. char name[IB_DEVICE_NAME_MAX];
  1850. struct list_head event_handler_list;
  1851. spinlock_t event_handler_lock;
  1852. spinlock_t client_data_lock;
  1853. struct list_head core_list;
  1854. /* Access to the client_data_list is protected by the client_data_lock
  1855. * spinlock and the lists_rwsem read-write semaphore */
  1856. struct list_head client_data_list;
  1857. struct ib_cache cache;
  1858. /**
  1859. * port_immutable is indexed by port number
  1860. */
  1861. struct ib_port_immutable *port_immutable;
  1862. int num_comp_vectors;
  1863. struct ib_port_pkey_list *port_pkey_list;
  1864. struct iw_cm_verbs *iwcm;
  1865. /**
  1866. * alloc_hw_stats - Allocate a struct rdma_hw_stats and fill in the
  1867. * driver initialized data. The struct is kfree()'ed by the sysfs
  1868. * core when the device is removed. A lifespan of -1 in the return
  1869. * struct tells the core to set a default lifespan.
  1870. */
  1871. struct rdma_hw_stats *(*alloc_hw_stats)(struct ib_device *device,
  1872. u8 port_num);
  1873. /**
  1874. * get_hw_stats - Fill in the counter value(s) in the stats struct.
  1875. * @index - The index in the value array we wish to have updated, or
  1876. * num_counters if we want all stats updated
  1877. * Return codes -
  1878. * < 0 - Error, no counters updated
  1879. * index - Updated the single counter pointed to by index
  1880. * num_counters - Updated all counters (will reset the timestamp
  1881. * and prevent further calls for lifespan milliseconds)
  1882. * Drivers are allowed to update all counters in leiu of just the
  1883. * one given in index at their option
  1884. */
  1885. int (*get_hw_stats)(struct ib_device *device,
  1886. struct rdma_hw_stats *stats,
  1887. u8 port, int index);
  1888. int (*query_device)(struct ib_device *device,
  1889. struct ib_device_attr *device_attr,
  1890. struct ib_udata *udata);
  1891. int (*query_port)(struct ib_device *device,
  1892. u8 port_num,
  1893. struct ib_port_attr *port_attr);
  1894. enum rdma_link_layer (*get_link_layer)(struct ib_device *device,
  1895. u8 port_num);
  1896. /* When calling get_netdev, the HW vendor's driver should return the
  1897. * net device of device @device at port @port_num or NULL if such
  1898. * a net device doesn't exist. The vendor driver should call dev_hold
  1899. * on this net device. The HW vendor's device driver must guarantee
  1900. * that this function returns NULL before the net device reaches
  1901. * NETDEV_UNREGISTER_FINAL state.
  1902. */
  1903. struct net_device *(*get_netdev)(struct ib_device *device,
  1904. u8 port_num);
  1905. int (*query_gid)(struct ib_device *device,
  1906. u8 port_num, int index,
  1907. union ib_gid *gid);
  1908. /* When calling add_gid, the HW vendor's driver should
  1909. * add the gid of device @device at gid index @index of
  1910. * port @port_num to be @gid. Meta-info of that gid (for example,
  1911. * the network device related to this gid is available
  1912. * at @attr. @context allows the HW vendor driver to store extra
  1913. * information together with a GID entry. The HW vendor may allocate
  1914. * memory to contain this information and store it in @context when a
  1915. * new GID entry is written to. Params are consistent until the next
  1916. * call of add_gid or delete_gid. The function should return 0 on
  1917. * success or error otherwise. The function could be called
  1918. * concurrently for different ports. This function is only called
  1919. * when roce_gid_table is used.
  1920. */
  1921. int (*add_gid)(struct ib_device *device,
  1922. u8 port_num,
  1923. unsigned int index,
  1924. const union ib_gid *gid,
  1925. const struct ib_gid_attr *attr,
  1926. void **context);
  1927. /* When calling del_gid, the HW vendor's driver should delete the
  1928. * gid of device @device at gid index @index of port @port_num.
  1929. * Upon the deletion of a GID entry, the HW vendor must free any
  1930. * allocated memory. The caller will clear @context afterwards.
  1931. * This function is only called when roce_gid_table is used.
  1932. */
  1933. int (*del_gid)(struct ib_device *device,
  1934. u8 port_num,
  1935. unsigned int index,
  1936. void **context);
  1937. int (*query_pkey)(struct ib_device *device,
  1938. u8 port_num, u16 index, u16 *pkey);
  1939. int (*modify_device)(struct ib_device *device,
  1940. int device_modify_mask,
  1941. struct ib_device_modify *device_modify);
  1942. int (*modify_port)(struct ib_device *device,
  1943. u8 port_num, int port_modify_mask,
  1944. struct ib_port_modify *port_modify);
  1945. struct ib_ucontext * (*alloc_ucontext)(struct ib_device *device,
  1946. struct ib_udata *udata);
  1947. int (*dealloc_ucontext)(struct ib_ucontext *context);
  1948. int (*mmap)(struct ib_ucontext *context,
  1949. struct vm_area_struct *vma);
  1950. struct ib_pd * (*alloc_pd)(struct ib_device *device,
  1951. struct ib_ucontext *context,
  1952. struct ib_udata *udata);
  1953. int (*dealloc_pd)(struct ib_pd *pd);
  1954. struct ib_ah * (*create_ah)(struct ib_pd *pd,
  1955. struct rdma_ah_attr *ah_attr,
  1956. struct ib_udata *udata);
  1957. int (*modify_ah)(struct ib_ah *ah,
  1958. struct rdma_ah_attr *ah_attr);
  1959. int (*query_ah)(struct ib_ah *ah,
  1960. struct rdma_ah_attr *ah_attr);
  1961. int (*destroy_ah)(struct ib_ah *ah);
  1962. struct ib_srq * (*create_srq)(struct ib_pd *pd,
  1963. struct ib_srq_init_attr *srq_init_attr,
  1964. struct ib_udata *udata);
  1965. int (*modify_srq)(struct ib_srq *srq,
  1966. struct ib_srq_attr *srq_attr,
  1967. enum ib_srq_attr_mask srq_attr_mask,
  1968. struct ib_udata *udata);
  1969. int (*query_srq)(struct ib_srq *srq,
  1970. struct ib_srq_attr *srq_attr);
  1971. int (*destroy_srq)(struct ib_srq *srq);
  1972. int (*post_srq_recv)(struct ib_srq *srq,
  1973. struct ib_recv_wr *recv_wr,
  1974. struct ib_recv_wr **bad_recv_wr);
  1975. struct ib_qp * (*create_qp)(struct ib_pd *pd,
  1976. struct ib_qp_init_attr *qp_init_attr,
  1977. struct ib_udata *udata);
  1978. int (*modify_qp)(struct ib_qp *qp,
  1979. struct ib_qp_attr *qp_attr,
  1980. int qp_attr_mask,
  1981. struct ib_udata *udata);
  1982. int (*query_qp)(struct ib_qp *qp,
  1983. struct ib_qp_attr *qp_attr,
  1984. int qp_attr_mask,
  1985. struct ib_qp_init_attr *qp_init_attr);
  1986. int (*destroy_qp)(struct ib_qp *qp);
  1987. int (*post_send)(struct ib_qp *qp,
  1988. struct ib_send_wr *send_wr,
  1989. struct ib_send_wr **bad_send_wr);
  1990. int (*post_recv)(struct ib_qp *qp,
  1991. struct ib_recv_wr *recv_wr,
  1992. struct ib_recv_wr **bad_recv_wr);
  1993. struct ib_cq * (*create_cq)(struct ib_device *device,
  1994. const struct ib_cq_init_attr *attr,
  1995. struct ib_ucontext *context,
  1996. struct ib_udata *udata);
  1997. int (*modify_cq)(struct ib_cq *cq, u16 cq_count,
  1998. u16 cq_period);
  1999. int (*destroy_cq)(struct ib_cq *cq);
  2000. int (*resize_cq)(struct ib_cq *cq, int cqe,
  2001. struct ib_udata *udata);
  2002. int (*poll_cq)(struct ib_cq *cq, int num_entries,
  2003. struct ib_wc *wc);
  2004. int (*peek_cq)(struct ib_cq *cq, int wc_cnt);
  2005. int (*req_notify_cq)(struct ib_cq *cq,
  2006. enum ib_cq_notify_flags flags);
  2007. int (*req_ncomp_notif)(struct ib_cq *cq,
  2008. int wc_cnt);
  2009. struct ib_mr * (*get_dma_mr)(struct ib_pd *pd,
  2010. int mr_access_flags);
  2011. struct ib_mr * (*reg_user_mr)(struct ib_pd *pd,
  2012. u64 start, u64 length,
  2013. u64 virt_addr,
  2014. int mr_access_flags,
  2015. struct ib_udata *udata);
  2016. int (*rereg_user_mr)(struct ib_mr *mr,
  2017. int flags,
  2018. u64 start, u64 length,
  2019. u64 virt_addr,
  2020. int mr_access_flags,
  2021. struct ib_pd *pd,
  2022. struct ib_udata *udata);
  2023. int (*dereg_mr)(struct ib_mr *mr);
  2024. struct ib_mr * (*alloc_mr)(struct ib_pd *pd,
  2025. enum ib_mr_type mr_type,
  2026. u32 max_num_sg);
  2027. int (*map_mr_sg)(struct ib_mr *mr,
  2028. struct scatterlist *sg,
  2029. int sg_nents,
  2030. unsigned int *sg_offset);
  2031. struct ib_mw * (*alloc_mw)(struct ib_pd *pd,
  2032. enum ib_mw_type type,
  2033. struct ib_udata *udata);
  2034. int (*dealloc_mw)(struct ib_mw *mw);
  2035. struct ib_fmr * (*alloc_fmr)(struct ib_pd *pd,
  2036. int mr_access_flags,
  2037. struct ib_fmr_attr *fmr_attr);
  2038. int (*map_phys_fmr)(struct ib_fmr *fmr,
  2039. u64 *page_list, int list_len,
  2040. u64 iova);
  2041. int (*unmap_fmr)(struct list_head *fmr_list);
  2042. int (*dealloc_fmr)(struct ib_fmr *fmr);
  2043. int (*attach_mcast)(struct ib_qp *qp,
  2044. union ib_gid *gid,
  2045. u16 lid);
  2046. int (*detach_mcast)(struct ib_qp *qp,
  2047. union ib_gid *gid,
  2048. u16 lid);
  2049. int (*process_mad)(struct ib_device *device,
  2050. int process_mad_flags,
  2051. u8 port_num,
  2052. const struct ib_wc *in_wc,
  2053. const struct ib_grh *in_grh,
  2054. const struct ib_mad_hdr *in_mad,
  2055. size_t in_mad_size,
  2056. struct ib_mad_hdr *out_mad,
  2057. size_t *out_mad_size,
  2058. u16 *out_mad_pkey_index);
  2059. struct ib_xrcd * (*alloc_xrcd)(struct ib_device *device,
  2060. struct ib_ucontext *ucontext,
  2061. struct ib_udata *udata);
  2062. int (*dealloc_xrcd)(struct ib_xrcd *xrcd);
  2063. struct ib_flow * (*create_flow)(struct ib_qp *qp,
  2064. struct ib_flow_attr
  2065. *flow_attr,
  2066. int domain);
  2067. int (*destroy_flow)(struct ib_flow *flow_id);
  2068. int (*check_mr_status)(struct ib_mr *mr, u32 check_mask,
  2069. struct ib_mr_status *mr_status);
  2070. void (*disassociate_ucontext)(struct ib_ucontext *ibcontext);
  2071. void (*drain_rq)(struct ib_qp *qp);
  2072. void (*drain_sq)(struct ib_qp *qp);
  2073. int (*set_vf_link_state)(struct ib_device *device, int vf, u8 port,
  2074. int state);
  2075. int (*get_vf_config)(struct ib_device *device, int vf, u8 port,
  2076. struct ifla_vf_info *ivf);
  2077. int (*get_vf_stats)(struct ib_device *device, int vf, u8 port,
  2078. struct ifla_vf_stats *stats);
  2079. int (*set_vf_guid)(struct ib_device *device, int vf, u8 port, u64 guid,
  2080. int type);
  2081. struct ib_wq * (*create_wq)(struct ib_pd *pd,
  2082. struct ib_wq_init_attr *init_attr,
  2083. struct ib_udata *udata);
  2084. int (*destroy_wq)(struct ib_wq *wq);
  2085. int (*modify_wq)(struct ib_wq *wq,
  2086. struct ib_wq_attr *attr,
  2087. u32 wq_attr_mask,
  2088. struct ib_udata *udata);
  2089. struct ib_rwq_ind_table * (*create_rwq_ind_table)(struct ib_device *device,
  2090. struct ib_rwq_ind_table_init_attr *init_attr,
  2091. struct ib_udata *udata);
  2092. int (*destroy_rwq_ind_table)(struct ib_rwq_ind_table *wq_ind_table);
  2093. /**
  2094. * rdma netdev operation
  2095. *
  2096. * Driver implementing alloc_rdma_netdev must return -EOPNOTSUPP if it
  2097. * doesn't support the specified rdma netdev type.
  2098. */
  2099. struct net_device *(*alloc_rdma_netdev)(
  2100. struct ib_device *device,
  2101. u8 port_num,
  2102. enum rdma_netdev_t type,
  2103. const char *name,
  2104. unsigned char name_assign_type,
  2105. void (*setup)(struct net_device *));
  2106. struct module *owner;
  2107. struct device dev;
  2108. struct kobject *ports_parent;
  2109. struct list_head port_list;
  2110. enum {
  2111. IB_DEV_UNINITIALIZED,
  2112. IB_DEV_REGISTERED,
  2113. IB_DEV_UNREGISTERED
  2114. } reg_state;
  2115. int uverbs_abi_ver;
  2116. u64 uverbs_cmd_mask;
  2117. u64 uverbs_ex_cmd_mask;
  2118. char node_desc[IB_DEVICE_NODE_DESC_MAX];
  2119. __be64 node_guid;
  2120. u32 local_dma_lkey;
  2121. u16 is_switch:1;
  2122. u8 node_type;
  2123. u8 phys_port_cnt;
  2124. struct ib_device_attr attrs;
  2125. struct attribute_group *hw_stats_ag;
  2126. struct rdma_hw_stats *hw_stats;
  2127. #ifdef CONFIG_CGROUP_RDMA
  2128. struct rdmacg_device cg_device;
  2129. #endif
  2130. u32 index;
  2131. /*
  2132. * Implementation details of the RDMA core, don't use in drivers
  2133. */
  2134. struct rdma_restrack_root res;
  2135. /**
  2136. * The following mandatory functions are used only at device
  2137. * registration. Keep functions such as these at the end of this
  2138. * structure to avoid cache line misses when accessing struct ib_device
  2139. * in fast paths.
  2140. */
  2141. int (*get_port_immutable)(struct ib_device *, u8, struct ib_port_immutable *);
  2142. void (*get_dev_fw_str)(struct ib_device *, char *str);
  2143. const struct cpumask *(*get_vector_affinity)(struct ib_device *ibdev,
  2144. int comp_vector);
  2145. struct uverbs_root_spec *specs_root;
  2146. };
  2147. struct ib_client {
  2148. char *name;
  2149. void (*add) (struct ib_device *);
  2150. void (*remove)(struct ib_device *, void *client_data);
  2151. /* Returns the net_dev belonging to this ib_client and matching the
  2152. * given parameters.
  2153. * @dev: An RDMA device that the net_dev use for communication.
  2154. * @port: A physical port number on the RDMA device.
  2155. * @pkey: P_Key that the net_dev uses if applicable.
  2156. * @gid: A GID that the net_dev uses to communicate.
  2157. * @addr: An IP address the net_dev is configured with.
  2158. * @client_data: The device's client data set by ib_set_client_data().
  2159. *
  2160. * An ib_client that implements a net_dev on top of RDMA devices
  2161. * (such as IP over IB) should implement this callback, allowing the
  2162. * rdma_cm module to find the right net_dev for a given request.
  2163. *
  2164. * The caller is responsible for calling dev_put on the returned
  2165. * netdev. */
  2166. struct net_device *(*get_net_dev_by_params)(
  2167. struct ib_device *dev,
  2168. u8 port,
  2169. u16 pkey,
  2170. const union ib_gid *gid,
  2171. const struct sockaddr *addr,
  2172. void *client_data);
  2173. struct list_head list;
  2174. };
  2175. struct ib_device *ib_alloc_device(size_t size);
  2176. void ib_dealloc_device(struct ib_device *device);
  2177. void ib_get_device_fw_str(struct ib_device *device, char *str);
  2178. int ib_register_device(struct ib_device *device,
  2179. int (*port_callback)(struct ib_device *,
  2180. u8, struct kobject *));
  2181. void ib_unregister_device(struct ib_device *device);
  2182. int ib_register_client (struct ib_client *client);
  2183. void ib_unregister_client(struct ib_client *client);
  2184. void *ib_get_client_data(struct ib_device *device, struct ib_client *client);
  2185. void ib_set_client_data(struct ib_device *device, struct ib_client *client,
  2186. void *data);
  2187. static inline int ib_copy_from_udata(void *dest, struct ib_udata *udata, size_t len)
  2188. {
  2189. return copy_from_user(dest, udata->inbuf, len) ? -EFAULT : 0;
  2190. }
  2191. static inline int ib_copy_to_udata(struct ib_udata *udata, void *src, size_t len)
  2192. {
  2193. return copy_to_user(udata->outbuf, src, len) ? -EFAULT : 0;
  2194. }
  2195. static inline bool ib_is_udata_cleared(struct ib_udata *udata,
  2196. size_t offset,
  2197. size_t len)
  2198. {
  2199. const void __user *p = udata->inbuf + offset;
  2200. bool ret;
  2201. u8 *buf;
  2202. if (len > USHRT_MAX)
  2203. return false;
  2204. buf = memdup_user(p, len);
  2205. if (IS_ERR(buf))
  2206. return false;
  2207. ret = !memchr_inv(buf, 0, len);
  2208. kfree(buf);
  2209. return ret;
  2210. }
  /**
   * ib_modify_qp_is_ok - Check that the supplied attribute mask
   * contains all required attributes and no attributes not allowed for
   * the given QP state transition.
   * @cur_state: Current QP state
   * @next_state: Next QP state
   * @type: QP type
   * @mask: Mask of supplied QP attributes
   * @ll: Link layer of port
   *
   * Helper that a low-level driver's modify_qp method can use to validate
   * the consumer's input. It checks that cur_state and next_state are
   * valid QP states, that the IB spec allows a transition from cur_state
   * to next_state, and that the supplied attribute mask is allowed for
   * that transition.
   */
  int ib_modify_qp_is_ok(enum ib_qp_state cur_state,
                         enum ib_qp_state next_state,
                         enum ib_qp_type type,
                         enum ib_qp_attr_mask mask,
                         enum rdma_link_layer ll);
  2230. void ib_register_event_handler(struct ib_event_handler *event_handler);
  2231. void ib_unregister_event_handler(struct ib_event_handler *event_handler);
  2232. void ib_dispatch_event(struct ib_event *event);
  2233. int ib_query_port(struct ib_device *device,
  2234. u8 port_num, struct ib_port_attr *port_attr);
  2235. enum rdma_link_layer rdma_port_get_link_layer(struct ib_device *device,
  2236. u8 port_num);
  2237. /**
  2238. * rdma_cap_ib_switch - Check if the device is IB switch
  2239. * @device: Device to check
  2240. *
  2241. * Device driver is responsible for setting is_switch bit on
  2242. * in ib_device structure at init time.
  2243. *
  2244. * Return: true if the device is IB switch.
  2245. */
  2246. static inline bool rdma_cap_ib_switch(const struct ib_device *device)
  2247. {
  2248. return device->is_switch;
  2249. }
  2250. /**
  2251. * rdma_start_port - Return the first valid port number for the device
  2252. * specified
  2253. *
  2254. * @device: Device to be checked
  2255. *
  2256. * Return start port number
  2257. */
  2258. static inline u8 rdma_start_port(const struct ib_device *device)
  2259. {
  2260. return rdma_cap_ib_switch(device) ? 0 : 1;
  2261. }
  2262. /**
  2263. * rdma_end_port - Return the last valid port number for the device
  2264. * specified
  2265. *
  2266. * @device: Device to be checked
  2267. *
  2268. * Return last port number
  2269. */
  2270. static inline u8 rdma_end_port(const struct ib_device *device)
  2271. {
  2272. return rdma_cap_ib_switch(device) ? 0 : device->phys_port_cnt;
  2273. }
  /*
   * Return non-zero when @port lies within
   * [rdma_start_port(device), rdma_end_port(device)], zero otherwise.
   */
  static inline int rdma_is_port_valid(const struct ib_device *device,
                                       unsigned int port)
  {
      if (port < rdma_start_port(device))
          return 0;

      return port <= rdma_end_port(device);
  }
  2280. static inline bool rdma_protocol_ib(const struct ib_device *device, u8 port_num)
  2281. {
  2282. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_IB;
  2283. }
  2284. static inline bool rdma_protocol_roce(const struct ib_device *device, u8 port_num)
  2285. {
  2286. return device->port_immutable[port_num].core_cap_flags &
  2287. (RDMA_CORE_CAP_PROT_ROCE | RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP);
  2288. }
  2289. static inline bool rdma_protocol_roce_udp_encap(const struct ib_device *device, u8 port_num)
  2290. {
  2291. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_ROCE_UDP_ENCAP;
  2292. }
  2293. static inline bool rdma_protocol_roce_eth_encap(const struct ib_device *device, u8 port_num)
  2294. {
  2295. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_ROCE;
  2296. }
  2297. static inline bool rdma_protocol_iwarp(const struct ib_device *device, u8 port_num)
  2298. {
  2299. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_IWARP;
  2300. }
  2301. static inline bool rdma_ib_or_roce(const struct ib_device *device, u8 port_num)
  2302. {
  2303. return rdma_protocol_ib(device, port_num) ||
  2304. rdma_protocol_roce(device, port_num);
  2305. }
  2306. static inline bool rdma_protocol_raw_packet(const struct ib_device *device, u8 port_num)
  2307. {
  2308. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_RAW_PACKET;
  2309. }
  2310. static inline bool rdma_protocol_usnic(const struct ib_device *device, u8 port_num)
  2311. {
  2312. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_PROT_USNIC;
  2313. }
  2314. /**
  2315. * rdma_cap_ib_mad - Check if the port of a device supports Infiniband
  2316. * Management Datagrams.
  2317. * @device: Device to check
  2318. * @port_num: Port number to check
  2319. *
  2320. * Management Datagrams (MAD) are a required part of the InfiniBand
  2321. * specification and are supported on all InfiniBand devices. A slightly
  2322. * extended version are also supported on OPA interfaces.
  2323. *
  2324. * Return: true if the port supports sending/receiving of MAD packets.
  2325. */
  2326. static inline bool rdma_cap_ib_mad(const struct ib_device *device, u8 port_num)
  2327. {
  2328. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_MAD;
  2329. }
  2330. /**
  2331. * rdma_cap_opa_mad - Check if the port of device provides support for OPA
  2332. * Management Datagrams.
  2333. * @device: Device to check
  2334. * @port_num: Port number to check
  2335. *
  2336. * Intel OmniPath devices extend and/or replace the InfiniBand Management
  2337. * datagrams with their own versions. These OPA MADs share many but not all of
  2338. * the characteristics of InfiniBand MADs.
  2339. *
  2340. * OPA MADs differ in the following ways:
  2341. *
  2342. * 1) MADs are variable size up to 2K
  2343. * IBTA defined MADs remain fixed at 256 bytes
  2344. * 2) OPA SMPs must carry valid PKeys
  2345. * 3) OPA SMP packets are a different format
  2346. *
  2347. * Return: true if the port supports OPA MAD packet formats.
  2348. */
  2349. static inline bool rdma_cap_opa_mad(struct ib_device *device, u8 port_num)
  2350. {
  2351. return (device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_OPA_MAD)
  2352. == RDMA_CORE_CAP_OPA_MAD;
  2353. }
  2354. /**
  2355. * rdma_cap_ib_smi - Check if the port of a device provides an Infiniband
  2356. * Subnet Management Agent (SMA) on the Subnet Management Interface (SMI).
  2357. * @device: Device to check
  2358. * @port_num: Port number to check
  2359. *
  2360. * Each InfiniBand node is required to provide a Subnet Management Agent
  2361. * that the subnet manager can access. Prior to the fabric being fully
  2362. * configured by the subnet manager, the SMA is accessed via a well known
  2363. * interface called the Subnet Management Interface (SMI). This interface
  2364. * uses directed route packets to communicate with the SM to get around the
  2365. * chicken and egg problem of the SM needing to know what's on the fabric
  2366. * in order to configure the fabric, and needing to configure the fabric in
  2367. * order to send packets to the devices on the fabric. These directed
  2368. * route packets do not need the fabric fully configured in order to reach
  2369. * their destination. The SMI is the only method allowed to send
  2370. * directed route packets on an InfiniBand fabric.
  2371. *
  2372. * Return: true if the port provides an SMI.
  2373. */
  2374. static inline bool rdma_cap_ib_smi(const struct ib_device *device, u8 port_num)
  2375. {
  2376. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_SMI;
  2377. }
  2378. /**
  2379. * rdma_cap_ib_cm - Check if the port of device has the capability Infiniband
  2380. * Communication Manager.
  2381. * @device: Device to check
  2382. * @port_num: Port number to check
  2383. *
  2384. * The InfiniBand Communication Manager is one of many pre-defined General
  2385. * Service Agents (GSA) that are accessed via the General Service
  2386. * Interface (GSI). It's role is to facilitate establishment of connections
  2387. * between nodes as well as other management related tasks for established
  2388. * connections.
  2389. *
  2390. * Return: true if the port supports an IB CM (this does not guarantee that
  2391. * a CM is actually running however).
  2392. */
  2393. static inline bool rdma_cap_ib_cm(const struct ib_device *device, u8 port_num)
  2394. {
  2395. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_CM;
  2396. }
  2397. /**
  2398. * rdma_cap_iw_cm - Check if the port of device has the capability IWARP
  2399. * Communication Manager.
  2400. * @device: Device to check
  2401. * @port_num: Port number to check
  2402. *
  2403. * Similar to above, but specific to iWARP connections which have a different
  2404. * managment protocol than InfiniBand.
  2405. *
  2406. * Return: true if the port supports an iWARP CM (this does not guarantee that
  2407. * a CM is actually running however).
  2408. */
  2409. static inline bool rdma_cap_iw_cm(const struct ib_device *device, u8 port_num)
  2410. {
  2411. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IW_CM;
  2412. }
  2413. /**
  2414. * rdma_cap_ib_sa - Check if the port of device has the capability Infiniband
  2415. * Subnet Administration.
  2416. * @device: Device to check
  2417. * @port_num: Port number to check
  2418. *
  2419. * An InfiniBand Subnet Administration (SA) service is a pre-defined General
  2420. * Service Agent (GSA) provided by the Subnet Manager (SM). On InfiniBand
  2421. * fabrics, devices should resolve routes to other hosts by contacting the
  2422. * SA to query the proper route.
  2423. *
  2424. * Return: true if the port should act as a client to the fabric Subnet
  2425. * Administration interface. This does not imply that the SA service is
  2426. * running locally.
  2427. */
  2428. static inline bool rdma_cap_ib_sa(const struct ib_device *device, u8 port_num)
  2429. {
  2430. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_IB_SA;
  2431. }
  2432. /**
  2433. * rdma_cap_ib_mcast - Check if the port of device has the capability Infiniband
  2434. * Multicast.
  2435. * @device: Device to check
  2436. * @port_num: Port number to check
  2437. *
  2438. * InfiniBand multicast registration is more complex than normal IPv4 or
  2439. * IPv6 multicast registration. Each Host Channel Adapter must register
  2440. * with the Subnet Manager when it wishes to join a multicast group. It
  2441. * should do so only once regardless of how many queue pairs it subscribes
  2442. * to this group. And it should leave the group only after all queue pairs
  2443. * attached to the group have been detached.
  2444. *
  2445. * Return: true if the port must undertake the additional adminstrative
  2446. * overhead of registering/unregistering with the SM and tracking of the
  2447. * total number of queue pairs attached to the multicast group.
  2448. */
  2449. static inline bool rdma_cap_ib_mcast(const struct ib_device *device, u8 port_num)
  2450. {
  2451. return rdma_cap_ib_sa(device, port_num);
  2452. }
  2453. /**
  2454. * rdma_cap_af_ib - Check if the port of device has the capability
  2455. * Native Infiniband Address.
  2456. * @device: Device to check
  2457. * @port_num: Port number to check
  2458. *
  2459. * InfiniBand addressing uses a port's GUID + Subnet Prefix to make a default
  2460. * GID. RoCE uses a different mechanism, but still generates a GID via
  2461. * a prescribed mechanism and port specific data.
  2462. *
  2463. * Return: true if the port uses a GID address to identify devices on the
  2464. * network.
  2465. */
  2466. static inline bool rdma_cap_af_ib(const struct ib_device *device, u8 port_num)
  2467. {
  2468. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_AF_IB;
  2469. }
  2470. /**
  2471. * rdma_cap_eth_ah - Check if the port of device has the capability
  2472. * Ethernet Address Handle.
  2473. * @device: Device to check
  2474. * @port_num: Port number to check
  2475. *
  2476. * RoCE is InfiniBand over Ethernet, and it uses a well defined technique
  2477. * to fabricate GIDs over Ethernet/IP specific addresses native to the
  2478. * port. Normally, packet headers are generated by the sending host
  2479. * adapter, but when sending connectionless datagrams, we must manually
  2480. * inject the proper headers for the fabric we are communicating over.
  2481. *
  2482. * Return: true if we are running as a RoCE port and must force the
  2483. * addition of a Global Route Header built from our Ethernet Address
  2484. * Handle into our header list for connectionless packets.
  2485. */
  2486. static inline bool rdma_cap_eth_ah(const struct ib_device *device, u8 port_num)
  2487. {
  2488. return device->port_immutable[port_num].core_cap_flags & RDMA_CORE_CAP_ETH_AH;
  2489. }
  2490. /**
  2491. * rdma_cap_opa_ah - Check if the port of device supports
  2492. * OPA Address handles
  2493. * @device: Device to check
  2494. * @port_num: Port number to check
  2495. *
  2496. * Return: true if we are running on an OPA device which supports
  2497. * the extended OPA addressing.
  2498. */
  2499. static inline bool rdma_cap_opa_ah(struct ib_device *device, u8 port_num)
  2500. {
  2501. return (device->port_immutable[port_num].core_cap_flags &
  2502. RDMA_CORE_CAP_OPA_AH) == RDMA_CORE_CAP_OPA_AH;
  2503. }
  2504. /**
  2505. * rdma_max_mad_size - Return the max MAD size required by this RDMA Port.
  2506. *
  2507. * @device: Device
  2508. * @port_num: Port number
  2509. *
  2510. * This MAD size includes the MAD headers and MAD payload. No other headers
  2511. * are included.
  2512. *
  2513. * Return the max MAD size required by the Port. Will return 0 if the port
  2514. * does not support MADs
  2515. */
  2516. static inline size_t rdma_max_mad_size(const struct ib_device *device, u8 port_num)
  2517. {
  2518. return device->port_immutable[port_num].max_mad_size;
  2519. }
  2520. /**
  2521. * rdma_cap_roce_gid_table - Check if the port of device uses roce_gid_table
  2522. * @device: Device to check
  2523. * @port_num: Port number to check
  2524. *
  2525. * RoCE GID table mechanism manages the various GIDs for a device.
  2526. *
  2527. * NOTE: if allocating the port's GID table has failed, this call will still
  2528. * return true, but any RoCE GID table API will fail.
  2529. *
  2530. * Return: true if the port uses RoCE GID table mechanism in order to manage
  2531. * its GIDs.
  2532. */
  2533. static inline bool rdma_cap_roce_gid_table(const struct ib_device *device,
  2534. u8 port_num)
  2535. {
  2536. return rdma_protocol_roce(device, port_num) &&
  2537. device->add_gid && device->del_gid;
  2538. }
  2539. /*
  2540. * Check if the device supports READ W/ INVALIDATE.
  2541. */
  2542. static inline bool rdma_cap_read_inv(struct ib_device *dev, u32 port_num)
  2543. {
  2544. /*
  2545. * iWarp drivers must support READ W/ INVALIDATE. No other protocol
  2546. * has support for it yet.
  2547. */
  2548. return rdma_protocol_iwarp(dev, port_num);
  2549. }
  /*
   * Device, port, GID and P_Key query/configuration entry points.
   *
   * Only the prototypes are visible in this header.
   * NOTE(review): the int results presumably follow the usual
   * 0 / negative errno convention -- confirm against the definitions.
   */

  /* GID lookup by table index; results are written through @gid and @attr. */
  int ib_query_gid(struct ib_device *device,
                   u8 port_num, int index, union ib_gid *gid,
                   struct ib_gid_attr *attr);

  /* Per virtual function (@vf) controls on a given @port. */
  int ib_set_vf_link_state(struct ib_device *device, int vf, u8 port,
                           int state);
  int ib_get_vf_config(struct ib_device *device, int vf, u8 port,
                       struct ifla_vf_info *info);
  int ib_get_vf_stats(struct ib_device *device, int vf, u8 port,
                      struct ifla_vf_stats *stats);
  int ib_set_vf_guid(struct ib_device *device, int vf, u8 port, u64 guid,
                     int type);

  /* P_Key lookup by table index; the result is written through @pkey. */
  int ib_query_pkey(struct ib_device *device,
                    u8 port_num, u16 index, u16 *pkey);

  /* Device and port attribute modification, selected by a mask. */
  int ib_modify_device(struct ib_device *device,
                       int device_modify_mask,
                       struct ib_device_modify *device_modify);
  int ib_modify_port(struct ib_device *device,
                     u8 port_num, int port_modify_mask,
                     struct ib_port_modify *port_modify);

  /* Reverse lookups; the location found is written through the pointers. */
  int ib_find_gid(struct ib_device *device, union ib_gid *gid,
                  struct net_device *ndev, u8 *port_num, u16 *index);
  int ib_find_pkey(struct ib_device *device,
                   u8 port_num, u16 pkey, u16 *index);
  /* Flags accepted by ib_alloc_pd() / __ib_alloc_pd(). */
  enum ib_pd_flags {
          /*
           * Create a memory registration for all memory in the system and place
           * the rkey for it into pd->unsafe_global_rkey.  This can be used by
           * ULPs to avoid the overhead of dynamic MRs.
           *
           * This flag is generally considered unsafe and must only be used in
           * extremely trusted environments.  Every use of it will log a warning
           * in the kernel log.
           */
          IB_PD_UNSAFE_GLOBAL_RKEY = 0x01,
  };
  /*
   * Protection domain allocation.  @flags is documented by enum ib_pd_flags;
   * @caller is a string naming the requester.
   */
  struct ib_pd *__ib_alloc_pd(struct ib_device *device, unsigned int flags,
                  const char *caller);

  /*
   * Convenience wrapper around __ib_alloc_pd() that passes KBUILD_MODNAME
   * as the @caller string.
   */
  #define ib_alloc_pd(device, flags) \
          __ib_alloc_pd((device), (flags), KBUILD_MODNAME)

  /* Counterpart of ib_alloc_pd(): releases the protection domain @pd. */
  void ib_dealloc_pd(struct ib_pd *pd);
  /**
   * rdma_create_ah - Creates an address handle for the given address vector.
   * @pd: The protection domain associated with the address handle.
   * @ah_attr: The attributes of the address vector.
   *
   * The address handle is used to reference a local or global destination
   * in all UD QP post sends.
   */
  struct ib_ah *rdma_create_ah(struct ib_pd *pd, struct rdma_ah_attr *ah_attr);

  /**
   * rdma_create_user_ah - Creates an address handle for the given address vector.
   * It resolves destination mac address for ah attribute of RoCE type.
   * @pd: The protection domain associated with the address handle.
   * @ah_attr: The attributes of the address vector.
   * @udata: pointer to user's input output buffer information needed by
   *         provider driver.
   *
   * The address handle is used to reference a local or global destination
   * in all UD QP post sends.
   *
   * NOTE(review): earlier wording said this "returns 0 on success and returns
   * appropriate error code on error", but the prototype returns a
   * struct ib_ah pointer.  Presumably failures are reported through an
   * error-encoded pointer -- confirm against the definition.
   */
  struct ib_ah *rdma_create_user_ah(struct ib_pd *pd,
                                    struct rdma_ah_attr *ah_attr,
                                    struct ib_udata *udata);
  /**
   * ib_get_gids_from_rdma_hdr - Get sgid and dgid from GRH or IPv4 header
   * @hdr: the L3 header to parse
   * @net_type: type of header to parse
   * @sgid: place to store source gid
   * @dgid: place to store destination gid
   */
  int ib_get_gids_from_rdma_hdr(const union rdma_network_hdr *hdr,
                                enum rdma_network_type net_type,
                                union ib_gid *sgid, union ib_gid *dgid);

  /**
   * ib_get_rdma_header_version - Get the header version
   * @hdr: the L3 header to parse
   */
  int ib_get_rdma_header_version(const union rdma_network_hdr *hdr);
  /**
   * ib_init_ah_attr_from_wc - Initializes address handle attributes from a
   *   work completion.
   * @device: Device on which the received message arrived.
   * @port_num: Port on which the received message arrived.
   * @wc: Work completion associated with the received message.
   * @grh: References the received global route header.  This parameter is
   *   ignored unless the work completion indicates that the GRH is valid.
   * @ah_attr: Returned attributes that can be used when creating an address
   *   handle for replying to the message.
   */
  int ib_init_ah_attr_from_wc(struct ib_device *device, u8 port_num,
                              const struct ib_wc *wc, const struct ib_grh *grh,
                              struct rdma_ah_attr *ah_attr);

  /**
   * ib_create_ah_from_wc - Creates an address handle associated with the
   *   sender of the specified work completion.
   * @pd: The protection domain associated with the address handle.
   * @wc: Work completion information associated with a received message.
   * @grh: References the received global route header.  This parameter is
   *   ignored unless the work completion indicates that the GRH is valid.
   * @port_num: The outbound port number to associate with the address.
   *
   * The address handle is used to reference a local or global destination
   * in all UD QP post sends.
   */
  struct ib_ah *ib_create_ah_from_wc(struct ib_pd *pd, const struct ib_wc *wc,
                                     const struct ib_grh *grh, u8 port_num);
  /**
   * rdma_modify_ah - Modifies the address vector associated with an address
   *   handle.
   * @ah: The address handle to modify.
   * @ah_attr: The new address vector attributes to associate with the
   *   address handle.
   */
  int rdma_modify_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);

  /**
   * rdma_query_ah - Queries the address vector associated with an address
   *   handle.
   * @ah: The address handle to query.
   * @ah_attr: The address vector attributes associated with the address
   *   handle.
   */
  int rdma_query_ah(struct ib_ah *ah, struct rdma_ah_attr *ah_attr);

  /**
   * rdma_destroy_ah - Destroys an address handle.
   * @ah: The address handle to destroy.
   */
  int rdma_destroy_ah(struct ib_ah *ah);
  /**
   * ib_create_srq - Creates a SRQ associated with the specified protection
   *   domain.
   * @pd: The protection domain associated with the SRQ.
   * @srq_init_attr: A list of initial attributes required to create the
   *   SRQ.  If SRQ creation succeeds, then the attributes are updated to
   *   the actual capabilities of the created SRQ.
   *
   * srq_attr->max_wr and srq_attr->max_sge are read to determine the
   * requested size of the SRQ, and set to the actual values allocated
   * on return.  If ib_create_srq() succeeds, then max_wr and max_sge
   * will always be at least as large as the requested values.
   */
  struct ib_srq *ib_create_srq(struct ib_pd *pd,
                               struct ib_srq_init_attr *srq_init_attr);

  /**
   * ib_modify_srq - Modifies the attributes for the specified SRQ.
   * @srq: The SRQ to modify.
   * @srq_attr: On input, specifies the SRQ attributes to modify.  On output,
   *   the current values of selected SRQ attributes are returned.
   * @srq_attr_mask: A bit-mask used to specify which attributes of the SRQ
   *   are being modified.
   *
   * The mask may contain IB_SRQ_MAX_WR to resize the SRQ and/or
   * IB_SRQ_LIMIT to set the SRQ's limit and request notification when
   * the number of receives queued drops below the limit.
   */
  int ib_modify_srq(struct ib_srq *srq,
                    struct ib_srq_attr *srq_attr,
                    enum ib_srq_attr_mask srq_attr_mask);

  /**
   * ib_query_srq - Returns the attribute list and current values for the
   *   specified SRQ.
   * @srq: The SRQ to query.
   * @srq_attr: The attributes of the specified SRQ.
   */
  int ib_query_srq(struct ib_srq *srq,
                   struct ib_srq_attr *srq_attr);

  /**
   * ib_destroy_srq - Destroys the specified SRQ.
   * @srq: The SRQ to destroy.
   */
  int ib_destroy_srq(struct ib_srq *srq);
  2722. /**
  2723. * ib_post_srq_recv - Posts a list of work requests to the specified SRQ.
  2724. * @srq: The SRQ to post the work request on.
  2725. * @recv_wr: A list of work requests to post on the receive queue.
  2726. * @bad_recv_wr: On an immediate failure, this parameter will reference
  2727. * the work request that failed to be posted on the QP.
  2728. */
  2729. static inline int ib_post_srq_recv(struct ib_srq *srq,
  2730. struct ib_recv_wr *recv_wr,
  2731. struct ib_recv_wr **bad_recv_wr)
  2732. {
  2733. return srq->device->post_srq_recv(srq, recv_wr, bad_recv_wr);
  2734. }
  /**
   * ib_create_qp - Creates a QP associated with the specified protection
   *   domain.
   * @pd: The protection domain associated with the QP.
   * @qp_init_attr: A list of initial attributes required to create the
   *   QP.  If QP creation succeeds, then the attributes are updated to
   *   the actual capabilities of the created QP.
   */
  struct ib_qp *ib_create_qp(struct ib_pd *pd,
                             struct ib_qp_init_attr *qp_init_attr);

  /**
   * ib_modify_qp_with_udata - Modifies the attributes for the specified QP.
   * @qp: The QP to modify.
   * @attr: On input, specifies the QP attributes to modify.  On output,
   *   the current values of selected QP attributes are returned.
   * @attr_mask: A bit-mask used to specify which attributes of the QP
   *   are being modified.
   * @udata: pointer to user's input output buffer information
   *
   * It returns 0 on success and returns appropriate error code on error.
   */
  int ib_modify_qp_with_udata(struct ib_qp *qp,
                              struct ib_qp_attr *attr,
                              int attr_mask,
                              struct ib_udata *udata);

  /**
   * ib_modify_qp - Modifies the attributes for the specified QP and then
   *   transitions the QP to the given state.
   * @qp: The QP to modify.
   * @qp_attr: On input, specifies the QP attributes to modify.  On output,
   *   the current values of selected QP attributes are returned.
   * @qp_attr_mask: A bit-mask used to specify which attributes of the QP
   *   are being modified.
   */
  int ib_modify_qp(struct ib_qp *qp,
                   struct ib_qp_attr *qp_attr,
                   int qp_attr_mask);
  /**
   * ib_query_qp - Returns the attribute list and current values for the
   *   specified QP.
   * @qp: The QP to query.
   * @qp_attr: The attributes of the specified QP.
   * @qp_attr_mask: A bit-mask used to select specific attributes to query.
   * @qp_init_attr: Additional attributes of the selected QP.
   *
   * The qp_attr_mask may be used to limit the query to gathering only the
   * selected attributes.
   */
  int ib_query_qp(struct ib_qp *qp,
                  struct ib_qp_attr *qp_attr,
                  int qp_attr_mask,
                  struct ib_qp_init_attr *qp_init_attr);

  /**
   * ib_destroy_qp - Destroys the specified QP.
   * @qp: The QP to destroy.
   */
  int ib_destroy_qp(struct ib_qp *qp);

  /**
   * ib_open_qp - Obtain a reference to an existing sharable QP.
   * @xrcd: XRC domain
   * @qp_open_attr: Attributes identifying the QP to open.
   *
   * Returns a reference to a sharable QP.
   */
  struct ib_qp *ib_open_qp(struct ib_xrcd *xrcd,
                           struct ib_qp_open_attr *qp_open_attr);

  /**
   * ib_close_qp - Release an external reference to a QP.
   * @qp: The QP handle to release
   *
   * The opened QP handle is released by the caller.  The underlying
   * shared QP is not destroyed until all internal references are released.
   */
  int ib_close_qp(struct ib_qp *qp);
  2809. /**
  2810. * ib_post_send - Posts a list of work requests to the send queue of
  2811. * the specified QP.
  2812. * @qp: The QP to post the work request on.
  2813. * @send_wr: A list of work requests to post on the send queue.
  2814. * @bad_send_wr: On an immediate failure, this parameter will reference
  2815. * the work request that failed to be posted on the QP.
  2816. *
  2817. * While IBA Vol. 1 section 11.4.1.1 specifies that if an immediate
  2818. * error is returned, the QP state shall not be affected,
  2819. * ib_post_send() will return an immediate error after queueing any
  2820. * earlier work requests in the list.
  2821. */
  2822. static inline int ib_post_send(struct ib_qp *qp,
  2823. struct ib_send_wr *send_wr,
  2824. struct ib_send_wr **bad_send_wr)
  2825. {
  2826. return qp->device->post_send(qp, send_wr, bad_send_wr);
  2827. }
  2828. /**
  2829. * ib_post_recv - Posts a list of work requests to the receive queue of
  2830. * the specified QP.
  2831. * @qp: The QP to post the work request on.
  2832. * @recv_wr: A list of work requests to post on the receive queue.
  2833. * @bad_recv_wr: On an immediate failure, this parameter will reference
  2834. * the work request that failed to be posted on the QP.
  2835. */
  2836. static inline int ib_post_recv(struct ib_qp *qp,
  2837. struct ib_recv_wr *recv_wr,
  2838. struct ib_recv_wr **bad_recv_wr)
  2839. {
  2840. return qp->device->post_recv(qp, recv_wr, bad_recv_wr);
  2841. }
  /*
   * CQ allocation with an explicit @caller string.
   * NOTE(review): the meaning of @private, @nr_cqe, @comp_vector and
   * @poll_ctx is not visible from this header -- see the definition.
   */
  struct ib_cq *__ib_alloc_cq(struct ib_device *dev, void *private,
                              int nr_cqe, int comp_vector,
                              enum ib_poll_context poll_ctx, const char *caller);

  /*
   * Convenience wrapper around __ib_alloc_cq() that passes KBUILD_MODNAME
   * as the @caller string.
   */
  #define ib_alloc_cq(device, priv, nr_cqe, comp_vect, poll_ctx) \
          __ib_alloc_cq((device), (priv), (nr_cqe), (comp_vect), (poll_ctx), KBUILD_MODNAME)

  /* Counterpart of ib_alloc_cq(): releases @cq. */
  void ib_free_cq(struct ib_cq *cq);

  /*
   * NOTE(review): presumably processes up to @budget completions of @cq in
   * the caller's context -- confirm against the definition.
   */
  int ib_process_cq_direct(struct ib_cq *cq, int budget);
  /**
   * ib_create_cq - Creates a CQ on the specified device.
   * @device: The device on which to create the CQ.
   * @comp_handler: A user-specified callback that is invoked when a
   *   completion event occurs on the CQ.
   * @event_handler: A user-specified callback that is invoked when an
   *   asynchronous event not associated with a completion occurs on the CQ.
   * @cq_context: Context associated with the CQ returned to the user via
   *   the associated completion and event handlers.
   * @cq_attr: The attributes the CQ should be created upon.
   *
   * Users can examine the cq structure to determine the actual CQ size.
   */
  struct ib_cq *ib_create_cq(struct ib_device *device,
                             ib_comp_handler comp_handler,
                             void (*event_handler)(struct ib_event *, void *),
                             void *cq_context,
                             const struct ib_cq_init_attr *cq_attr);

  /**
   * ib_resize_cq - Modifies the capacity of the CQ.
   * @cq: The CQ to resize.
   * @cqe: The minimum size of the CQ.
   *
   * Users can examine the cq structure to determine the actual CQ size.
   */
  int ib_resize_cq(struct ib_cq *cq, int cqe);

  /**
   * rdma_set_cq_moderation - Modifies moderation params of the CQ
   * @cq: The CQ to modify.
   * @cq_count: number of CQEs that will trigger an event
   * @cq_period: max period of time in usec before triggering an event
   */
  int rdma_set_cq_moderation(struct ib_cq *cq, u16 cq_count, u16 cq_period);

  /**
   * ib_destroy_cq - Destroys the specified CQ.
   * @cq: The CQ to destroy.
   */
  int ib_destroy_cq(struct ib_cq *cq);
  2888. /**
  2889. * ib_poll_cq - poll a CQ for completion(s)
  2890. * @cq:the CQ being polled
  2891. * @num_entries:maximum number of completions to return
  2892. * @wc:array of at least @num_entries &struct ib_wc where completions
  2893. * will be returned
  2894. *
  2895. * Poll a CQ for (possibly multiple) completions. If the return value
  2896. * is < 0, an error occurred. If the return value is >= 0, it is the
  2897. * number of completions returned. If the return value is
  2898. * non-negative and < num_entries, then the CQ was emptied.
  2899. */
  2900. static inline int ib_poll_cq(struct ib_cq *cq, int num_entries,
  2901. struct ib_wc *wc)
  2902. {
  2903. return cq->device->poll_cq(cq, num_entries, wc);
  2904. }
  /**
   * ib_peek_cq - Returns the number of unreaped completions currently
   *   on the specified CQ.
   * @cq: The CQ to peek.
   * @wc_cnt: A minimum number of unreaped completions to check for.
   *
   * If the number of unreaped completions is greater than or equal to wc_cnt,
   * this function returns wc_cnt, otherwise, it returns the actual number of
   * unreaped completions.
   */
  int ib_peek_cq(struct ib_cq *cq, int wc_cnt);
  2916. /**
  2917. * ib_req_notify_cq - Request completion notification on a CQ.
  2918. * @cq: The CQ to generate an event for.
  2919. * @flags:
  2920. * Must contain exactly one of %IB_CQ_SOLICITED or %IB_CQ_NEXT_COMP
  2921. * to request an event on the next solicited event or next work
  2922. * completion at any type, respectively. %IB_CQ_REPORT_MISSED_EVENTS
  2923. * may also be |ed in to request a hint about missed events, as
  2924. * described below.
  2925. *
  2926. * Return Value:
  2927. * < 0 means an error occurred while requesting notification
  2928. * == 0 means notification was requested successfully, and if
  2929. * IB_CQ_REPORT_MISSED_EVENTS was passed in, then no events
  2930. * were missed and it is safe to wait for another event. In
  2931. * this case is it guaranteed that any work completions added
  2932. * to the CQ since the last CQ poll will trigger a completion
  2933. * notification event.
  2934. * > 0 is only returned if IB_CQ_REPORT_MISSED_EVENTS was passed
  2935. * in. It means that the consumer must poll the CQ again to
  2936. * make sure it is empty to avoid missing an event because of a
  2937. * race between requesting notification and an entry being
  2938. * added to the CQ. This return value means it is possible
  2939. * (but not guaranteed) that a work completion has been added
  2940. * to the CQ since the last poll without triggering a
  2941. * completion notification event.
  2942. */
  2943. static inline int ib_req_notify_cq(struct ib_cq *cq,
  2944. enum ib_cq_notify_flags flags)
  2945. {
  2946. return cq->device->req_notify_cq(cq, flags);
  2947. }
  2948. /**
  2949. * ib_req_ncomp_notif - Request completion notification when there are
  2950. * at least the specified number of unreaped completions on the CQ.
  2951. * @cq: The CQ to generate an event for.
  2952. * @wc_cnt: The number of unreaped completions that should be on the
  2953. * CQ before an event is generated.
  2954. */
  2955. static inline int ib_req_ncomp_notif(struct ib_cq *cq, int wc_cnt)
  2956. {
  2957. return cq->device->req_ncomp_notif ?
  2958. cq->device->req_ncomp_notif(cq, wc_cnt) :
  2959. -ENOSYS;
  2960. }
  2961. /**
  2962. * ib_dma_mapping_error - check a DMA addr for error
  2963. * @dev: The device for which the dma_addr was created
  2964. * @dma_addr: The DMA address to check
  2965. */
  2966. static inline int ib_dma_mapping_error(struct ib_device *dev, u64 dma_addr)
  2967. {
  2968. return dma_mapping_error(dev->dma_device, dma_addr);
  2969. }
  2970. /**
  2971. * ib_dma_map_single - Map a kernel virtual address to DMA address
  2972. * @dev: The device for which the dma_addr is to be created
  2973. * @cpu_addr: The kernel virtual address
  2974. * @size: The size of the region in bytes
  2975. * @direction: The direction of the DMA
  2976. */
  2977. static inline u64 ib_dma_map_single(struct ib_device *dev,
  2978. void *cpu_addr, size_t size,
  2979. enum dma_data_direction direction)
  2980. {
  2981. return dma_map_single(dev->dma_device, cpu_addr, size, direction);
  2982. }
  2983. /**
  2984. * ib_dma_unmap_single - Destroy a mapping created by ib_dma_map_single()
  2985. * @dev: The device for which the DMA address was created
  2986. * @addr: The DMA address
  2987. * @size: The size of the region in bytes
  2988. * @direction: The direction of the DMA
  2989. */
  2990. static inline void ib_dma_unmap_single(struct ib_device *dev,
  2991. u64 addr, size_t size,
  2992. enum dma_data_direction direction)
  2993. {
  2994. dma_unmap_single(dev->dma_device, addr, size, direction);
  2995. }
  2996. /**
  2997. * ib_dma_map_page - Map a physical page to DMA address
  2998. * @dev: The device for which the dma_addr is to be created
  2999. * @page: The page to be mapped
  3000. * @offset: The offset within the page
  3001. * @size: The size of the region in bytes
  3002. * @direction: The direction of the DMA
  3003. */
  3004. static inline u64 ib_dma_map_page(struct ib_device *dev,
  3005. struct page *page,
  3006. unsigned long offset,
  3007. size_t size,
  3008. enum dma_data_direction direction)
  3009. {
  3010. return dma_map_page(dev->dma_device, page, offset, size, direction);
  3011. }
  3012. /**
  3013. * ib_dma_unmap_page - Destroy a mapping created by ib_dma_map_page()
  3014. * @dev: The device for which the DMA address was created
  3015. * @addr: The DMA address
  3016. * @size: The size of the region in bytes
  3017. * @direction: The direction of the DMA
  3018. */
  3019. static inline void ib_dma_unmap_page(struct ib_device *dev,
  3020. u64 addr, size_t size,
  3021. enum dma_data_direction direction)
  3022. {
  3023. dma_unmap_page(dev->dma_device, addr, size, direction);
  3024. }
  3025. /**
  3026. * ib_dma_map_sg - Map a scatter/gather list to DMA addresses
  3027. * @dev: The device for which the DMA addresses are to be created
  3028. * @sg: The array of scatter/gather entries
  3029. * @nents: The number of scatter/gather entries
  3030. * @direction: The direction of the DMA
  3031. */
  3032. static inline int ib_dma_map_sg(struct ib_device *dev,
  3033. struct scatterlist *sg, int nents,
  3034. enum dma_data_direction direction)
  3035. {
  3036. return dma_map_sg(dev->dma_device, sg, nents, direction);
  3037. }
  3038. /**
  3039. * ib_dma_unmap_sg - Unmap a scatter/gather list of DMA addresses
  3040. * @dev: The device for which the DMA addresses were created
  3041. * @sg: The array of scatter/gather entries
  3042. * @nents: The number of scatter/gather entries
  3043. * @direction: The direction of the DMA
  3044. */
  3045. static inline void ib_dma_unmap_sg(struct ib_device *dev,
  3046. struct scatterlist *sg, int nents,
  3047. enum dma_data_direction direction)
  3048. {
  3049. dma_unmap_sg(dev->dma_device, sg, nents, direction);
  3050. }
  3051. static inline int ib_dma_map_sg_attrs(struct ib_device *dev,
  3052. struct scatterlist *sg, int nents,
  3053. enum dma_data_direction direction,
  3054. unsigned long dma_attrs)
  3055. {
  3056. return dma_map_sg_attrs(dev->dma_device, sg, nents, direction,
  3057. dma_attrs);
  3058. }
  3059. static inline void ib_dma_unmap_sg_attrs(struct ib_device *dev,
  3060. struct scatterlist *sg, int nents,
  3061. enum dma_data_direction direction,
  3062. unsigned long dma_attrs)
  3063. {
  3064. dma_unmap_sg_attrs(dev->dma_device, sg, nents, direction, dma_attrs);
  3065. }
  3066. /**
  3067. * ib_sg_dma_address - Return the DMA address from a scatter/gather entry
  3068. * @dev: The device for which the DMA addresses were created
  3069. * @sg: The scatter/gather entry
  3070. *
  3071. * Note: this function is obsolete. To do: change all occurrences of
  3072. * ib_sg_dma_address() into sg_dma_address().
  3073. */
  3074. static inline u64 ib_sg_dma_address(struct ib_device *dev,
  3075. struct scatterlist *sg)
  3076. {
  3077. return sg_dma_address(sg);
  3078. }
  3079. /**
  3080. * ib_sg_dma_len - Return the DMA length from a scatter/gather entry
  3081. * @dev: The device for which the DMA addresses were created
  3082. * @sg: The scatter/gather entry
  3083. *
  3084. * Note: this function is obsolete. To do: change all occurrences of
  3085. * ib_sg_dma_len() into sg_dma_len().
  3086. */
  3087. static inline unsigned int ib_sg_dma_len(struct ib_device *dev,
  3088. struct scatterlist *sg)
  3089. {
  3090. return sg_dma_len(sg);
  3091. }
  3092. /**
  3093. * ib_dma_sync_single_for_cpu - Prepare DMA region to be accessed by CPU
  3094. * @dev: The device for which the DMA address was created
  3095. * @addr: The DMA address
  3096. * @size: The size of the region in bytes
  3097. * @dir: The direction of the DMA
  3098. */
  3099. static inline void ib_dma_sync_single_for_cpu(struct ib_device *dev,
  3100. u64 addr,
  3101. size_t size,
  3102. enum dma_data_direction dir)
  3103. {
  3104. dma_sync_single_for_cpu(dev->dma_device, addr, size, dir);
  3105. }
  3106. /**
  3107. * ib_dma_sync_single_for_device - Prepare DMA region to be accessed by device
  3108. * @dev: The device for which the DMA address was created
  3109. * @addr: The DMA address
  3110. * @size: The size of the region in bytes
  3111. * @dir: The direction of the DMA
  3112. */
  3113. static inline void ib_dma_sync_single_for_device(struct ib_device *dev,
  3114. u64 addr,
  3115. size_t size,
  3116. enum dma_data_direction dir)
  3117. {
  3118. dma_sync_single_for_device(dev->dma_device, addr, size, dir);
  3119. }
  3120. /**
  3121. * ib_dma_alloc_coherent - Allocate memory and map it for DMA
  3122. * @dev: The device for which the DMA address is requested
  3123. * @size: The size of the region to allocate in bytes
  3124. * @dma_handle: A pointer for returning the DMA address of the region
  3125. * @flag: memory allocator flags
  3126. */
  3127. static inline void *ib_dma_alloc_coherent(struct ib_device *dev,
  3128. size_t size,
  3129. dma_addr_t *dma_handle,
  3130. gfp_t flag)
  3131. {
  3132. return dma_alloc_coherent(dev->dma_device, size, dma_handle, flag);
  3133. }
  3134. /**
  3135. * ib_dma_free_coherent - Free memory allocated by ib_dma_alloc_coherent()
  3136. * @dev: The device for which the DMA addresses were allocated
  3137. * @size: The size of the region
  3138. * @cpu_addr: the address returned by ib_dma_alloc_coherent()
  3139. * @dma_handle: the DMA address returned by ib_dma_alloc_coherent()
  3140. */
  3141. static inline void ib_dma_free_coherent(struct ib_device *dev,
  3142. size_t size, void *cpu_addr,
  3143. dma_addr_t dma_handle)
  3144. {
  3145. dma_free_coherent(dev->dma_device, size, cpu_addr, dma_handle);
  3146. }
/**
 * ib_dereg_mr - Deregisters a memory region and removes it from the
 *   HCA translation table.
 * @mr: The memory region to deregister.
 *
 * This function can fail if the memory region has memory windows bound
 * to it.
 */
int ib_dereg_mr(struct ib_mr *mr);

/*
 * ib_alloc_mr - prototype only; the definition is not in this header.
 * NOTE(review): presumably allocates a memory region of @mr_type on @pd
 * that can cover up to @max_num_sg scatter/gather entries -- confirm
 * against the implementation.
 */
struct ib_mr *ib_alloc_mr(struct ib_pd *pd,
enum ib_mr_type mr_type,
u32 max_num_sg);
  3158. /**
  3159. * ib_update_fast_reg_key - updates the key portion of the fast_reg MR
  3160. * R_Key and L_Key.
  3161. * @mr - struct ib_mr pointer to be updated.
  3162. * @newkey - new key to be used.
  3163. */
  3164. static inline void ib_update_fast_reg_key(struct ib_mr *mr, u8 newkey)
  3165. {
  3166. mr->lkey = (mr->lkey & 0xffffff00) | newkey;
  3167. mr->rkey = (mr->rkey & 0xffffff00) | newkey;
  3168. }
  3169. /**
  3170. * ib_inc_rkey - increments the key portion of the given rkey. Can be used
  3171. * for calculating a new rkey for type 2 memory windows.
  3172. * @rkey - the rkey to increment.
  3173. */
  3174. static inline u32 ib_inc_rkey(u32 rkey)
  3175. {
  3176. const u32 mask = 0x000000ff;
  3177. return ((rkey + 1) & mask) | (rkey & ~mask);
  3178. }
/**
 * ib_alloc_fmr - Allocates an unmapped fast memory region.
 * @pd: The protection domain associated with the unmapped region.
 * @mr_access_flags: Specifies the memory access rights.
 * @fmr_attr: Attributes of the unmapped region.
 *
 * A fast memory region must be mapped before it can be used as part of
 * a work request.
 */
struct ib_fmr *ib_alloc_fmr(struct ib_pd *pd,
int mr_access_flags,
struct ib_fmr_attr *fmr_attr);
  3191. /**
  3192. * ib_map_phys_fmr - Maps a list of physical pages to a fast memory region.
  3193. * @fmr: The fast memory region to associate with the pages.
  3194. * @page_list: An array of physical pages to map to the fast memory region.
  3195. * @list_len: The number of pages in page_list.
  3196. * @iova: The I/O virtual address to use with the mapped region.
  3197. */
  3198. static inline int ib_map_phys_fmr(struct ib_fmr *fmr,
  3199. u64 *page_list, int list_len,
  3200. u64 iova)
  3201. {
  3202. return fmr->device->map_phys_fmr(fmr, page_list, list_len, iova);
  3203. }
/**
 * ib_unmap_fmr - Removes the mapping from a list of fast memory regions.
 * @fmr_list: A linked list of fast memory regions to unmap.
 *
 * Prototype only; the definition is not in this header.
 */
int ib_unmap_fmr(struct list_head *fmr_list);

/**
 * ib_dealloc_fmr - Deallocates a fast memory region.
 * @fmr: The fast memory region to deallocate.
 *
 * Prototype only; the definition is not in this header.
 */
int ib_dealloc_fmr(struct ib_fmr *fmr);
/**
 * ib_attach_mcast - Attaches the specified QP to a multicast group.
 * @qp: QP to attach to the multicast group. The QP must be type
 *   IB_QPT_UD.
 * @gid: Multicast group GID.
 * @lid: Multicast group LID in host byte order.
 *
 * In order to send and receive multicast packets, subnet
 * administration must have created the multicast group and configured
 * the fabric appropriately. The port associated with the specified
 * QP must also be a member of the multicast group.
 */
int ib_attach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);

/**
 * ib_detach_mcast - Detaches the specified QP from a multicast group.
 * @qp: QP to detach from the multicast group.
 * @gid: Multicast group GID.
 * @lid: Multicast group LID in host byte order.
 */
int ib_detach_mcast(struct ib_qp *qp, union ib_gid *gid, u16 lid);
/**
 * ib_alloc_xrcd - Allocates an XRC domain.
 * @device: The device on which to allocate the XRC domain.
 * @caller: Module name for kernel consumers
 *
 * Kernel consumers use the ib_alloc_xrcd() macro below, which supplies
 * KBUILD_MODNAME as @caller.
 */
struct ib_xrcd *__ib_alloc_xrcd(struct ib_device *device, const char *caller);
/* Wrapper that fills in the calling module's name as the @caller argument. */
#define ib_alloc_xrcd(device) \
__ib_alloc_xrcd((device), KBUILD_MODNAME)
/**
 * ib_dealloc_xrcd - Deallocates an XRC domain.
 * @xrcd: The XRC domain to deallocate.
 */
int ib_dealloc_xrcd(struct ib_xrcd *xrcd);

/*
 * Flow management entry points; prototypes only, defined outside this
 * header.
 * NOTE(review): presumably ib_create_flow() attaches the rule described by
 * @flow_attr to @qp and ib_destroy_flow() removes it -- confirm against the
 * implementation.
 */
struct ib_flow *ib_create_flow(struct ib_qp *qp,
struct ib_flow_attr *flow_attr, int domain);
int ib_destroy_flow(struct ib_flow *flow_id);
  3250. static inline int ib_check_mr_access(int flags)
  3251. {
  3252. /*
  3253. * Local write permission is required if remote write or
  3254. * remote atomic permission is also requested.
  3255. */
  3256. if (flags & (IB_ACCESS_REMOTE_ATOMIC | IB_ACCESS_REMOTE_WRITE) &&
  3257. !(flags & IB_ACCESS_LOCAL_WRITE))
  3258. return -EINVAL;
  3259. return 0;
  3260. }
/**
 * ib_check_mr_status - Lightweight check of MR status.
 *   This routine may provide status checks on a selected
 *   ib_mr. Its first use is for signature status checks.
 *
 * @mr: A memory region.
 * @check_mask: Bitmask of which checks to perform from
 *   ib_mr_status_check enumeration.
 * @mr_status: The container of relevant status checks.
 *   Failed checks will be indicated in the status bitmask
 *   and the relevant info shall be in the error item.
 */
int ib_check_mr_status(struct ib_mr *mr, u32 check_mask,
struct ib_mr_status *mr_status);

/*
 * The prototypes below are declarations only; their definitions and exact
 * semantics are not visible in this header.
 */
struct net_device *ib_get_net_dev_by_params(struct ib_device *dev, u8 port,
u16 pkey, const union ib_gid *gid,
const struct sockaddr *addr);

/* Work queue (WQ) create / destroy / modify entry points. */
struct ib_wq *ib_create_wq(struct ib_pd *pd,
struct ib_wq_init_attr *init_attr);
int ib_destroy_wq(struct ib_wq *wq);
int ib_modify_wq(struct ib_wq *wq, struct ib_wq_attr *attr,
u32 wq_attr_mask);

/* Receive WQ indirection table create / destroy entry points. */
struct ib_rwq_ind_table *ib_create_rwq_ind_table(struct ib_device *device,
struct ib_rwq_ind_table_init_attr*
wq_ind_table_init_attr);
int ib_destroy_rwq_ind_table(struct ib_rwq_ind_table *wq_ind_table);

/*
 * NOTE(review): presumably maps the scatterlist @sg onto @mr in units of
 * @page_size and returns the number of entries mapped -- confirm against
 * the implementation.
 */
int ib_map_mr_sg(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
unsigned int *sg_offset, unsigned int page_size);
  3289. static inline int
  3290. ib_map_mr_sg_zbva(struct ib_mr *mr, struct scatterlist *sg, int sg_nents,
  3291. unsigned int *sg_offset, unsigned int page_size)
  3292. {
  3293. int n;
  3294. n = ib_map_mr_sg(mr, sg, sg_nents, sg_offset, page_size);
  3295. mr->iova = 0;
  3296. return n;
  3297. }
/*
 * Prototypes only; the definitions are not in this header.
 * ib_sg_to_pages() takes a @set_page callback that receives the MR and a
 * u64 value.
 * NOTE(review): presumably the callback is invoked once per page address
 * derived from @sgl -- confirm against the implementation.
 */
int ib_sg_to_pages(struct ib_mr *mr, struct scatterlist *sgl, int sg_nents,
unsigned int *sg_offset, int (*set_page)(struct ib_mr *, u64));

/* Queue drain helpers for the receive queue, send queue, or both. */
void ib_drain_rq(struct ib_qp *qp);
void ib_drain_sq(struct ib_qp *qp);
void ib_drain_qp(struct ib_qp *qp);

/* Reports the Ethernet speed and width of a port through @speed and @width. */
int ib_get_eth_speed(struct ib_device *dev, u8 port_num, u8 *speed, u8 *width);
  3304. static inline u8 *rdma_ah_retrieve_dmac(struct rdma_ah_attr *attr)
  3305. {
  3306. if (attr->type == RDMA_AH_ATTR_TYPE_ROCE)
  3307. return attr->roce.dmac;
  3308. return NULL;
  3309. }
  3310. static inline void rdma_ah_set_dlid(struct rdma_ah_attr *attr, u32 dlid)
  3311. {
  3312. if (attr->type == RDMA_AH_ATTR_TYPE_IB)
  3313. attr->ib.dlid = (u16)dlid;
  3314. else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3315. attr->opa.dlid = dlid;
  3316. }
  3317. static inline u32 rdma_ah_get_dlid(const struct rdma_ah_attr *attr)
  3318. {
  3319. if (attr->type == RDMA_AH_ATTR_TYPE_IB)
  3320. return attr->ib.dlid;
  3321. else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3322. return attr->opa.dlid;
  3323. return 0;
  3324. }
  3325. static inline void rdma_ah_set_sl(struct rdma_ah_attr *attr, u8 sl)
  3326. {
  3327. attr->sl = sl;
  3328. }
  3329. static inline u8 rdma_ah_get_sl(const struct rdma_ah_attr *attr)
  3330. {
  3331. return attr->sl;
  3332. }
  3333. static inline void rdma_ah_set_path_bits(struct rdma_ah_attr *attr,
  3334. u8 src_path_bits)
  3335. {
  3336. if (attr->type == RDMA_AH_ATTR_TYPE_IB)
  3337. attr->ib.src_path_bits = src_path_bits;
  3338. else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3339. attr->opa.src_path_bits = src_path_bits;
  3340. }
  3341. static inline u8 rdma_ah_get_path_bits(const struct rdma_ah_attr *attr)
  3342. {
  3343. if (attr->type == RDMA_AH_ATTR_TYPE_IB)
  3344. return attr->ib.src_path_bits;
  3345. else if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3346. return attr->opa.src_path_bits;
  3347. return 0;
  3348. }
  3349. static inline void rdma_ah_set_make_grd(struct rdma_ah_attr *attr,
  3350. bool make_grd)
  3351. {
  3352. if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3353. attr->opa.make_grd = make_grd;
  3354. }
  3355. static inline bool rdma_ah_get_make_grd(const struct rdma_ah_attr *attr)
  3356. {
  3357. if (attr->type == RDMA_AH_ATTR_TYPE_OPA)
  3358. return attr->opa.make_grd;
  3359. return false;
  3360. }
  3361. static inline void rdma_ah_set_port_num(struct rdma_ah_attr *attr, u8 port_num)
  3362. {
  3363. attr->port_num = port_num;
  3364. }
  3365. static inline u8 rdma_ah_get_port_num(const struct rdma_ah_attr *attr)
  3366. {
  3367. return attr->port_num;
  3368. }
  3369. static inline void rdma_ah_set_static_rate(struct rdma_ah_attr *attr,
  3370. u8 static_rate)
  3371. {
  3372. attr->static_rate = static_rate;
  3373. }
  3374. static inline u8 rdma_ah_get_static_rate(const struct rdma_ah_attr *attr)
  3375. {
  3376. return attr->static_rate;
  3377. }
  3378. static inline void rdma_ah_set_ah_flags(struct rdma_ah_attr *attr,
  3379. enum ib_ah_flags flag)
  3380. {
  3381. attr->ah_flags = flag;
  3382. }
  3383. static inline enum ib_ah_flags
  3384. rdma_ah_get_ah_flags(const struct rdma_ah_attr *attr)
  3385. {
  3386. return attr->ah_flags;
  3387. }
  3388. static inline const struct ib_global_route
  3389. *rdma_ah_read_grh(const struct rdma_ah_attr *attr)
  3390. {
  3391. return &attr->grh;
  3392. }
  3393. /*To retrieve and modify the grh */
  3394. static inline struct ib_global_route
  3395. *rdma_ah_retrieve_grh(struct rdma_ah_attr *attr)
  3396. {
  3397. return &attr->grh;
  3398. }
  3399. static inline void rdma_ah_set_dgid_raw(struct rdma_ah_attr *attr, void *dgid)
  3400. {
  3401. struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
  3402. memcpy(grh->dgid.raw, dgid, sizeof(grh->dgid));
  3403. }
  3404. static inline void rdma_ah_set_subnet_prefix(struct rdma_ah_attr *attr,
  3405. __be64 prefix)
  3406. {
  3407. struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
  3408. grh->dgid.global.subnet_prefix = prefix;
  3409. }
  3410. static inline void rdma_ah_set_interface_id(struct rdma_ah_attr *attr,
  3411. __be64 if_id)
  3412. {
  3413. struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
  3414. grh->dgid.global.interface_id = if_id;
  3415. }
  3416. static inline void rdma_ah_set_grh(struct rdma_ah_attr *attr,
  3417. union ib_gid *dgid, u32 flow_label,
  3418. u8 sgid_index, u8 hop_limit,
  3419. u8 traffic_class)
  3420. {
  3421. struct ib_global_route *grh = rdma_ah_retrieve_grh(attr);
  3422. attr->ah_flags = IB_AH_GRH;
  3423. if (dgid)
  3424. grh->dgid = *dgid;
  3425. grh->flow_label = flow_label;
  3426. grh->sgid_index = sgid_index;
  3427. grh->hop_limit = hop_limit;
  3428. grh->traffic_class = traffic_class;
  3429. }
  3430. /**
  3431. * rdma_ah_find_type - Return address handle type.
  3432. *
  3433. * @dev: Device to be checked
  3434. * @port_num: Port number
  3435. */
  3436. static inline enum rdma_ah_attr_type rdma_ah_find_type(struct ib_device *dev,
  3437. u8 port_num)
  3438. {
  3439. if (rdma_protocol_roce(dev, port_num))
  3440. return RDMA_AH_ATTR_TYPE_ROCE;
  3441. if (rdma_protocol_ib(dev, port_num)) {
  3442. if (rdma_cap_opa_ah(dev, port_num))
  3443. return RDMA_AH_ATTR_TYPE_OPA;
  3444. return RDMA_AH_ATTR_TYPE_IB;
  3445. }
  3446. return RDMA_AH_ATTR_TYPE_UNDEFINED;
  3447. }
  3448. /**
  3449. * ib_lid_cpu16 - Return lid in 16bit CPU encoding.
  3450. * In the current implementation the only way to get
  3451. * get the 32bit lid is from other sources for OPA.
  3452. * For IB, lids will always be 16bits so cast the
  3453. * value accordingly.
  3454. *
  3455. * @lid: A 32bit LID
  3456. */
  3457. static inline u16 ib_lid_cpu16(u32 lid)
  3458. {
  3459. WARN_ON_ONCE(lid & 0xFFFF0000);
  3460. return (u16)lid;
  3461. }
  3462. /**
  3463. * ib_lid_be16 - Return lid in 16bit BE encoding.
  3464. *
  3465. * @lid: A 32bit LID
  3466. */
  3467. static inline __be16 ib_lid_be16(u32 lid)
  3468. {
  3469. WARN_ON_ONCE(lid & 0xFFFF0000);
  3470. return cpu_to_be16((u16)lid);
  3471. }
  3472. /**
  3473. * ib_get_vector_affinity - Get the affinity mappings of a given completion
  3474. * vector
  3475. * @device: the rdma device
  3476. * @comp_vector: index of completion vector
  3477. *
  3478. * Returns NULL on failure, otherwise a corresponding cpu map of the
  3479. * completion vector (returns all-cpus map if the device driver doesn't
  3480. * implement get_vector_affinity).
  3481. */
  3482. static inline const struct cpumask *
  3483. ib_get_vector_affinity(struct ib_device *device, int comp_vector)
  3484. {
  3485. if (comp_vector < 0 || comp_vector >= device->num_comp_vectors ||
  3486. !device->get_vector_affinity)
  3487. return NULL;
  3488. return device->get_vector_affinity(device, comp_vector);
  3489. }
/**
 * rdma_roce_rescan_device - Rescan all of the network devices in the system
 *   and add their gids, as needed, to the relevant RoCE devices.
 *
 * @ibdev: the rdma device
 */
void rdma_roce_rescan_device(struct ib_device *ibdev);
  3497. #endif /* IB_VERBS_H */