cm.c 128 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569
  1. /*
  2. * Copyright (c) 2004-2007 Intel Corporation. All rights reserved.
  3. * Copyright (c) 2004 Topspin Corporation. All rights reserved.
  4. * Copyright (c) 2004, 2005 Voltaire Corporation. All rights reserved.
  5. * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
  6. *
  7. * This software is available to you under a choice of one of two
  8. * licenses. You may choose to be licensed under the terms of the GNU
  9. * General Public License (GPL) Version 2, available from the file
  10. * COPYING in the main directory of this source tree, or the
  11. * OpenIB.org BSD license below:
  12. *
  13. * Redistribution and use in source and binary forms, with or
  14. * without modification, are permitted provided that the following
  15. * conditions are met:
  16. *
  17. * - Redistributions of source code must retain the above
  18. * copyright notice, this list of conditions and the following
  19. * disclaimer.
  20. *
  21. * - Redistributions in binary form must reproduce the above
  22. * copyright notice, this list of conditions and the following
  23. * disclaimer in the documentation and/or other materials
  24. * provided with the distribution.
  25. *
  26. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  27. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  28. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  29. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  30. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  31. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  32. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  33. * SOFTWARE.
  34. */
  35. #include <linux/completion.h>
  36. #include <linux/dma-mapping.h>
  37. #include <linux/device.h>
  38. #include <linux/module.h>
  39. #include <linux/err.h>
  40. #include <linux/idr.h>
  41. #include <linux/interrupt.h>
  42. #include <linux/random.h>
  43. #include <linux/rbtree.h>
  44. #include <linux/spinlock.h>
  45. #include <linux/slab.h>
  46. #include <linux/sysfs.h>
  47. #include <linux/workqueue.h>
  48. #include <linux/kdev_t.h>
  49. #include <linux/etherdevice.h>
  50. #include <rdma/ib_cache.h>
  51. #include <rdma/ib_cm.h>
  52. #include "cm_msgs.h"
  53. MODULE_AUTHOR("Sean Hefty");
  54. MODULE_DESCRIPTION("InfiniBand CM");
  55. MODULE_LICENSE("Dual BSD/GPL");
  56. static const char * const ibcm_rej_reason_strs[] = {
  57. [IB_CM_REJ_NO_QP] = "no QP",
  58. [IB_CM_REJ_NO_EEC] = "no EEC",
  59. [IB_CM_REJ_NO_RESOURCES] = "no resources",
  60. [IB_CM_REJ_TIMEOUT] = "timeout",
  61. [IB_CM_REJ_UNSUPPORTED] = "unsupported",
  62. [IB_CM_REJ_INVALID_COMM_ID] = "invalid comm ID",
  63. [IB_CM_REJ_INVALID_COMM_INSTANCE] = "invalid comm instance",
  64. [IB_CM_REJ_INVALID_SERVICE_ID] = "invalid service ID",
  65. [IB_CM_REJ_INVALID_TRANSPORT_TYPE] = "invalid transport type",
  66. [IB_CM_REJ_STALE_CONN] = "stale conn",
  67. [IB_CM_REJ_RDC_NOT_EXIST] = "RDC not exist",
  68. [IB_CM_REJ_INVALID_GID] = "invalid GID",
  69. [IB_CM_REJ_INVALID_LID] = "invalid LID",
  70. [IB_CM_REJ_INVALID_SL] = "invalid SL",
  71. [IB_CM_REJ_INVALID_TRAFFIC_CLASS] = "invalid traffic class",
  72. [IB_CM_REJ_INVALID_HOP_LIMIT] = "invalid hop limit",
  73. [IB_CM_REJ_INVALID_PACKET_RATE] = "invalid packet rate",
  74. [IB_CM_REJ_INVALID_ALT_GID] = "invalid alt GID",
  75. [IB_CM_REJ_INVALID_ALT_LID] = "invalid alt LID",
  76. [IB_CM_REJ_INVALID_ALT_SL] = "invalid alt SL",
  77. [IB_CM_REJ_INVALID_ALT_TRAFFIC_CLASS] = "invalid alt traffic class",
  78. [IB_CM_REJ_INVALID_ALT_HOP_LIMIT] = "invalid alt hop limit",
  79. [IB_CM_REJ_INVALID_ALT_PACKET_RATE] = "invalid alt packet rate",
  80. [IB_CM_REJ_PORT_CM_REDIRECT] = "port CM redirect",
  81. [IB_CM_REJ_PORT_REDIRECT] = "port redirect",
  82. [IB_CM_REJ_INVALID_MTU] = "invalid MTU",
  83. [IB_CM_REJ_INSUFFICIENT_RESP_RESOURCES] = "insufficient resp resources",
  84. [IB_CM_REJ_CONSUMER_DEFINED] = "consumer defined",
  85. [IB_CM_REJ_INVALID_RNR_RETRY] = "invalid RNR retry",
  86. [IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID] = "duplicate local comm ID",
  87. [IB_CM_REJ_INVALID_CLASS_VERSION] = "invalid class version",
  88. [IB_CM_REJ_INVALID_FLOW_LABEL] = "invalid flow label",
  89. [IB_CM_REJ_INVALID_ALT_FLOW_LABEL] = "invalid alt flow label",
  90. };
  91. const char *__attribute_const__ ibcm_reject_msg(int reason)
  92. {
  93. size_t index = reason;
  94. if (index < ARRAY_SIZE(ibcm_rej_reason_strs) &&
  95. ibcm_rej_reason_strs[index])
  96. return ibcm_rej_reason_strs[index];
  97. else
  98. return "unrecognized reason";
  99. }
  100. EXPORT_SYMBOL(ibcm_reject_msg);
  101. static void cm_add_one(struct ib_device *device);
  102. static void cm_remove_one(struct ib_device *device, void *client_data);
  103. static struct ib_client cm_client = {
  104. .name = "cm",
  105. .add = cm_add_one,
  106. .remove = cm_remove_one
  107. };
  108. static struct ib_cm {
  109. spinlock_t lock;
  110. struct list_head device_list;
  111. rwlock_t device_lock;
  112. struct rb_root listen_service_table;
  113. u64 listen_service_id;
  114. /* struct rb_root peer_service_table; todo: fix peer to peer */
  115. struct rb_root remote_qp_table;
  116. struct rb_root remote_id_table;
  117. struct rb_root remote_sidr_table;
  118. struct idr local_id_table;
  119. __be32 random_id_operand;
  120. struct list_head timewait_list;
  121. struct workqueue_struct *wq;
  122. /* Sync on cm change port state */
  123. spinlock_t state_lock;
  124. } cm;
  /*
   * Counter indexes, ordered by attribute ID.  CM_ATTR_COUNT is the number of
   * counters and sizes cm_counter_group.counter[].
   */
  enum {
      CM_REQ_COUNTER,
      CM_MRA_COUNTER,
      CM_REJ_COUNTER,
      CM_REP_COUNTER,
      CM_RTU_COUNTER,
      CM_DREQ_COUNTER,
      CM_DREP_COUNTER,
      CM_SIDR_REQ_COUNTER,
      CM_SIDR_REP_COUNTER,
      CM_LAP_COUNTER,
      CM_APR_COUNTER,
      CM_ATTR_COUNT,
      /* NOTE(review): presumably the attribute ID of the first counter - confirm at the use site. */
      CM_ATTR_ID_OFFSET = 0x0010,
  };
  /*
   * Counter groups kept per port.  CM_COUNTER_GROUPS is the number of groups
   * and sizes both cm_port.counter_group[] and counter_group_names[].
   */
  enum {
      CM_XMIT,
      CM_XMIT_RETRIES,
      CM_RECV,
      CM_RECV_DUPLICATES,
      CM_COUNTER_GROUPS
  };
  148. static char const counter_group_names[CM_COUNTER_GROUPS]
  149. [sizeof("cm_rx_duplicates")] = {
  150. "cm_tx_msgs", "cm_tx_retries",
  151. "cm_rx_msgs", "cm_rx_duplicates"
  152. };
  153. struct cm_counter_group {
  154. struct kobject obj;
  155. atomic_long_t counter[CM_ATTR_COUNT];
  156. };
  157. struct cm_counter_attribute {
  158. struct attribute attr;
  159. int index;
  160. };
  /*
   * Define a cm_counter_attribute object named cm_<_name>_counter_attr.  The
   * attribute's name is the stringified _name, its mode is 0444 (read-only),
   * and it refers to counter _index.  The storage class is supplied by the
   * user of the macro.
   */
  #define CM_COUNTER_ATTR(_name, _index)                              \
  struct cm_counter_attribute cm_##_name##_counter_attr = {           \
      .attr = { .name = __stringify(_name), .mode = 0444 },           \
      .index = _index                                                 \
  }
  /* One attribute object per counter index. */
  static CM_COUNTER_ATTR(req,      CM_REQ_COUNTER);
  static CM_COUNTER_ATTR(mra,      CM_MRA_COUNTER);
  static CM_COUNTER_ATTR(rej,      CM_REJ_COUNTER);
  static CM_COUNTER_ATTR(rep,      CM_REP_COUNTER);
  static CM_COUNTER_ATTR(rtu,      CM_RTU_COUNTER);
  static CM_COUNTER_ATTR(dreq,     CM_DREQ_COUNTER);
  static CM_COUNTER_ATTR(drep,     CM_DREP_COUNTER);
  static CM_COUNTER_ATTR(sidr_req, CM_SIDR_REQ_COUNTER);
  static CM_COUNTER_ATTR(sidr_rep, CM_SIDR_REP_COUNTER);
  static CM_COUNTER_ATTR(lap,      CM_LAP_COUNTER);
  static CM_COUNTER_ATTR(apr,      CM_APR_COUNTER);
  177. static struct attribute *cm_counter_default_attrs[] = {
  178. &cm_req_counter_attr.attr,
  179. &cm_mra_counter_attr.attr,
  180. &cm_rej_counter_attr.attr,
  181. &cm_rep_counter_attr.attr,
  182. &cm_rtu_counter_attr.attr,
  183. &cm_dreq_counter_attr.attr,
  184. &cm_drep_counter_attr.attr,
  185. &cm_sidr_req_counter_attr.attr,
  186. &cm_sidr_rep_counter_attr.attr,
  187. &cm_lap_counter_attr.attr,
  188. &cm_apr_counter_attr.attr,
  189. NULL
  190. };
  191. struct cm_port {
  192. struct cm_device *cm_dev;
  193. struct ib_mad_agent *mad_agent;
  194. struct kobject port_obj;
  195. u8 port_num;
  196. struct list_head cm_priv_prim_list;
  197. struct list_head cm_priv_altr_list;
  198. struct cm_counter_group counter_group[CM_COUNTER_GROUPS];
  199. };
  200. struct cm_device {
  201. struct list_head list;
  202. struct ib_device *ib_device;
  203. struct device *device;
  204. u8 ack_delay;
  205. int going_down;
  206. struct cm_port *port[0];
  207. };
  208. struct cm_av {
  209. struct cm_port *port;
  210. union ib_gid dgid;
  211. struct rdma_ah_attr ah_attr;
  212. u16 pkey_index;
  213. u8 timeout;
  214. };
  215. struct cm_work {
  216. struct delayed_work work;
  217. struct list_head list;
  218. struct cm_port *port;
  219. struct ib_mad_recv_wc *mad_recv_wc; /* Received MADs */
  220. __be32 local_id; /* Established / timewait */
  221. __be32 remote_id;
  222. struct ib_cm_event cm_event;
  223. struct sa_path_rec path[0];
  224. };
  225. struct cm_timewait_info {
  226. struct cm_work work; /* Must be first. */
  227. struct list_head list;
  228. struct rb_node remote_qp_node;
  229. struct rb_node remote_id_node;
  230. __be64 remote_ca_guid;
  231. __be32 remote_qpn;
  232. u8 inserted_remote_qp;
  233. u8 inserted_remote_id;
  234. };
  235. struct cm_id_private {
  236. struct ib_cm_id id;
  237. struct rb_node service_node;
  238. struct rb_node sidr_id_node;
  239. spinlock_t lock; /* Do not acquire inside cm.lock */
  240. struct completion comp;
  241. atomic_t refcount;
  242. /* Number of clients sharing this ib_cm_id. Only valid for listeners.
  243. * Protected by the cm.lock spinlock. */
  244. int listen_sharecount;
  245. struct ib_mad_send_buf *msg;
  246. struct cm_timewait_info *timewait_info;
  247. /* todo: use alternate port on send failure */
  248. struct cm_av av;
  249. struct cm_av alt_av;
  250. void *private_data;
  251. __be64 tid;
  252. __be32 local_qpn;
  253. __be32 remote_qpn;
  254. enum ib_qp_type qp_type;
  255. __be32 sq_psn;
  256. __be32 rq_psn;
  257. int timeout_ms;
  258. enum ib_mtu path_mtu;
  259. __be16 pkey;
  260. u8 private_data_len;
  261. u8 max_cm_retries;
  262. u8 peer_to_peer;
  263. u8 responder_resources;
  264. u8 initiator_depth;
  265. u8 retry_count;
  266. u8 rnr_retry_count;
  267. u8 service_timeout;
  268. u8 target_ack_delay;
  269. struct list_head prim_list;
  270. struct list_head altr_list;
  271. /* Indicates that the send port mad is registered and av is set */
  272. int prim_send_port_not_ready;
  273. int altr_send_port_not_ready;
  274. struct list_head work_list;
  275. atomic_t work_count;
  276. };
  277. static void cm_work_handler(struct work_struct *work);
  278. static inline void cm_deref_id(struct cm_id_private *cm_id_priv)
  279. {
  280. if (atomic_dec_and_test(&cm_id_priv->refcount))
  281. complete(&cm_id_priv->comp);
  282. }
  283. static int cm_alloc_msg(struct cm_id_private *cm_id_priv,
  284. struct ib_mad_send_buf **msg)
  285. {
  286. struct ib_mad_agent *mad_agent;
  287. struct ib_mad_send_buf *m;
  288. struct ib_ah *ah;
  289. struct cm_av *av;
  290. unsigned long flags, flags2;
  291. int ret = 0;
  292. /* don't let the port to be released till the agent is down */
  293. spin_lock_irqsave(&cm.state_lock, flags2);
  294. spin_lock_irqsave(&cm.lock, flags);
  295. if (!cm_id_priv->prim_send_port_not_ready)
  296. av = &cm_id_priv->av;
  297. else if (!cm_id_priv->altr_send_port_not_ready &&
  298. (cm_id_priv->alt_av.port))
  299. av = &cm_id_priv->alt_av;
  300. else {
  301. pr_info("%s: not valid CM id\n", __func__);
  302. ret = -ENODEV;
  303. spin_unlock_irqrestore(&cm.lock, flags);
  304. goto out;
  305. }
  306. spin_unlock_irqrestore(&cm.lock, flags);
  307. /* Make sure the port haven't released the mad yet */
  308. mad_agent = cm_id_priv->av.port->mad_agent;
  309. if (!mad_agent) {
  310. pr_info("%s: not a valid MAD agent\n", __func__);
  311. ret = -ENODEV;
  312. goto out;
  313. }
  314. ah = rdma_create_ah(mad_agent->qp->pd, &av->ah_attr);
  315. if (IS_ERR(ah)) {
  316. ret = PTR_ERR(ah);
  317. goto out;
  318. }
  319. m = ib_create_send_mad(mad_agent, cm_id_priv->id.remote_cm_qpn,
  320. av->pkey_index,
  321. 0, IB_MGMT_MAD_HDR, IB_MGMT_MAD_DATA,
  322. GFP_ATOMIC,
  323. IB_MGMT_BASE_VERSION);
  324. if (IS_ERR(m)) {
  325. rdma_destroy_ah(ah);
  326. ret = PTR_ERR(m);
  327. goto out;
  328. }
  329. /* Timeout set by caller if response is expected. */
  330. m->ah = ah;
  331. m->retries = cm_id_priv->max_cm_retries;
  332. atomic_inc(&cm_id_priv->refcount);
  333. m->context[0] = cm_id_priv;
  334. *msg = m;
  335. out:
  336. spin_unlock_irqrestore(&cm.state_lock, flags2);
  337. return ret;
  338. }
  339. static struct ib_mad_send_buf *cm_alloc_response_msg_no_ah(struct cm_port *port,
  340. struct ib_mad_recv_wc *mad_recv_wc)
  341. {
  342. return ib_create_send_mad(port->mad_agent, 1, mad_recv_wc->wc->pkey_index,
  343. 0, IB_MGMT_MAD_HDR, IB_MGMT_MAD_DATA,
  344. GFP_ATOMIC,
  345. IB_MGMT_BASE_VERSION);
  346. }
  347. static int cm_create_response_msg_ah(struct cm_port *port,
  348. struct ib_mad_recv_wc *mad_recv_wc,
  349. struct ib_mad_send_buf *msg)
  350. {
  351. struct ib_ah *ah;
  352. ah = ib_create_ah_from_wc(port->mad_agent->qp->pd, mad_recv_wc->wc,
  353. mad_recv_wc->recv_buf.grh, port->port_num);
  354. if (IS_ERR(ah))
  355. return PTR_ERR(ah);
  356. msg->ah = ah;
  357. return 0;
  358. }
  359. static void cm_free_msg(struct ib_mad_send_buf *msg)
  360. {
  361. if (msg->ah)
  362. rdma_destroy_ah(msg->ah);
  363. if (msg->context[0])
  364. cm_deref_id(msg->context[0]);
  365. ib_free_send_mad(msg);
  366. }
  /*
   * Allocate a response MAD for a received MAD and attach an address handle
   * derived from it.  On success *@msg receives the buffer and 0 is returned.
   * On failure a negative errno is returned, *@msg is left untouched, and any
   * partially built message has already been freed.
   */
  static int cm_alloc_response_msg(struct cm_port *port,
                                   struct ib_mad_recv_wc *mad_recv_wc,
                                   struct ib_mad_send_buf **msg)
  {
      struct ib_mad_send_buf *resp;
      int err;

      resp = cm_alloc_response_msg_no_ah(port, mad_recv_wc);
      if (IS_ERR(resp))
          return PTR_ERR(resp);

      err = cm_create_response_msg_ah(port, mad_recv_wc, resp);
      if (!err) {
          *msg = resp;
          return 0;
      }

      cm_free_msg(resp);
      return err;
  }
  384. static void * cm_copy_private_data(const void *private_data,
  385. u8 private_data_len)
  386. {
  387. void *data;
  388. if (!private_data || !private_data_len)
  389. return NULL;
  390. data = kmemdup(private_data, private_data_len, GFP_KERNEL);
  391. if (!data)
  392. return ERR_PTR(-ENOMEM);
  393. return data;
  394. }
  395. static void cm_set_private_data(struct cm_id_private *cm_id_priv,
  396. void *private_data, u8 private_data_len)
  397. {
  398. if (cm_id_priv->private_data && cm_id_priv->private_data_len)
  399. kfree(cm_id_priv->private_data);
  400. cm_id_priv->private_data = private_data;
  401. cm_id_priv->private_data_len = private_data_len;
  402. }
  403. static int cm_init_av_for_lap(struct cm_port *port, struct ib_wc *wc,
  404. struct ib_grh *grh, struct cm_av *av)
  405. {
  406. struct rdma_ah_attr new_ah_attr;
  407. int ret;
  408. av->port = port;
  409. av->pkey_index = wc->pkey_index;
  410. /*
  411. * av->ah_attr might be initialized based on past wc during incoming
  412. * connect request or while sending out connect request. So initialize
  413. * a new ah_attr on stack. If initialization fails, old ah_attr is
  414. * used for sending any responses. If initialization is successful,
  415. * than new ah_attr is used by overwriting old one.
  416. */
  417. ret = ib_init_ah_attr_from_wc(port->cm_dev->ib_device,
  418. port->port_num, wc,
  419. grh, &new_ah_attr);
  420. if (ret)
  421. return ret;
  422. rdma_move_ah_attr(&av->ah_attr, &new_ah_attr);
  423. return 0;
  424. }
  425. static int cm_init_av_for_response(struct cm_port *port, struct ib_wc *wc,
  426. struct ib_grh *grh, struct cm_av *av)
  427. {
  428. av->port = port;
  429. av->pkey_index = wc->pkey_index;
  430. return ib_init_ah_attr_from_wc(port->cm_dev->ib_device,
  431. port->port_num, wc,
  432. grh, &av->ah_attr);
  433. }
  434. static int add_cm_id_to_port_list(struct cm_id_private *cm_id_priv,
  435. struct cm_av *av,
  436. struct cm_port *port)
  437. {
  438. unsigned long flags;
  439. int ret = 0;
  440. spin_lock_irqsave(&cm.lock, flags);
  441. if (&cm_id_priv->av == av)
  442. list_add_tail(&cm_id_priv->prim_list, &port->cm_priv_prim_list);
  443. else if (&cm_id_priv->alt_av == av)
  444. list_add_tail(&cm_id_priv->altr_list, &port->cm_priv_altr_list);
  445. else
  446. ret = -EINVAL;
  447. spin_unlock_irqrestore(&cm.lock, flags);
  448. return ret;
  449. }
  450. static struct cm_port *
  451. get_cm_port_from_path(struct sa_path_rec *path, const struct ib_gid_attr *attr)
  452. {
  453. struct cm_device *cm_dev;
  454. struct cm_port *port = NULL;
  455. unsigned long flags;
  456. if (attr) {
  457. read_lock_irqsave(&cm.device_lock, flags);
  458. list_for_each_entry(cm_dev, &cm.device_list, list) {
  459. if (cm_dev->ib_device == attr->device) {
  460. port = cm_dev->port[attr->port_num - 1];
  461. break;
  462. }
  463. }
  464. read_unlock_irqrestore(&cm.device_lock, flags);
  465. } else {
  466. /* SGID attribute can be NULL in following
  467. * conditions.
  468. * (a) Alternative path
  469. * (b) IB link layer without GRH
  470. * (c) LAP send messages
  471. */
  472. read_lock_irqsave(&cm.device_lock, flags);
  473. list_for_each_entry(cm_dev, &cm.device_list, list) {
  474. attr = rdma_find_gid(cm_dev->ib_device,
  475. &path->sgid,
  476. sa_conv_pathrec_to_gid_type(path),
  477. NULL);
  478. if (!IS_ERR(attr)) {
  479. port = cm_dev->port[attr->port_num - 1];
  480. break;
  481. }
  482. }
  483. read_unlock_irqrestore(&cm.device_lock, flags);
  484. if (port)
  485. rdma_put_gid_attr(attr);
  486. }
  487. return port;
  488. }
  489. static int cm_init_av_by_path(struct sa_path_rec *path,
  490. const struct ib_gid_attr *sgid_attr,
  491. struct cm_av *av,
  492. struct cm_id_private *cm_id_priv)
  493. {
  494. struct rdma_ah_attr new_ah_attr;
  495. struct cm_device *cm_dev;
  496. struct cm_port *port;
  497. int ret;
  498. port = get_cm_port_from_path(path, sgid_attr);
  499. if (!port)
  500. return -EINVAL;
  501. cm_dev = port->cm_dev;
  502. ret = ib_find_cached_pkey(cm_dev->ib_device, port->port_num,
  503. be16_to_cpu(path->pkey), &av->pkey_index);
  504. if (ret)
  505. return ret;
  506. av->port = port;
  507. /*
  508. * av->ah_attr might be initialized based on wc or during
  509. * request processing time which might have reference to sgid_attr.
  510. * So initialize a new ah_attr on stack.
  511. * If initialization fails, old ah_attr is used for sending any
  512. * responses. If initialization is successful, than new ah_attr
  513. * is used by overwriting the old one. So that right ah_attr
  514. * can be used to return an error response.
  515. */
  516. ret = ib_init_ah_attr_from_path(cm_dev->ib_device, port->port_num, path,
  517. &new_ah_attr, sgid_attr);
  518. if (ret)
  519. return ret;
  520. av->timeout = path->packet_life_time + 1;
  521. ret = add_cm_id_to_port_list(cm_id_priv, av, port);
  522. if (ret) {
  523. rdma_destroy_ah_attr(&new_ah_attr);
  524. return ret;
  525. }
  526. rdma_move_ah_attr(&av->ah_attr, &new_ah_attr);
  527. return 0;
  528. }
  529. static int cm_alloc_id(struct cm_id_private *cm_id_priv)
  530. {
  531. unsigned long flags;
  532. int id;
  533. idr_preload(GFP_KERNEL);
  534. spin_lock_irqsave(&cm.lock, flags);
  535. id = idr_alloc_cyclic(&cm.local_id_table, cm_id_priv, 0, 0, GFP_NOWAIT);
  536. spin_unlock_irqrestore(&cm.lock, flags);
  537. idr_preload_end();
  538. cm_id_priv->id.local_id = (__force __be32)id ^ cm.random_id_operand;
  539. return id < 0 ? id : 0;
  540. }
  541. static void cm_free_id(__be32 local_id)
  542. {
  543. spin_lock_irq(&cm.lock);
  544. idr_remove(&cm.local_id_table,
  545. (__force int) (local_id ^ cm.random_id_operand));
  546. spin_unlock_irq(&cm.lock);
  547. }
  548. static struct cm_id_private * cm_get_id(__be32 local_id, __be32 remote_id)
  549. {
  550. struct cm_id_private *cm_id_priv;
  551. cm_id_priv = idr_find(&cm.local_id_table,
  552. (__force int) (local_id ^ cm.random_id_operand));
  553. if (cm_id_priv) {
  554. if (cm_id_priv->id.remote_id == remote_id)
  555. atomic_inc(&cm_id_priv->refcount);
  556. else
  557. cm_id_priv = NULL;
  558. }
  559. return cm_id_priv;
  560. }
  561. static struct cm_id_private * cm_acquire_id(__be32 local_id, __be32 remote_id)
  562. {
  563. struct cm_id_private *cm_id_priv;
  564. spin_lock_irq(&cm.lock);
  565. cm_id_priv = cm_get_id(local_id, remote_id);
  566. spin_unlock_irq(&cm.lock);
  567. return cm_id_priv;
  568. }
  569. /*
  570. * Trivial helpers to strip endian annotation and compare; the
  571. * endianness doesn't actually matter since we just need a stable
  572. * order for the RB tree.
  573. */
  574. static int be32_lt(__be32 a, __be32 b)
  575. {
  576. return (__force u32) a < (__force u32) b;
  577. }
  578. static int be32_gt(__be32 a, __be32 b)
  579. {
  580. return (__force u32) a > (__force u32) b;
  581. }
  582. static int be64_lt(__be64 a, __be64 b)
  583. {
  584. return (__force u64) a < (__force u64) b;
  585. }
  586. static int be64_gt(__be64 a, __be64 b)
  587. {
  588. return (__force u64) a > (__force u64) b;
  589. }
  590. static struct cm_id_private * cm_insert_listen(struct cm_id_private *cm_id_priv)
  591. {
  592. struct rb_node **link = &cm.listen_service_table.rb_node;
  593. struct rb_node *parent = NULL;
  594. struct cm_id_private *cur_cm_id_priv;
  595. __be64 service_id = cm_id_priv->id.service_id;
  596. __be64 service_mask = cm_id_priv->id.service_mask;
  597. while (*link) {
  598. parent = *link;
  599. cur_cm_id_priv = rb_entry(parent, struct cm_id_private,
  600. service_node);
  601. if ((cur_cm_id_priv->id.service_mask & service_id) ==
  602. (service_mask & cur_cm_id_priv->id.service_id) &&
  603. (cm_id_priv->id.device == cur_cm_id_priv->id.device))
  604. return cur_cm_id_priv;
  605. if (cm_id_priv->id.device < cur_cm_id_priv->id.device)
  606. link = &(*link)->rb_left;
  607. else if (cm_id_priv->id.device > cur_cm_id_priv->id.device)
  608. link = &(*link)->rb_right;
  609. else if (be64_lt(service_id, cur_cm_id_priv->id.service_id))
  610. link = &(*link)->rb_left;
  611. else if (be64_gt(service_id, cur_cm_id_priv->id.service_id))
  612. link = &(*link)->rb_right;
  613. else
  614. link = &(*link)->rb_right;
  615. }
  616. rb_link_node(&cm_id_priv->service_node, parent, link);
  617. rb_insert_color(&cm_id_priv->service_node, &cm.listen_service_table);
  618. return NULL;
  619. }
  620. static struct cm_id_private * cm_find_listen(struct ib_device *device,
  621. __be64 service_id)
  622. {
  623. struct rb_node *node = cm.listen_service_table.rb_node;
  624. struct cm_id_private *cm_id_priv;
  625. while (node) {
  626. cm_id_priv = rb_entry(node, struct cm_id_private, service_node);
  627. if ((cm_id_priv->id.service_mask & service_id) ==
  628. cm_id_priv->id.service_id &&
  629. (cm_id_priv->id.device == device))
  630. return cm_id_priv;
  631. if (device < cm_id_priv->id.device)
  632. node = node->rb_left;
  633. else if (device > cm_id_priv->id.device)
  634. node = node->rb_right;
  635. else if (be64_lt(service_id, cm_id_priv->id.service_id))
  636. node = node->rb_left;
  637. else if (be64_gt(service_id, cm_id_priv->id.service_id))
  638. node = node->rb_right;
  639. else
  640. node = node->rb_right;
  641. }
  642. return NULL;
  643. }
  644. static struct cm_timewait_info * cm_insert_remote_id(struct cm_timewait_info
  645. *timewait_info)
  646. {
  647. struct rb_node **link = &cm.remote_id_table.rb_node;
  648. struct rb_node *parent = NULL;
  649. struct cm_timewait_info *cur_timewait_info;
  650. __be64 remote_ca_guid = timewait_info->remote_ca_guid;
  651. __be32 remote_id = timewait_info->work.remote_id;
  652. while (*link) {
  653. parent = *link;
  654. cur_timewait_info = rb_entry(parent, struct cm_timewait_info,
  655. remote_id_node);
  656. if (be32_lt(remote_id, cur_timewait_info->work.remote_id))
  657. link = &(*link)->rb_left;
  658. else if (be32_gt(remote_id, cur_timewait_info->work.remote_id))
  659. link = &(*link)->rb_right;
  660. else if (be64_lt(remote_ca_guid, cur_timewait_info->remote_ca_guid))
  661. link = &(*link)->rb_left;
  662. else if (be64_gt(remote_ca_guid, cur_timewait_info->remote_ca_guid))
  663. link = &(*link)->rb_right;
  664. else
  665. return cur_timewait_info;
  666. }
  667. timewait_info->inserted_remote_id = 1;
  668. rb_link_node(&timewait_info->remote_id_node, parent, link);
  669. rb_insert_color(&timewait_info->remote_id_node, &cm.remote_id_table);
  670. return NULL;
  671. }
  672. static struct cm_timewait_info * cm_find_remote_id(__be64 remote_ca_guid,
  673. __be32 remote_id)
  674. {
  675. struct rb_node *node = cm.remote_id_table.rb_node;
  676. struct cm_timewait_info *timewait_info;
  677. while (node) {
  678. timewait_info = rb_entry(node, struct cm_timewait_info,
  679. remote_id_node);
  680. if (be32_lt(remote_id, timewait_info->work.remote_id))
  681. node = node->rb_left;
  682. else if (be32_gt(remote_id, timewait_info->work.remote_id))
  683. node = node->rb_right;
  684. else if (be64_lt(remote_ca_guid, timewait_info->remote_ca_guid))
  685. node = node->rb_left;
  686. else if (be64_gt(remote_ca_guid, timewait_info->remote_ca_guid))
  687. node = node->rb_right;
  688. else
  689. return timewait_info;
  690. }
  691. return NULL;
  692. }
  693. static struct cm_timewait_info * cm_insert_remote_qpn(struct cm_timewait_info
  694. *timewait_info)
  695. {
  696. struct rb_node **link = &cm.remote_qp_table.rb_node;
  697. struct rb_node *parent = NULL;
  698. struct cm_timewait_info *cur_timewait_info;
  699. __be64 remote_ca_guid = timewait_info->remote_ca_guid;
  700. __be32 remote_qpn = timewait_info->remote_qpn;
  701. while (*link) {
  702. parent = *link;
  703. cur_timewait_info = rb_entry(parent, struct cm_timewait_info,
  704. remote_qp_node);
  705. if (be32_lt(remote_qpn, cur_timewait_info->remote_qpn))
  706. link = &(*link)->rb_left;
  707. else if (be32_gt(remote_qpn, cur_timewait_info->remote_qpn))
  708. link = &(*link)->rb_right;
  709. else if (be64_lt(remote_ca_guid, cur_timewait_info->remote_ca_guid))
  710. link = &(*link)->rb_left;
  711. else if (be64_gt(remote_ca_guid, cur_timewait_info->remote_ca_guid))
  712. link = &(*link)->rb_right;
  713. else
  714. return cur_timewait_info;
  715. }
  716. timewait_info->inserted_remote_qp = 1;
  717. rb_link_node(&timewait_info->remote_qp_node, parent, link);
  718. rb_insert_color(&timewait_info->remote_qp_node, &cm.remote_qp_table);
  719. return NULL;
  720. }
  721. static struct cm_id_private * cm_insert_remote_sidr(struct cm_id_private
  722. *cm_id_priv)
  723. {
  724. struct rb_node **link = &cm.remote_sidr_table.rb_node;
  725. struct rb_node *parent = NULL;
  726. struct cm_id_private *cur_cm_id_priv;
  727. union ib_gid *port_gid = &cm_id_priv->av.dgid;
  728. __be32 remote_id = cm_id_priv->id.remote_id;
  729. while (*link) {
  730. parent = *link;
  731. cur_cm_id_priv = rb_entry(parent, struct cm_id_private,
  732. sidr_id_node);
  733. if (be32_lt(remote_id, cur_cm_id_priv->id.remote_id))
  734. link = &(*link)->rb_left;
  735. else if (be32_gt(remote_id, cur_cm_id_priv->id.remote_id))
  736. link = &(*link)->rb_right;
  737. else {
  738. int cmp;
  739. cmp = memcmp(port_gid, &cur_cm_id_priv->av.dgid,
  740. sizeof *port_gid);
  741. if (cmp < 0)
  742. link = &(*link)->rb_left;
  743. else if (cmp > 0)
  744. link = &(*link)->rb_right;
  745. else
  746. return cur_cm_id_priv;
  747. }
  748. }
  749. rb_link_node(&cm_id_priv->sidr_id_node, parent, link);
  750. rb_insert_color(&cm_id_priv->sidr_id_node, &cm.remote_sidr_table);
  751. return NULL;
  752. }
  753. static void cm_reject_sidr_req(struct cm_id_private *cm_id_priv,
  754. enum ib_cm_sidr_status status)
  755. {
  756. struct ib_cm_sidr_rep_param param;
  757. memset(&param, 0, sizeof param);
  758. param.status = status;
  759. ib_send_cm_sidr_rep(&cm_id_priv->id, &param);
  760. }
  761. struct ib_cm_id *ib_create_cm_id(struct ib_device *device,
  762. ib_cm_handler cm_handler,
  763. void *context)
  764. {
  765. struct cm_id_private *cm_id_priv;
  766. int ret;
  767. cm_id_priv = kzalloc(sizeof *cm_id_priv, GFP_KERNEL);
  768. if (!cm_id_priv)
  769. return ERR_PTR(-ENOMEM);
  770. cm_id_priv->id.state = IB_CM_IDLE;
  771. cm_id_priv->id.device = device;
  772. cm_id_priv->id.cm_handler = cm_handler;
  773. cm_id_priv->id.context = context;
  774. cm_id_priv->id.remote_cm_qpn = 1;
  775. ret = cm_alloc_id(cm_id_priv);
  776. if (ret)
  777. goto error;
  778. spin_lock_init(&cm_id_priv->lock);
  779. init_completion(&cm_id_priv->comp);
  780. INIT_LIST_HEAD(&cm_id_priv->work_list);
  781. INIT_LIST_HEAD(&cm_id_priv->prim_list);
  782. INIT_LIST_HEAD(&cm_id_priv->altr_list);
  783. atomic_set(&cm_id_priv->work_count, -1);
  784. atomic_set(&cm_id_priv->refcount, 1);
  785. return &cm_id_priv->id;
  786. error:
  787. kfree(cm_id_priv);
  788. return ERR_PTR(-ENOMEM);
  789. }
  790. EXPORT_SYMBOL(ib_create_cm_id);
  791. static struct cm_work * cm_dequeue_work(struct cm_id_private *cm_id_priv)
  792. {
  793. struct cm_work *work;
  794. if (list_empty(&cm_id_priv->work_list))
  795. return NULL;
  796. work = list_entry(cm_id_priv->work_list.next, struct cm_work, list);
  797. list_del(&work->list);
  798. return work;
  799. }
  800. static void cm_free_work(struct cm_work *work)
  801. {
  802. if (work->mad_recv_wc)
  803. ib_free_recv_mad(work->mad_recv_wc);
  804. kfree(work);
  805. }
  /*
   * Approximate conversion to milliseconds of an IBA-encoded time, i.e.
   * 4.096us x 2^iba_time, computed as 2^(iba_time - 8).
   *
   * Exponents below 8 yield 1 ms.  The shift is capped at 30 so the result
   * always fits in a positive int: shifting an int by 31 or more is
   * undefined behaviour.  Results for exponents up to 38 are unchanged.
   */
  static inline int cm_convert_to_ms(int iba_time)
  {
      int shift = iba_time - 8;

      if (shift < 0)
          shift = 0;
      else if (shift > 30)
          shift = 30;

      return 1 << shift;
  }
  811. /*
  812. * calculate: 4.096x2^ack_timeout = 4.096x2^ack_delay + 2x4.096x2^life_time
  813. * Because of how ack_timeout is stored, adding one doubles the timeout.
  814. * To avoid large timeouts, select the max(ack_delay, life_time + 1), and
  815. * increment it (round up) only if the other is within 50%.
  816. */
  817. static u8 cm_ack_timeout(u8 ca_ack_delay, u8 packet_life_time)
  818. {
  819. int ack_timeout = packet_life_time + 1;
  820. if (ack_timeout >= ca_ack_delay)
  821. ack_timeout += (ca_ack_delay >= (ack_timeout - 1));
  822. else
  823. ack_timeout = ca_ack_delay +
  824. (ack_timeout >= (ca_ack_delay - 1));
  825. return min(31, ack_timeout);
  826. }
  827. static void cm_cleanup_timewait(struct cm_timewait_info *timewait_info)
  828. {
  829. if (timewait_info->inserted_remote_id) {
  830. rb_erase(&timewait_info->remote_id_node, &cm.remote_id_table);
  831. timewait_info->inserted_remote_id = 0;
  832. }
  833. if (timewait_info->inserted_remote_qp) {
  834. rb_erase(&timewait_info->remote_qp_node, &cm.remote_qp_table);
  835. timewait_info->inserted_remote_qp = 0;
  836. }
  837. }
  838. static struct cm_timewait_info * cm_create_timewait_info(__be32 local_id)
  839. {
  840. struct cm_timewait_info *timewait_info;
  841. timewait_info = kzalloc(sizeof *timewait_info, GFP_KERNEL);
  842. if (!timewait_info)
  843. return ERR_PTR(-ENOMEM);
  844. timewait_info->work.local_id = local_id;
  845. INIT_DELAYED_WORK(&timewait_info->work.work, cm_work_handler);
  846. timewait_info->work.cm_event.event = IB_CM_TIMEWAIT_EXIT;
  847. return timewait_info;
  848. }
  849. static void cm_enter_timewait(struct cm_id_private *cm_id_priv)
  850. {
  851. int wait_time;
  852. unsigned long flags;
  853. struct cm_device *cm_dev;
  854. cm_dev = ib_get_client_data(cm_id_priv->id.device, &cm_client);
  855. if (!cm_dev)
  856. return;
  857. spin_lock_irqsave(&cm.lock, flags);
  858. cm_cleanup_timewait(cm_id_priv->timewait_info);
  859. list_add_tail(&cm_id_priv->timewait_info->list, &cm.timewait_list);
  860. spin_unlock_irqrestore(&cm.lock, flags);
  861. /*
  862. * The cm_id could be destroyed by the user before we exit timewait.
  863. * To protect against this, we search for the cm_id after exiting
  864. * timewait before notifying the user that we've exited timewait.
  865. */
  866. cm_id_priv->id.state = IB_CM_TIMEWAIT;
  867. wait_time = cm_convert_to_ms(cm_id_priv->av.timeout);
  868. /* Check if the device started its remove_one */
  869. spin_lock_irqsave(&cm.lock, flags);
  870. if (!cm_dev->going_down)
  871. queue_delayed_work(cm.wq, &cm_id_priv->timewait_info->work.work,
  872. msecs_to_jiffies(wait_time));
  873. spin_unlock_irqrestore(&cm.lock, flags);
  874. cm_id_priv->timewait_info = NULL;
  875. }
  876. static void cm_reset_to_idle(struct cm_id_private *cm_id_priv)
  877. {
  878. unsigned long flags;
  879. cm_id_priv->id.state = IB_CM_IDLE;
  880. if (cm_id_priv->timewait_info) {
  881. spin_lock_irqsave(&cm.lock, flags);
  882. cm_cleanup_timewait(cm_id_priv->timewait_info);
  883. spin_unlock_irqrestore(&cm.lock, flags);
  884. kfree(cm_id_priv->timewait_info);
  885. cm_id_priv->timewait_info = NULL;
  886. }
  887. }
  /*
   * Tear down a cm_id: run the state-specific shutdown action, unlink the
   * id from the global tables, wait on its completion and free it.
   *
   * @cm_id: identifier to destroy.
   * @err:   only consulted in IB_CM_REQ_RCVD, where -ENOMEM resets the id to
   *         idle instead of sending a REJ.
   *
   * For a shared listener (listen_sharecount still above zero after the
   * decrement) only one reference is dropped and the function returns
   * without freeing anything.
   */
  static void cm_destroy_id(struct ib_cm_id *cm_id, int err)
  {
      struct cm_id_private *cm_id_priv;
      struct cm_work *work;

      cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  retest:
      spin_lock_irq(&cm_id_priv->lock);
      switch (cm_id->state) {
      case IB_CM_LISTEN:
          /* Listener bookkeeping is done under cm.lock, not the id lock. */
          spin_unlock_irq(&cm_id_priv->lock);

          spin_lock_irq(&cm.lock);
          if (--cm_id_priv->listen_sharecount > 0) {
              /* The id is still shared. */
              cm_deref_id(cm_id_priv);
              spin_unlock_irq(&cm.lock);
              return;
          }
          rb_erase(&cm_id_priv->service_node, &cm.listen_service_table);
          spin_unlock_irq(&cm.lock);
          break;
      case IB_CM_SIDR_REQ_SENT:
          /* Cancel the outstanding SIDR request MAD. */
          cm_id->state = IB_CM_IDLE;
          ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
          spin_unlock_irq(&cm_id_priv->lock);
          break;
      case IB_CM_SIDR_REQ_RCVD:
          /* Answer the pending SIDR request with a reject. */
          spin_unlock_irq(&cm_id_priv->lock);
          cm_reject_sidr_req(cm_id_priv, IB_SIDR_REJECT);
          spin_lock_irq(&cm.lock);
          /* Erase only if the node is not marked empty. */
          if (!RB_EMPTY_NODE(&cm_id_priv->sidr_id_node))
              rb_erase(&cm_id_priv->sidr_id_node,
                       &cm.remote_sidr_table);
          spin_unlock_irq(&cm.lock);
          break;
      case IB_CM_REQ_SENT:
      case IB_CM_MRA_REQ_RCVD:
          /* Cancel our REQ and send a timeout REJ carrying our node GUID. */
          ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
          spin_unlock_irq(&cm_id_priv->lock);
          ib_send_cm_rej(cm_id, IB_CM_REJ_TIMEOUT,
                         &cm_id_priv->id.device->node_guid,
                         sizeof cm_id_priv->id.device->node_guid,
                         NULL, 0);
          break;
      case IB_CM_REQ_RCVD:
          if (err == -ENOMEM) {
              /* Do not reject to allow future retries. */
              cm_reset_to_idle(cm_id_priv);
              spin_unlock_irq(&cm_id_priv->lock);
          } else {
              spin_unlock_irq(&cm_id_priv->lock);
              ib_send_cm_rej(cm_id, IB_CM_REJ_CONSUMER_DEFINED,
                             NULL, 0, NULL, 0);
          }
          break;
      case IB_CM_REP_SENT:
      case IB_CM_MRA_REP_RCVD:
          /* A REP is outstanding: cancel it, then reject as below. */
          ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
          /* Fall through */
      case IB_CM_MRA_REQ_SENT:
      case IB_CM_REP_RCVD:
      case IB_CM_MRA_REP_SENT:
          spin_unlock_irq(&cm_id_priv->lock);
          ib_send_cm_rej(cm_id, IB_CM_REJ_CONSUMER_DEFINED,
                         NULL, 0, NULL, 0);
          break;
      case IB_CM_ESTABLISHED:
          spin_unlock_irq(&cm_id_priv->lock);
          /* XRC target QPs skip the DREQ and go straight to cleanup. */
          if (cm_id_priv->qp_type == IB_QPT_XRC_TGT)
              break;
          /*
           * Send a DREQ, then re-evaluate the state from the top.
           * NOTE(review): this relies on ib_send_cm_dreq() always moving
           * the id out of IB_CM_ESTABLISHED - confirm.
           */
          ib_send_cm_dreq(cm_id, NULL, 0);
          goto retest;
      case IB_CM_DREQ_SENT:
          /* Cancel the DREQ and enter timewait while holding the id lock. */
          ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
          cm_enter_timewait(cm_id_priv);
          spin_unlock_irq(&cm_id_priv->lock);
          break;
      case IB_CM_DREQ_RCVD:
          spin_unlock_irq(&cm_id_priv->lock);
          ib_send_cm_drep(cm_id, NULL, 0);
          break;
      default:
          spin_unlock_irq(&cm_id_priv->lock);
          break;
      }

      /*
       * Unlink from the per-port primary/alternate lists, unless the
       * matching *_send_port_not_ready flag is set.
       */
      spin_lock_irq(&cm.lock);
      if (!list_empty(&cm_id_priv->altr_list) &&
          (!cm_id_priv->altr_send_port_not_ready))
          list_del(&cm_id_priv->altr_list);
      if (!list_empty(&cm_id_priv->prim_list) &&
          (!cm_id_priv->prim_send_port_not_ready))
          list_del(&cm_id_priv->prim_list);
      spin_unlock_irq(&cm.lock);

      /*
       * Remove the id from the local id table so no new lookup can find it,
       * drop our reference and wait on the completion.
       * NOTE(review): presumably cm_deref_id() completes ->comp when the
       * last reference is dropped - confirm against its definition.
       */
      cm_free_id(cm_id->local_id);
      cm_deref_id(cm_id_priv);
      wait_for_completion(&cm_id_priv->comp);

      /* Discard any work items still queued on the id. */
      while ((work = cm_dequeue_work(cm_id_priv)) != NULL)
          cm_free_work(work);

      rdma_destroy_ah_attr(&cm_id_priv->av.ah_attr);
      rdma_destroy_ah_attr(&cm_id_priv->alt_av.ah_attr);
      kfree(cm_id_priv->private_data);
      kfree(cm_id_priv);
  }
  /*
   * ib_destroy_cm_id - Destroy a communication identifier.
   * @cm_id: Identifier to destroy.
   *
   * Thin exported wrapper around cm_destroy_id() with no error context
   * (err == 0).
   */
  void ib_destroy_cm_id(struct ib_cm_id *cm_id)
  {
      const int no_error = 0;

      cm_destroy_id(cm_id, no_error);
  }
  EXPORT_SYMBOL(ib_destroy_cm_id);
  995. /**
  996. * __ib_cm_listen - Initiates listening on the specified service ID for
  997. * connection and service ID resolution requests.
  998. * @cm_id: Connection identifier associated with the listen request.
  999. * @service_id: Service identifier matched against incoming connection
  1000. * and service ID resolution requests. The service ID should be specified
  1001. * network-byte order. If set to IB_CM_ASSIGN_SERVICE_ID, the CM will
  1002. * assign a service ID to the caller.
  1003. * @service_mask: Mask applied to service ID used to listen across a
  1004. * range of service IDs. If set to 0, the service ID is matched
  1005. * exactly. This parameter is ignored if %service_id is set to
  1006. * IB_CM_ASSIGN_SERVICE_ID.
  1007. */
  1008. static int __ib_cm_listen(struct ib_cm_id *cm_id, __be64 service_id,
  1009. __be64 service_mask)
  1010. {
  1011. struct cm_id_private *cm_id_priv, *cur_cm_id_priv;
  1012. int ret = 0;
  1013. service_mask = service_mask ? service_mask : ~cpu_to_be64(0);
  1014. service_id &= service_mask;
  1015. if ((service_id & IB_SERVICE_ID_AGN_MASK) == IB_CM_ASSIGN_SERVICE_ID &&
  1016. (service_id != IB_CM_ASSIGN_SERVICE_ID))
  1017. return -EINVAL;
  1018. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  1019. if (cm_id->state != IB_CM_IDLE)
  1020. return -EINVAL;
  1021. cm_id->state = IB_CM_LISTEN;
  1022. ++cm_id_priv->listen_sharecount;
  1023. if (service_id == IB_CM_ASSIGN_SERVICE_ID) {
  1024. cm_id->service_id = cpu_to_be64(cm.listen_service_id++);
  1025. cm_id->service_mask = ~cpu_to_be64(0);
  1026. } else {
  1027. cm_id->service_id = service_id;
  1028. cm_id->service_mask = service_mask;
  1029. }
  1030. cur_cm_id_priv = cm_insert_listen(cm_id_priv);
  1031. if (cur_cm_id_priv) {
  1032. cm_id->state = IB_CM_IDLE;
  1033. --cm_id_priv->listen_sharecount;
  1034. ret = -EBUSY;
  1035. }
  1036. return ret;
  1037. }
  1038. int ib_cm_listen(struct ib_cm_id *cm_id, __be64 service_id, __be64 service_mask)
  1039. {
  1040. unsigned long flags;
  1041. int ret;
  1042. spin_lock_irqsave(&cm.lock, flags);
  1043. ret = __ib_cm_listen(cm_id, service_id, service_mask);
  1044. spin_unlock_irqrestore(&cm.lock, flags);
  1045. return ret;
  1046. }
  1047. EXPORT_SYMBOL(ib_cm_listen);
  1048. /**
  1049. * Create a new listening ib_cm_id and listen on the given service ID.
  1050. *
  1051. * If there's an existing ID listening on that same device and service ID,
  1052. * return it.
  1053. *
  1054. * @device: Device associated with the cm_id. All related communication will
  1055. * be associated with the specified device.
  1056. * @cm_handler: Callback invoked to notify the user of CM events.
  1057. * @service_id: Service identifier matched against incoming connection
  1058. * and service ID resolution requests. The service ID should be specified
  1059. * network-byte order. If set to IB_CM_ASSIGN_SERVICE_ID, the CM will
  1060. * assign a service ID to the caller.
  1061. *
  1062. * Callers should call ib_destroy_cm_id when done with the listener ID.
  1063. */
  1064. struct ib_cm_id *ib_cm_insert_listen(struct ib_device *device,
  1065. ib_cm_handler cm_handler,
  1066. __be64 service_id)
  1067. {
  1068. struct cm_id_private *cm_id_priv;
  1069. struct ib_cm_id *cm_id;
  1070. unsigned long flags;
  1071. int err = 0;
  1072. /* Create an ID in advance, since the creation may sleep */
  1073. cm_id = ib_create_cm_id(device, cm_handler, NULL);
  1074. if (IS_ERR(cm_id))
  1075. return cm_id;
  1076. spin_lock_irqsave(&cm.lock, flags);
  1077. if (service_id == IB_CM_ASSIGN_SERVICE_ID)
  1078. goto new_id;
  1079. /* Find an existing ID */
  1080. cm_id_priv = cm_find_listen(device, service_id);
  1081. if (cm_id_priv) {
  1082. if (cm_id->cm_handler != cm_handler || cm_id->context) {
  1083. /* Sharing an ib_cm_id with different handlers is not
  1084. * supported */
  1085. spin_unlock_irqrestore(&cm.lock, flags);
  1086. return ERR_PTR(-EINVAL);
  1087. }
  1088. atomic_inc(&cm_id_priv->refcount);
  1089. ++cm_id_priv->listen_sharecount;
  1090. spin_unlock_irqrestore(&cm.lock, flags);
  1091. ib_destroy_cm_id(cm_id);
  1092. cm_id = &cm_id_priv->id;
  1093. return cm_id;
  1094. }
  1095. new_id:
  1096. /* Use newly created ID */
  1097. err = __ib_cm_listen(cm_id, service_id, 0);
  1098. spin_unlock_irqrestore(&cm.lock, flags);
  1099. if (err) {
  1100. ib_destroy_cm_id(cm_id);
  1101. return ERR_PTR(err);
  1102. }
  1103. return cm_id;
  1104. }
  1105. EXPORT_SYMBOL(ib_cm_insert_listen);
  1106. static __be64 cm_form_tid(struct cm_id_private *cm_id_priv)
  1107. {
  1108. u64 hi_tid, low_tid;
  1109. hi_tid = ((u64) cm_id_priv->av.port->mad_agent->hi_tid) << 32;
  1110. low_tid = (u64)cm_id_priv->id.local_id;
  1111. return cpu_to_be64(hi_tid | low_tid);
  1112. }
  1113. static void cm_format_mad_hdr(struct ib_mad_hdr *hdr,
  1114. __be16 attr_id, __be64 tid)
  1115. {
  1116. hdr->base_version = IB_MGMT_BASE_VERSION;
  1117. hdr->mgmt_class = IB_MGMT_CLASS_CM;
  1118. hdr->class_version = IB_CM_CLASS_VERSION;
  1119. hdr->method = IB_MGMT_METHOD_SEND;
  1120. hdr->attr_id = attr_id;
  1121. hdr->tid = tid;
  1122. }
  1123. static void cm_format_req(struct cm_req_msg *req_msg,
  1124. struct cm_id_private *cm_id_priv,
  1125. struct ib_cm_req_param *param)
  1126. {
  1127. struct sa_path_rec *pri_path = param->primary_path;
  1128. struct sa_path_rec *alt_path = param->alternate_path;
  1129. bool pri_ext = false;
  1130. if (pri_path->rec_type == SA_PATH_REC_TYPE_OPA)
  1131. pri_ext = opa_is_extended_lid(pri_path->opa.dlid,
  1132. pri_path->opa.slid);
  1133. cm_format_mad_hdr(&req_msg->hdr, CM_REQ_ATTR_ID,
  1134. cm_form_tid(cm_id_priv));
  1135. req_msg->local_comm_id = cm_id_priv->id.local_id;
  1136. req_msg->service_id = param->service_id;
  1137. req_msg->local_ca_guid = cm_id_priv->id.device->node_guid;
  1138. cm_req_set_local_qpn(req_msg, cpu_to_be32(param->qp_num));
  1139. cm_req_set_init_depth(req_msg, param->initiator_depth);
  1140. cm_req_set_remote_resp_timeout(req_msg,
  1141. param->remote_cm_response_timeout);
  1142. cm_req_set_qp_type(req_msg, param->qp_type);
  1143. cm_req_set_flow_ctrl(req_msg, param->flow_control);
  1144. cm_req_set_starting_psn(req_msg, cpu_to_be32(param->starting_psn));
  1145. cm_req_set_local_resp_timeout(req_msg,
  1146. param->local_cm_response_timeout);
  1147. req_msg->pkey = param->primary_path->pkey;
  1148. cm_req_set_path_mtu(req_msg, param->primary_path->mtu);
  1149. cm_req_set_max_cm_retries(req_msg, param->max_cm_retries);
  1150. if (param->qp_type != IB_QPT_XRC_INI) {
  1151. cm_req_set_resp_res(req_msg, param->responder_resources);
  1152. cm_req_set_retry_count(req_msg, param->retry_count);
  1153. cm_req_set_rnr_retry_count(req_msg, param->rnr_retry_count);
  1154. cm_req_set_srq(req_msg, param->srq);
  1155. }
  1156. req_msg->primary_local_gid = pri_path->sgid;
  1157. req_msg->primary_remote_gid = pri_path->dgid;
  1158. if (pri_ext) {
  1159. req_msg->primary_local_gid.global.interface_id
  1160. = OPA_MAKE_ID(be32_to_cpu(pri_path->opa.slid));
  1161. req_msg->primary_remote_gid.global.interface_id
  1162. = OPA_MAKE_ID(be32_to_cpu(pri_path->opa.dlid));
  1163. }
  1164. if (pri_path->hop_limit <= 1) {
  1165. req_msg->primary_local_lid = pri_ext ? 0 :
  1166. htons(ntohl(sa_path_get_slid(pri_path)));
  1167. req_msg->primary_remote_lid = pri_ext ? 0 :
  1168. htons(ntohl(sa_path_get_dlid(pri_path)));
  1169. } else {
  1170. /* Work-around until there's a way to obtain remote LID info */
  1171. req_msg->primary_local_lid = IB_LID_PERMISSIVE;
  1172. req_msg->primary_remote_lid = IB_LID_PERMISSIVE;
  1173. }
  1174. cm_req_set_primary_flow_label(req_msg, pri_path->flow_label);
  1175. cm_req_set_primary_packet_rate(req_msg, pri_path->rate);
  1176. req_msg->primary_traffic_class = pri_path->traffic_class;
  1177. req_msg->primary_hop_limit = pri_path->hop_limit;
  1178. cm_req_set_primary_sl(req_msg, pri_path->sl);
  1179. cm_req_set_primary_subnet_local(req_msg, (pri_path->hop_limit <= 1));
  1180. cm_req_set_primary_local_ack_timeout(req_msg,
  1181. cm_ack_timeout(cm_id_priv->av.port->cm_dev->ack_delay,
  1182. pri_path->packet_life_time));
  1183. if (alt_path) {
  1184. bool alt_ext = false;
  1185. if (alt_path->rec_type == SA_PATH_REC_TYPE_OPA)
  1186. alt_ext = opa_is_extended_lid(alt_path->opa.dlid,
  1187. alt_path->opa.slid);
  1188. req_msg->alt_local_gid = alt_path->sgid;
  1189. req_msg->alt_remote_gid = alt_path->dgid;
  1190. if (alt_ext) {
  1191. req_msg->alt_local_gid.global.interface_id
  1192. = OPA_MAKE_ID(be32_to_cpu(alt_path->opa.slid));
  1193. req_msg->alt_remote_gid.global.interface_id
  1194. = OPA_MAKE_ID(be32_to_cpu(alt_path->opa.dlid));
  1195. }
  1196. if (alt_path->hop_limit <= 1) {
  1197. req_msg->alt_local_lid = alt_ext ? 0 :
  1198. htons(ntohl(sa_path_get_slid(alt_path)));
  1199. req_msg->alt_remote_lid = alt_ext ? 0 :
  1200. htons(ntohl(sa_path_get_dlid(alt_path)));
  1201. } else {
  1202. req_msg->alt_local_lid = IB_LID_PERMISSIVE;
  1203. req_msg->alt_remote_lid = IB_LID_PERMISSIVE;
  1204. }
  1205. cm_req_set_alt_flow_label(req_msg,
  1206. alt_path->flow_label);
  1207. cm_req_set_alt_packet_rate(req_msg, alt_path->rate);
  1208. req_msg->alt_traffic_class = alt_path->traffic_class;
  1209. req_msg->alt_hop_limit = alt_path->hop_limit;
  1210. cm_req_set_alt_sl(req_msg, alt_path->sl);
  1211. cm_req_set_alt_subnet_local(req_msg, (alt_path->hop_limit <= 1));
  1212. cm_req_set_alt_local_ack_timeout(req_msg,
  1213. cm_ack_timeout(cm_id_priv->av.port->cm_dev->ack_delay,
  1214. alt_path->packet_life_time));
  1215. }
  1216. if (param->private_data && param->private_data_len)
  1217. memcpy(req_msg->private_data, param->private_data,
  1218. param->private_data_len);
  1219. }
  1220. static int cm_validate_req_param(struct ib_cm_req_param *param)
  1221. {
  1222. /* peer-to-peer not supported */
  1223. if (param->peer_to_peer)
  1224. return -EINVAL;
  1225. if (!param->primary_path)
  1226. return -EINVAL;
  1227. if (param->qp_type != IB_QPT_RC && param->qp_type != IB_QPT_UC &&
  1228. param->qp_type != IB_QPT_XRC_INI)
  1229. return -EINVAL;
  1230. if (param->private_data &&
  1231. param->private_data_len > IB_CM_REQ_PRIVATE_DATA_SIZE)
  1232. return -EINVAL;
  1233. if (param->alternate_path &&
  1234. (param->alternate_path->pkey != param->primary_path->pkey ||
  1235. param->alternate_path->mtu != param->primary_path->mtu))
  1236. return -EINVAL;
  1237. return 0;
  1238. }
  1239. int ib_send_cm_req(struct ib_cm_id *cm_id,
  1240. struct ib_cm_req_param *param)
  1241. {
  1242. struct cm_id_private *cm_id_priv;
  1243. struct cm_req_msg *req_msg;
  1244. unsigned long flags;
  1245. int ret;
  1246. ret = cm_validate_req_param(param);
  1247. if (ret)
  1248. return ret;
  1249. /* Verify that we're not in timewait. */
  1250. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  1251. spin_lock_irqsave(&cm_id_priv->lock, flags);
  1252. if (cm_id->state != IB_CM_IDLE) {
  1253. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1254. ret = -EINVAL;
  1255. goto out;
  1256. }
  1257. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1258. cm_id_priv->timewait_info = cm_create_timewait_info(cm_id_priv->
  1259. id.local_id);
  1260. if (IS_ERR(cm_id_priv->timewait_info)) {
  1261. ret = PTR_ERR(cm_id_priv->timewait_info);
  1262. goto out;
  1263. }
  1264. ret = cm_init_av_by_path(param->primary_path,
  1265. param->ppath_sgid_attr, &cm_id_priv->av,
  1266. cm_id_priv);
  1267. if (ret)
  1268. goto error1;
  1269. if (param->alternate_path) {
  1270. ret = cm_init_av_by_path(param->alternate_path, NULL,
  1271. &cm_id_priv->alt_av, cm_id_priv);
  1272. if (ret)
  1273. goto error1;
  1274. }
  1275. cm_id->service_id = param->service_id;
  1276. cm_id->service_mask = ~cpu_to_be64(0);
  1277. cm_id_priv->timeout_ms = cm_convert_to_ms(
  1278. param->primary_path->packet_life_time) * 2 +
  1279. cm_convert_to_ms(
  1280. param->remote_cm_response_timeout);
  1281. cm_id_priv->max_cm_retries = param->max_cm_retries;
  1282. cm_id_priv->initiator_depth = param->initiator_depth;
  1283. cm_id_priv->responder_resources = param->responder_resources;
  1284. cm_id_priv->retry_count = param->retry_count;
  1285. cm_id_priv->path_mtu = param->primary_path->mtu;
  1286. cm_id_priv->pkey = param->primary_path->pkey;
  1287. cm_id_priv->qp_type = param->qp_type;
  1288. ret = cm_alloc_msg(cm_id_priv, &cm_id_priv->msg);
  1289. if (ret)
  1290. goto error1;
  1291. req_msg = (struct cm_req_msg *) cm_id_priv->msg->mad;
  1292. cm_format_req(req_msg, cm_id_priv, param);
  1293. cm_id_priv->tid = req_msg->hdr.tid;
  1294. cm_id_priv->msg->timeout_ms = cm_id_priv->timeout_ms;
  1295. cm_id_priv->msg->context[1] = (void *) (unsigned long) IB_CM_REQ_SENT;
  1296. cm_id_priv->local_qpn = cm_req_get_local_qpn(req_msg);
  1297. cm_id_priv->rq_psn = cm_req_get_starting_psn(req_msg);
  1298. spin_lock_irqsave(&cm_id_priv->lock, flags);
  1299. ret = ib_post_send_mad(cm_id_priv->msg, NULL);
  1300. if (ret) {
  1301. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1302. goto error2;
  1303. }
  1304. BUG_ON(cm_id->state != IB_CM_IDLE);
  1305. cm_id->state = IB_CM_REQ_SENT;
  1306. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1307. return 0;
  1308. error2: cm_free_msg(cm_id_priv->msg);
  1309. error1: kfree(cm_id_priv->timewait_info);
  1310. out: return ret;
  1311. }
  1312. EXPORT_SYMBOL(ib_send_cm_req);
  1313. static int cm_issue_rej(struct cm_port *port,
  1314. struct ib_mad_recv_wc *mad_recv_wc,
  1315. enum ib_cm_rej_reason reason,
  1316. enum cm_msg_response msg_rejected,
  1317. void *ari, u8 ari_length)
  1318. {
  1319. struct ib_mad_send_buf *msg = NULL;
  1320. struct cm_rej_msg *rej_msg, *rcv_msg;
  1321. int ret;
  1322. ret = cm_alloc_response_msg(port, mad_recv_wc, &msg);
  1323. if (ret)
  1324. return ret;
  1325. /* We just need common CM header information. Cast to any message. */
  1326. rcv_msg = (struct cm_rej_msg *) mad_recv_wc->recv_buf.mad;
  1327. rej_msg = (struct cm_rej_msg *) msg->mad;
  1328. cm_format_mad_hdr(&rej_msg->hdr, CM_REJ_ATTR_ID, rcv_msg->hdr.tid);
  1329. rej_msg->remote_comm_id = rcv_msg->local_comm_id;
  1330. rej_msg->local_comm_id = rcv_msg->remote_comm_id;
  1331. cm_rej_set_msg_rejected(rej_msg, msg_rejected);
  1332. rej_msg->reason = cpu_to_be16(reason);
  1333. if (ari && ari_length) {
  1334. cm_rej_set_reject_info_len(rej_msg, ari_length);
  1335. memcpy(rej_msg->ari, ari, ari_length);
  1336. }
  1337. ret = ib_post_send_mad(msg, NULL);
  1338. if (ret)
  1339. cm_free_msg(msg);
  1340. return ret;
  1341. }
  1342. static inline int cm_is_active_peer(__be64 local_ca_guid, __be64 remote_ca_guid,
  1343. __be32 local_qpn, __be32 remote_qpn)
  1344. {
  1345. return (be64_to_cpu(local_ca_guid) > be64_to_cpu(remote_ca_guid) ||
  1346. ((local_ca_guid == remote_ca_guid) &&
  1347. (be32_to_cpu(local_qpn) > be32_to_cpu(remote_qpn))));
  1348. }
  1349. static bool cm_req_has_alt_path(struct cm_req_msg *req_msg)
  1350. {
  1351. return ((req_msg->alt_local_lid) ||
  1352. (ib_is_opa_gid(&req_msg->alt_local_gid)));
  1353. }
  1354. static void cm_path_set_rec_type(struct ib_device *ib_device, u8 port_num,
  1355. struct sa_path_rec *path, union ib_gid *gid)
  1356. {
  1357. if (ib_is_opa_gid(gid) && rdma_cap_opa_ah(ib_device, port_num))
  1358. path->rec_type = SA_PATH_REC_TYPE_OPA;
  1359. else
  1360. path->rec_type = SA_PATH_REC_TYPE_IB;
  1361. }
  1362. static void cm_format_path_lid_from_req(struct cm_req_msg *req_msg,
  1363. struct sa_path_rec *primary_path,
  1364. struct sa_path_rec *alt_path)
  1365. {
  1366. u32 lid;
  1367. if (primary_path->rec_type != SA_PATH_REC_TYPE_OPA) {
  1368. sa_path_set_dlid(primary_path,
  1369. ntohs(req_msg->primary_local_lid));
  1370. sa_path_set_slid(primary_path,
  1371. ntohs(req_msg->primary_remote_lid));
  1372. } else {
  1373. lid = opa_get_lid_from_gid(&req_msg->primary_local_gid);
  1374. sa_path_set_dlid(primary_path, lid);
  1375. lid = opa_get_lid_from_gid(&req_msg->primary_remote_gid);
  1376. sa_path_set_slid(primary_path, lid);
  1377. }
  1378. if (!cm_req_has_alt_path(req_msg))
  1379. return;
  1380. if (alt_path->rec_type != SA_PATH_REC_TYPE_OPA) {
  1381. sa_path_set_dlid(alt_path, ntohs(req_msg->alt_local_lid));
  1382. sa_path_set_slid(alt_path, ntohs(req_msg->alt_remote_lid));
  1383. } else {
  1384. lid = opa_get_lid_from_gid(&req_msg->alt_local_gid);
  1385. sa_path_set_dlid(alt_path, lid);
  1386. lid = opa_get_lid_from_gid(&req_msg->alt_remote_gid);
  1387. sa_path_set_slid(alt_path, lid);
  1388. }
  1389. }
  1390. static void cm_format_paths_from_req(struct cm_req_msg *req_msg,
  1391. struct sa_path_rec *primary_path,
  1392. struct sa_path_rec *alt_path)
  1393. {
  1394. primary_path->dgid = req_msg->primary_local_gid;
  1395. primary_path->sgid = req_msg->primary_remote_gid;
  1396. primary_path->flow_label = cm_req_get_primary_flow_label(req_msg);
  1397. primary_path->hop_limit = req_msg->primary_hop_limit;
  1398. primary_path->traffic_class = req_msg->primary_traffic_class;
  1399. primary_path->reversible = 1;
  1400. primary_path->pkey = req_msg->pkey;
  1401. primary_path->sl = cm_req_get_primary_sl(req_msg);
  1402. primary_path->mtu_selector = IB_SA_EQ;
  1403. primary_path->mtu = cm_req_get_path_mtu(req_msg);
  1404. primary_path->rate_selector = IB_SA_EQ;
  1405. primary_path->rate = cm_req_get_primary_packet_rate(req_msg);
  1406. primary_path->packet_life_time_selector = IB_SA_EQ;
  1407. primary_path->packet_life_time =
  1408. cm_req_get_primary_local_ack_timeout(req_msg);
  1409. primary_path->packet_life_time -= (primary_path->packet_life_time > 0);
  1410. primary_path->service_id = req_msg->service_id;
  1411. if (sa_path_is_roce(primary_path))
  1412. primary_path->roce.route_resolved = false;
  1413. if (cm_req_has_alt_path(req_msg)) {
  1414. alt_path->dgid = req_msg->alt_local_gid;
  1415. alt_path->sgid = req_msg->alt_remote_gid;
  1416. alt_path->flow_label = cm_req_get_alt_flow_label(req_msg);
  1417. alt_path->hop_limit = req_msg->alt_hop_limit;
  1418. alt_path->traffic_class = req_msg->alt_traffic_class;
  1419. alt_path->reversible = 1;
  1420. alt_path->pkey = req_msg->pkey;
  1421. alt_path->sl = cm_req_get_alt_sl(req_msg);
  1422. alt_path->mtu_selector = IB_SA_EQ;
  1423. alt_path->mtu = cm_req_get_path_mtu(req_msg);
  1424. alt_path->rate_selector = IB_SA_EQ;
  1425. alt_path->rate = cm_req_get_alt_packet_rate(req_msg);
  1426. alt_path->packet_life_time_selector = IB_SA_EQ;
  1427. alt_path->packet_life_time =
  1428. cm_req_get_alt_local_ack_timeout(req_msg);
  1429. alt_path->packet_life_time -= (alt_path->packet_life_time > 0);
  1430. alt_path->service_id = req_msg->service_id;
  1431. if (sa_path_is_roce(alt_path))
  1432. alt_path->roce.route_resolved = false;
  1433. }
  1434. cm_format_path_lid_from_req(req_msg, primary_path, alt_path);
  1435. }
  1436. static u16 cm_get_bth_pkey(struct cm_work *work)
  1437. {
  1438. struct ib_device *ib_dev = work->port->cm_dev->ib_device;
  1439. u8 port_num = work->port->port_num;
  1440. u16 pkey_index = work->mad_recv_wc->wc->pkey_index;
  1441. u16 pkey;
  1442. int ret;
  1443. ret = ib_get_cached_pkey(ib_dev, port_num, pkey_index, &pkey);
  1444. if (ret) {
  1445. dev_warn_ratelimited(&ib_dev->dev, "ib_cm: Couldn't retrieve pkey for incoming request (port %d, pkey index %d). %d\n",
  1446. port_num, pkey_index, ret);
  1447. return 0;
  1448. }
  1449. return pkey;
  1450. }
  1451. /**
  1452. * Convert OPA SGID to IB SGID
  1453. * ULPs (such as IPoIB) do not understand OPA GIDs and will
  1454. * reject them as the local_gid will not match the sgid. Therefore,
  1455. * change the pathrec's SGID to an IB SGID.
  1456. *
  1457. * @work: Work completion
  1458. * @path: Path record
  1459. */
  1460. static void cm_opa_to_ib_sgid(struct cm_work *work,
  1461. struct sa_path_rec *path)
  1462. {
  1463. struct ib_device *dev = work->port->cm_dev->ib_device;
  1464. u8 port_num = work->port->port_num;
  1465. if (rdma_cap_opa_ah(dev, port_num) &&
  1466. (ib_is_opa_gid(&path->sgid))) {
  1467. union ib_gid sgid;
  1468. if (rdma_query_gid(dev, port_num, 0, &sgid)) {
  1469. dev_warn(&dev->dev,
  1470. "Error updating sgid in CM request\n");
  1471. return;
  1472. }
  1473. path->sgid = sgid;
  1474. }
  1475. }
  1476. static void cm_format_req_event(struct cm_work *work,
  1477. struct cm_id_private *cm_id_priv,
  1478. struct ib_cm_id *listen_id)
  1479. {
  1480. struct cm_req_msg *req_msg;
  1481. struct ib_cm_req_event_param *param;
  1482. req_msg = (struct cm_req_msg *)work->mad_recv_wc->recv_buf.mad;
  1483. param = &work->cm_event.param.req_rcvd;
  1484. param->listen_id = listen_id;
  1485. param->bth_pkey = cm_get_bth_pkey(work);
  1486. param->port = cm_id_priv->av.port->port_num;
  1487. param->primary_path = &work->path[0];
  1488. cm_opa_to_ib_sgid(work, param->primary_path);
  1489. if (cm_req_has_alt_path(req_msg)) {
  1490. param->alternate_path = &work->path[1];
  1491. cm_opa_to_ib_sgid(work, param->alternate_path);
  1492. } else {
  1493. param->alternate_path = NULL;
  1494. }
  1495. param->remote_ca_guid = req_msg->local_ca_guid;
  1496. param->remote_qkey = be32_to_cpu(req_msg->local_qkey);
  1497. param->remote_qpn = be32_to_cpu(cm_req_get_local_qpn(req_msg));
  1498. param->qp_type = cm_req_get_qp_type(req_msg);
  1499. param->starting_psn = be32_to_cpu(cm_req_get_starting_psn(req_msg));
  1500. param->responder_resources = cm_req_get_init_depth(req_msg);
  1501. param->initiator_depth = cm_req_get_resp_res(req_msg);
  1502. param->local_cm_response_timeout =
  1503. cm_req_get_remote_resp_timeout(req_msg);
  1504. param->flow_control = cm_req_get_flow_ctrl(req_msg);
  1505. param->remote_cm_response_timeout =
  1506. cm_req_get_local_resp_timeout(req_msg);
  1507. param->retry_count = cm_req_get_retry_count(req_msg);
  1508. param->rnr_retry_count = cm_req_get_rnr_retry_count(req_msg);
  1509. param->srq = cm_req_get_srq(req_msg);
  1510. param->ppath_sgid_attr = cm_id_priv->av.ah_attr.grh.sgid_attr;
  1511. work->cm_event.private_data = &req_msg->private_data;
  1512. }
  1513. static void cm_process_work(struct cm_id_private *cm_id_priv,
  1514. struct cm_work *work)
  1515. {
  1516. int ret;
  1517. /* We will typically only have the current event to report. */
  1518. ret = cm_id_priv->id.cm_handler(&cm_id_priv->id, &work->cm_event);
  1519. cm_free_work(work);
  1520. while (!ret && !atomic_add_negative(-1, &cm_id_priv->work_count)) {
  1521. spin_lock_irq(&cm_id_priv->lock);
  1522. work = cm_dequeue_work(cm_id_priv);
  1523. spin_unlock_irq(&cm_id_priv->lock);
  1524. if (!work)
  1525. return;
  1526. ret = cm_id_priv->id.cm_handler(&cm_id_priv->id,
  1527. &work->cm_event);
  1528. cm_free_work(work);
  1529. }
  1530. cm_deref_id(cm_id_priv);
  1531. if (ret)
  1532. cm_destroy_id(&cm_id_priv->id, ret);
  1533. }
  1534. static void cm_format_mra(struct cm_mra_msg *mra_msg,
  1535. struct cm_id_private *cm_id_priv,
  1536. enum cm_msg_response msg_mraed, u8 service_timeout,
  1537. const void *private_data, u8 private_data_len)
  1538. {
  1539. cm_format_mad_hdr(&mra_msg->hdr, CM_MRA_ATTR_ID, cm_id_priv->tid);
  1540. cm_mra_set_msg_mraed(mra_msg, msg_mraed);
  1541. mra_msg->local_comm_id = cm_id_priv->id.local_id;
  1542. mra_msg->remote_comm_id = cm_id_priv->id.remote_id;
  1543. cm_mra_set_service_timeout(mra_msg, service_timeout);
  1544. if (private_data && private_data_len)
  1545. memcpy(mra_msg->private_data, private_data, private_data_len);
  1546. }
  1547. static void cm_format_rej(struct cm_rej_msg *rej_msg,
  1548. struct cm_id_private *cm_id_priv,
  1549. enum ib_cm_rej_reason reason,
  1550. void *ari,
  1551. u8 ari_length,
  1552. const void *private_data,
  1553. u8 private_data_len)
  1554. {
  1555. cm_format_mad_hdr(&rej_msg->hdr, CM_REJ_ATTR_ID, cm_id_priv->tid);
  1556. rej_msg->remote_comm_id = cm_id_priv->id.remote_id;
  1557. switch(cm_id_priv->id.state) {
  1558. case IB_CM_REQ_RCVD:
  1559. rej_msg->local_comm_id = 0;
  1560. cm_rej_set_msg_rejected(rej_msg, CM_MSG_RESPONSE_REQ);
  1561. break;
  1562. case IB_CM_MRA_REQ_SENT:
  1563. rej_msg->local_comm_id = cm_id_priv->id.local_id;
  1564. cm_rej_set_msg_rejected(rej_msg, CM_MSG_RESPONSE_REQ);
  1565. break;
  1566. case IB_CM_REP_RCVD:
  1567. case IB_CM_MRA_REP_SENT:
  1568. rej_msg->local_comm_id = cm_id_priv->id.local_id;
  1569. cm_rej_set_msg_rejected(rej_msg, CM_MSG_RESPONSE_REP);
  1570. break;
  1571. default:
  1572. rej_msg->local_comm_id = cm_id_priv->id.local_id;
  1573. cm_rej_set_msg_rejected(rej_msg, CM_MSG_RESPONSE_OTHER);
  1574. break;
  1575. }
  1576. rej_msg->reason = cpu_to_be16(reason);
  1577. if (ari && ari_length) {
  1578. cm_rej_set_reject_info_len(rej_msg, ari_length);
  1579. memcpy(rej_msg->ari, ari, ari_length);
  1580. }
  1581. if (private_data && private_data_len)
  1582. memcpy(rej_msg->private_data, private_data, private_data_len);
  1583. }
  1584. static void cm_dup_req_handler(struct cm_work *work,
  1585. struct cm_id_private *cm_id_priv)
  1586. {
  1587. struct ib_mad_send_buf *msg = NULL;
  1588. int ret;
  1589. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  1590. counter[CM_REQ_COUNTER]);
  1591. /* Quick state check to discard duplicate REQs. */
  1592. if (cm_id_priv->id.state == IB_CM_REQ_RCVD)
  1593. return;
  1594. ret = cm_alloc_response_msg(work->port, work->mad_recv_wc, &msg);
  1595. if (ret)
  1596. return;
  1597. spin_lock_irq(&cm_id_priv->lock);
  1598. switch (cm_id_priv->id.state) {
  1599. case IB_CM_MRA_REQ_SENT:
  1600. cm_format_mra((struct cm_mra_msg *) msg->mad, cm_id_priv,
  1601. CM_MSG_RESPONSE_REQ, cm_id_priv->service_timeout,
  1602. cm_id_priv->private_data,
  1603. cm_id_priv->private_data_len);
  1604. break;
  1605. case IB_CM_TIMEWAIT:
  1606. cm_format_rej((struct cm_rej_msg *) msg->mad, cm_id_priv,
  1607. IB_CM_REJ_STALE_CONN, NULL, 0, NULL, 0);
  1608. break;
  1609. default:
  1610. goto unlock;
  1611. }
  1612. spin_unlock_irq(&cm_id_priv->lock);
  1613. ret = ib_post_send_mad(msg, NULL);
  1614. if (ret)
  1615. goto free;
  1616. return;
  1617. unlock: spin_unlock_irq(&cm_id_priv->lock);
  1618. free: cm_free_msg(msg);
  1619. }
  1620. static struct cm_id_private * cm_match_req(struct cm_work *work,
  1621. struct cm_id_private *cm_id_priv)
  1622. {
  1623. struct cm_id_private *listen_cm_id_priv, *cur_cm_id_priv;
  1624. struct cm_timewait_info *timewait_info;
  1625. struct cm_req_msg *req_msg;
  1626. struct ib_cm_id *cm_id;
  1627. req_msg = (struct cm_req_msg *)work->mad_recv_wc->recv_buf.mad;
  1628. /* Check for possible duplicate REQ. */
  1629. spin_lock_irq(&cm.lock);
  1630. timewait_info = cm_insert_remote_id(cm_id_priv->timewait_info);
  1631. if (timewait_info) {
  1632. cur_cm_id_priv = cm_get_id(timewait_info->work.local_id,
  1633. timewait_info->work.remote_id);
  1634. spin_unlock_irq(&cm.lock);
  1635. if (cur_cm_id_priv) {
  1636. cm_dup_req_handler(work, cur_cm_id_priv);
  1637. cm_deref_id(cur_cm_id_priv);
  1638. }
  1639. return NULL;
  1640. }
  1641. /* Check for stale connections. */
  1642. timewait_info = cm_insert_remote_qpn(cm_id_priv->timewait_info);
  1643. if (timewait_info) {
  1644. cm_cleanup_timewait(cm_id_priv->timewait_info);
  1645. cur_cm_id_priv = cm_get_id(timewait_info->work.local_id,
  1646. timewait_info->work.remote_id);
  1647. spin_unlock_irq(&cm.lock);
  1648. cm_issue_rej(work->port, work->mad_recv_wc,
  1649. IB_CM_REJ_STALE_CONN, CM_MSG_RESPONSE_REQ,
  1650. NULL, 0);
  1651. if (cur_cm_id_priv) {
  1652. cm_id = &cur_cm_id_priv->id;
  1653. ib_send_cm_dreq(cm_id, NULL, 0);
  1654. cm_deref_id(cur_cm_id_priv);
  1655. }
  1656. return NULL;
  1657. }
  1658. /* Find matching listen request. */
  1659. listen_cm_id_priv = cm_find_listen(cm_id_priv->id.device,
  1660. req_msg->service_id);
  1661. if (!listen_cm_id_priv) {
  1662. cm_cleanup_timewait(cm_id_priv->timewait_info);
  1663. spin_unlock_irq(&cm.lock);
  1664. cm_issue_rej(work->port, work->mad_recv_wc,
  1665. IB_CM_REJ_INVALID_SERVICE_ID, CM_MSG_RESPONSE_REQ,
  1666. NULL, 0);
  1667. goto out;
  1668. }
  1669. atomic_inc(&listen_cm_id_priv->refcount);
  1670. atomic_inc(&cm_id_priv->refcount);
  1671. cm_id_priv->id.state = IB_CM_REQ_RCVD;
  1672. atomic_inc(&cm_id_priv->work_count);
  1673. spin_unlock_irq(&cm.lock);
  1674. out:
  1675. return listen_cm_id_priv;
  1676. }
  1677. /*
  1678. * Work-around for inter-subnet connections. If the LIDs are permissive,
  1679. * we need to override the LID/SL data in the REQ with the LID information
  1680. * in the work completion.
  1681. */
  1682. static void cm_process_routed_req(struct cm_req_msg *req_msg, struct ib_wc *wc)
  1683. {
  1684. if (!cm_req_get_primary_subnet_local(req_msg)) {
  1685. if (req_msg->primary_local_lid == IB_LID_PERMISSIVE) {
  1686. req_msg->primary_local_lid = ib_lid_be16(wc->slid);
  1687. cm_req_set_primary_sl(req_msg, wc->sl);
  1688. }
  1689. if (req_msg->primary_remote_lid == IB_LID_PERMISSIVE)
  1690. req_msg->primary_remote_lid = cpu_to_be16(wc->dlid_path_bits);
  1691. }
  1692. if (!cm_req_get_alt_subnet_local(req_msg)) {
  1693. if (req_msg->alt_local_lid == IB_LID_PERMISSIVE) {
  1694. req_msg->alt_local_lid = ib_lid_be16(wc->slid);
  1695. cm_req_set_alt_sl(req_msg, wc->sl);
  1696. }
  1697. if (req_msg->alt_remote_lid == IB_LID_PERMISSIVE)
  1698. req_msg->alt_remote_lid = cpu_to_be16(wc->dlid_path_bits);
  1699. }
  1700. }
  1701. static int cm_req_handler(struct cm_work *work)
  1702. {
  1703. struct ib_cm_id *cm_id;
  1704. struct cm_id_private *cm_id_priv, *listen_cm_id_priv;
  1705. struct cm_req_msg *req_msg;
  1706. const struct ib_global_route *grh;
  1707. const struct ib_gid_attr *gid_attr;
  1708. int ret;
  1709. req_msg = (struct cm_req_msg *)work->mad_recv_wc->recv_buf.mad;
  1710. cm_id = ib_create_cm_id(work->port->cm_dev->ib_device, NULL, NULL);
  1711. if (IS_ERR(cm_id))
  1712. return PTR_ERR(cm_id);
  1713. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  1714. cm_id_priv->id.remote_id = req_msg->local_comm_id;
  1715. ret = cm_init_av_for_response(work->port, work->mad_recv_wc->wc,
  1716. work->mad_recv_wc->recv_buf.grh,
  1717. &cm_id_priv->av);
  1718. if (ret)
  1719. goto destroy;
  1720. cm_id_priv->timewait_info = cm_create_timewait_info(cm_id_priv->
  1721. id.local_id);
  1722. if (IS_ERR(cm_id_priv->timewait_info)) {
  1723. ret = PTR_ERR(cm_id_priv->timewait_info);
  1724. goto destroy;
  1725. }
  1726. cm_id_priv->timewait_info->work.remote_id = req_msg->local_comm_id;
  1727. cm_id_priv->timewait_info->remote_ca_guid = req_msg->local_ca_guid;
  1728. cm_id_priv->timewait_info->remote_qpn = cm_req_get_local_qpn(req_msg);
  1729. listen_cm_id_priv = cm_match_req(work, cm_id_priv);
  1730. if (!listen_cm_id_priv) {
  1731. pr_debug("%s: local_id %d, no listen_cm_id_priv\n", __func__,
  1732. be32_to_cpu(cm_id->local_id));
  1733. ret = -EINVAL;
  1734. goto free_timeinfo;
  1735. }
  1736. cm_id_priv->id.cm_handler = listen_cm_id_priv->id.cm_handler;
  1737. cm_id_priv->id.context = listen_cm_id_priv->id.context;
  1738. cm_id_priv->id.service_id = req_msg->service_id;
  1739. cm_id_priv->id.service_mask = ~cpu_to_be64(0);
  1740. cm_process_routed_req(req_msg, work->mad_recv_wc->wc);
  1741. memset(&work->path[0], 0, sizeof(work->path[0]));
  1742. if (cm_req_has_alt_path(req_msg))
  1743. memset(&work->path[1], 0, sizeof(work->path[1]));
  1744. grh = rdma_ah_read_grh(&cm_id_priv->av.ah_attr);
  1745. gid_attr = grh->sgid_attr;
  1746. if (gid_attr && gid_attr->ndev) {
  1747. work->path[0].rec_type =
  1748. sa_conv_gid_to_pathrec_type(gid_attr->gid_type);
  1749. } else {
  1750. /* If no GID attribute or ndev is null, it is not RoCE. */
  1751. cm_path_set_rec_type(work->port->cm_dev->ib_device,
  1752. work->port->port_num,
  1753. &work->path[0],
  1754. &req_msg->primary_local_gid);
  1755. }
  1756. if (cm_req_has_alt_path(req_msg))
  1757. work->path[1].rec_type = work->path[0].rec_type;
  1758. cm_format_paths_from_req(req_msg, &work->path[0],
  1759. &work->path[1]);
  1760. if (cm_id_priv->av.ah_attr.type == RDMA_AH_ATTR_TYPE_ROCE)
  1761. sa_path_set_dmac(&work->path[0],
  1762. cm_id_priv->av.ah_attr.roce.dmac);
  1763. work->path[0].hop_limit = grh->hop_limit;
  1764. ret = cm_init_av_by_path(&work->path[0], gid_attr, &cm_id_priv->av,
  1765. cm_id_priv);
  1766. if (ret) {
  1767. int err;
  1768. err = rdma_query_gid(work->port->cm_dev->ib_device,
  1769. work->port->port_num, 0,
  1770. &work->path[0].sgid);
  1771. if (err)
  1772. ib_send_cm_rej(cm_id, IB_CM_REJ_INVALID_GID,
  1773. NULL, 0, NULL, 0);
  1774. else
  1775. ib_send_cm_rej(cm_id, IB_CM_REJ_INVALID_GID,
  1776. &work->path[0].sgid,
  1777. sizeof(work->path[0].sgid),
  1778. NULL, 0);
  1779. goto rejected;
  1780. }
  1781. if (cm_req_has_alt_path(req_msg)) {
  1782. ret = cm_init_av_by_path(&work->path[1], NULL,
  1783. &cm_id_priv->alt_av, cm_id_priv);
  1784. if (ret) {
  1785. ib_send_cm_rej(cm_id, IB_CM_REJ_INVALID_ALT_GID,
  1786. &work->path[0].sgid,
  1787. sizeof(work->path[0].sgid), NULL, 0);
  1788. goto rejected;
  1789. }
  1790. }
  1791. cm_id_priv->tid = req_msg->hdr.tid;
  1792. cm_id_priv->timeout_ms = cm_convert_to_ms(
  1793. cm_req_get_local_resp_timeout(req_msg));
  1794. cm_id_priv->max_cm_retries = cm_req_get_max_cm_retries(req_msg);
  1795. cm_id_priv->remote_qpn = cm_req_get_local_qpn(req_msg);
  1796. cm_id_priv->initiator_depth = cm_req_get_resp_res(req_msg);
  1797. cm_id_priv->responder_resources = cm_req_get_init_depth(req_msg);
  1798. cm_id_priv->path_mtu = cm_req_get_path_mtu(req_msg);
  1799. cm_id_priv->pkey = req_msg->pkey;
  1800. cm_id_priv->sq_psn = cm_req_get_starting_psn(req_msg);
  1801. cm_id_priv->retry_count = cm_req_get_retry_count(req_msg);
  1802. cm_id_priv->rnr_retry_count = cm_req_get_rnr_retry_count(req_msg);
  1803. cm_id_priv->qp_type = cm_req_get_qp_type(req_msg);
  1804. cm_format_req_event(work, cm_id_priv, &listen_cm_id_priv->id);
  1805. cm_process_work(cm_id_priv, work);
  1806. cm_deref_id(listen_cm_id_priv);
  1807. return 0;
  1808. rejected:
  1809. atomic_dec(&cm_id_priv->refcount);
  1810. cm_deref_id(listen_cm_id_priv);
  1811. free_timeinfo:
  1812. kfree(cm_id_priv->timewait_info);
  1813. destroy:
  1814. ib_destroy_cm_id(cm_id);
  1815. return ret;
  1816. }
  1817. static void cm_format_rep(struct cm_rep_msg *rep_msg,
  1818. struct cm_id_private *cm_id_priv,
  1819. struct ib_cm_rep_param *param)
  1820. {
  1821. cm_format_mad_hdr(&rep_msg->hdr, CM_REP_ATTR_ID, cm_id_priv->tid);
  1822. rep_msg->local_comm_id = cm_id_priv->id.local_id;
  1823. rep_msg->remote_comm_id = cm_id_priv->id.remote_id;
  1824. cm_rep_set_starting_psn(rep_msg, cpu_to_be32(param->starting_psn));
  1825. rep_msg->resp_resources = param->responder_resources;
  1826. cm_rep_set_target_ack_delay(rep_msg,
  1827. cm_id_priv->av.port->cm_dev->ack_delay);
  1828. cm_rep_set_failover(rep_msg, param->failover_accepted);
  1829. cm_rep_set_rnr_retry_count(rep_msg, param->rnr_retry_count);
  1830. rep_msg->local_ca_guid = cm_id_priv->id.device->node_guid;
  1831. if (cm_id_priv->qp_type != IB_QPT_XRC_TGT) {
  1832. rep_msg->initiator_depth = param->initiator_depth;
  1833. cm_rep_set_flow_ctrl(rep_msg, param->flow_control);
  1834. cm_rep_set_srq(rep_msg, param->srq);
  1835. cm_rep_set_local_qpn(rep_msg, cpu_to_be32(param->qp_num));
  1836. } else {
  1837. cm_rep_set_srq(rep_msg, 1);
  1838. cm_rep_set_local_eecn(rep_msg, cpu_to_be32(param->qp_num));
  1839. }
  1840. if (param->private_data && param->private_data_len)
  1841. memcpy(rep_msg->private_data, param->private_data,
  1842. param->private_data_len);
  1843. }
  1844. int ib_send_cm_rep(struct ib_cm_id *cm_id,
  1845. struct ib_cm_rep_param *param)
  1846. {
  1847. struct cm_id_private *cm_id_priv;
  1848. struct ib_mad_send_buf *msg;
  1849. struct cm_rep_msg *rep_msg;
  1850. unsigned long flags;
  1851. int ret;
  1852. if (param->private_data &&
  1853. param->private_data_len > IB_CM_REP_PRIVATE_DATA_SIZE)
  1854. return -EINVAL;
  1855. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  1856. spin_lock_irqsave(&cm_id_priv->lock, flags);
  1857. if (cm_id->state != IB_CM_REQ_RCVD &&
  1858. cm_id->state != IB_CM_MRA_REQ_SENT) {
  1859. pr_debug("%s: local_comm_id %d, cm_id->state: %d\n", __func__,
  1860. be32_to_cpu(cm_id_priv->id.local_id), cm_id->state);
  1861. ret = -EINVAL;
  1862. goto out;
  1863. }
  1864. ret = cm_alloc_msg(cm_id_priv, &msg);
  1865. if (ret)
  1866. goto out;
  1867. rep_msg = (struct cm_rep_msg *) msg->mad;
  1868. cm_format_rep(rep_msg, cm_id_priv, param);
  1869. msg->timeout_ms = cm_id_priv->timeout_ms;
  1870. msg->context[1] = (void *) (unsigned long) IB_CM_REP_SENT;
  1871. ret = ib_post_send_mad(msg, NULL);
  1872. if (ret) {
  1873. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1874. cm_free_msg(msg);
  1875. return ret;
  1876. }
  1877. cm_id->state = IB_CM_REP_SENT;
  1878. cm_id_priv->msg = msg;
  1879. cm_id_priv->initiator_depth = param->initiator_depth;
  1880. cm_id_priv->responder_resources = param->responder_resources;
  1881. cm_id_priv->rq_psn = cm_rep_get_starting_psn(rep_msg);
  1882. cm_id_priv->local_qpn = cpu_to_be32(param->qp_num & 0xFFFFFF);
  1883. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1884. return ret;
  1885. }
  1886. EXPORT_SYMBOL(ib_send_cm_rep);
  1887. static void cm_format_rtu(struct cm_rtu_msg *rtu_msg,
  1888. struct cm_id_private *cm_id_priv,
  1889. const void *private_data,
  1890. u8 private_data_len)
  1891. {
  1892. cm_format_mad_hdr(&rtu_msg->hdr, CM_RTU_ATTR_ID, cm_id_priv->tid);
  1893. rtu_msg->local_comm_id = cm_id_priv->id.local_id;
  1894. rtu_msg->remote_comm_id = cm_id_priv->id.remote_id;
  1895. if (private_data && private_data_len)
  1896. memcpy(rtu_msg->private_data, private_data, private_data_len);
  1897. }
  1898. int ib_send_cm_rtu(struct ib_cm_id *cm_id,
  1899. const void *private_data,
  1900. u8 private_data_len)
  1901. {
  1902. struct cm_id_private *cm_id_priv;
  1903. struct ib_mad_send_buf *msg;
  1904. unsigned long flags;
  1905. void *data;
  1906. int ret;
  1907. if (private_data && private_data_len > IB_CM_RTU_PRIVATE_DATA_SIZE)
  1908. return -EINVAL;
  1909. data = cm_copy_private_data(private_data, private_data_len);
  1910. if (IS_ERR(data))
  1911. return PTR_ERR(data);
  1912. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  1913. spin_lock_irqsave(&cm_id_priv->lock, flags);
  1914. if (cm_id->state != IB_CM_REP_RCVD &&
  1915. cm_id->state != IB_CM_MRA_REP_SENT) {
  1916. pr_debug("%s: local_id %d, cm_id->state %d\n", __func__,
  1917. be32_to_cpu(cm_id->local_id), cm_id->state);
  1918. ret = -EINVAL;
  1919. goto error;
  1920. }
  1921. ret = cm_alloc_msg(cm_id_priv, &msg);
  1922. if (ret)
  1923. goto error;
  1924. cm_format_rtu((struct cm_rtu_msg *) msg->mad, cm_id_priv,
  1925. private_data, private_data_len);
  1926. ret = ib_post_send_mad(msg, NULL);
  1927. if (ret) {
  1928. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1929. cm_free_msg(msg);
  1930. kfree(data);
  1931. return ret;
  1932. }
  1933. cm_id->state = IB_CM_ESTABLISHED;
  1934. cm_set_private_data(cm_id_priv, data, private_data_len);
  1935. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1936. return 0;
  1937. error: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  1938. kfree(data);
  1939. return ret;
  1940. }
  1941. EXPORT_SYMBOL(ib_send_cm_rtu);
  1942. static void cm_format_rep_event(struct cm_work *work, enum ib_qp_type qp_type)
  1943. {
  1944. struct cm_rep_msg *rep_msg;
  1945. struct ib_cm_rep_event_param *param;
  1946. rep_msg = (struct cm_rep_msg *)work->mad_recv_wc->recv_buf.mad;
  1947. param = &work->cm_event.param.rep_rcvd;
  1948. param->remote_ca_guid = rep_msg->local_ca_guid;
  1949. param->remote_qkey = be32_to_cpu(rep_msg->local_qkey);
  1950. param->remote_qpn = be32_to_cpu(cm_rep_get_qpn(rep_msg, qp_type));
  1951. param->starting_psn = be32_to_cpu(cm_rep_get_starting_psn(rep_msg));
  1952. param->responder_resources = rep_msg->initiator_depth;
  1953. param->initiator_depth = rep_msg->resp_resources;
  1954. param->target_ack_delay = cm_rep_get_target_ack_delay(rep_msg);
  1955. param->failover_accepted = cm_rep_get_failover(rep_msg);
  1956. param->flow_control = cm_rep_get_flow_ctrl(rep_msg);
  1957. param->rnr_retry_count = cm_rep_get_rnr_retry_count(rep_msg);
  1958. param->srq = cm_rep_get_srq(rep_msg);
  1959. work->cm_event.private_data = &rep_msg->private_data;
  1960. }
  1961. static void cm_dup_rep_handler(struct cm_work *work)
  1962. {
  1963. struct cm_id_private *cm_id_priv;
  1964. struct cm_rep_msg *rep_msg;
  1965. struct ib_mad_send_buf *msg = NULL;
  1966. int ret;
  1967. rep_msg = (struct cm_rep_msg *) work->mad_recv_wc->recv_buf.mad;
  1968. cm_id_priv = cm_acquire_id(rep_msg->remote_comm_id,
  1969. rep_msg->local_comm_id);
  1970. if (!cm_id_priv)
  1971. return;
  1972. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  1973. counter[CM_REP_COUNTER]);
  1974. ret = cm_alloc_response_msg(work->port, work->mad_recv_wc, &msg);
  1975. if (ret)
  1976. goto deref;
  1977. spin_lock_irq(&cm_id_priv->lock);
  1978. if (cm_id_priv->id.state == IB_CM_ESTABLISHED)
  1979. cm_format_rtu((struct cm_rtu_msg *) msg->mad, cm_id_priv,
  1980. cm_id_priv->private_data,
  1981. cm_id_priv->private_data_len);
  1982. else if (cm_id_priv->id.state == IB_CM_MRA_REP_SENT)
  1983. cm_format_mra((struct cm_mra_msg *) msg->mad, cm_id_priv,
  1984. CM_MSG_RESPONSE_REP, cm_id_priv->service_timeout,
  1985. cm_id_priv->private_data,
  1986. cm_id_priv->private_data_len);
  1987. else
  1988. goto unlock;
  1989. spin_unlock_irq(&cm_id_priv->lock);
  1990. ret = ib_post_send_mad(msg, NULL);
  1991. if (ret)
  1992. goto free;
  1993. goto deref;
  1994. unlock: spin_unlock_irq(&cm_id_priv->lock);
  1995. free: cm_free_msg(msg);
  1996. deref: cm_deref_id(cm_id_priv);
  1997. }
  1998. static int cm_rep_handler(struct cm_work *work)
  1999. {
  2000. struct cm_id_private *cm_id_priv;
  2001. struct cm_rep_msg *rep_msg;
  2002. int ret;
  2003. struct cm_id_private *cur_cm_id_priv;
  2004. struct ib_cm_id *cm_id;
  2005. struct cm_timewait_info *timewait_info;
  2006. rep_msg = (struct cm_rep_msg *)work->mad_recv_wc->recv_buf.mad;
  2007. cm_id_priv = cm_acquire_id(rep_msg->remote_comm_id, 0);
  2008. if (!cm_id_priv) {
  2009. cm_dup_rep_handler(work);
  2010. pr_debug("%s: remote_comm_id %d, no cm_id_priv\n", __func__,
  2011. be32_to_cpu(rep_msg->remote_comm_id));
  2012. return -EINVAL;
  2013. }
  2014. cm_format_rep_event(work, cm_id_priv->qp_type);
  2015. spin_lock_irq(&cm_id_priv->lock);
  2016. switch (cm_id_priv->id.state) {
  2017. case IB_CM_REQ_SENT:
  2018. case IB_CM_MRA_REQ_RCVD:
  2019. break;
  2020. default:
  2021. spin_unlock_irq(&cm_id_priv->lock);
  2022. ret = -EINVAL;
  2023. pr_debug("%s: cm_id_priv->id.state: %d, local_comm_id %d, remote_comm_id %d\n",
  2024. __func__, cm_id_priv->id.state,
  2025. be32_to_cpu(rep_msg->local_comm_id),
  2026. be32_to_cpu(rep_msg->remote_comm_id));
  2027. goto error;
  2028. }
  2029. cm_id_priv->timewait_info->work.remote_id = rep_msg->local_comm_id;
  2030. cm_id_priv->timewait_info->remote_ca_guid = rep_msg->local_ca_guid;
  2031. cm_id_priv->timewait_info->remote_qpn = cm_rep_get_qpn(rep_msg, cm_id_priv->qp_type);
  2032. spin_lock(&cm.lock);
  2033. /* Check for duplicate REP. */
  2034. if (cm_insert_remote_id(cm_id_priv->timewait_info)) {
  2035. spin_unlock(&cm.lock);
  2036. spin_unlock_irq(&cm_id_priv->lock);
  2037. ret = -EINVAL;
  2038. pr_debug("%s: Failed to insert remote id %d\n", __func__,
  2039. be32_to_cpu(rep_msg->remote_comm_id));
  2040. goto error;
  2041. }
  2042. /* Check for a stale connection. */
  2043. timewait_info = cm_insert_remote_qpn(cm_id_priv->timewait_info);
  2044. if (timewait_info) {
  2045. rb_erase(&cm_id_priv->timewait_info->remote_id_node,
  2046. &cm.remote_id_table);
  2047. cm_id_priv->timewait_info->inserted_remote_id = 0;
  2048. cur_cm_id_priv = cm_get_id(timewait_info->work.local_id,
  2049. timewait_info->work.remote_id);
  2050. spin_unlock(&cm.lock);
  2051. spin_unlock_irq(&cm_id_priv->lock);
  2052. cm_issue_rej(work->port, work->mad_recv_wc,
  2053. IB_CM_REJ_STALE_CONN, CM_MSG_RESPONSE_REP,
  2054. NULL, 0);
  2055. ret = -EINVAL;
  2056. pr_debug("%s: Stale connection. local_comm_id %d, remote_comm_id %d\n",
  2057. __func__, be32_to_cpu(rep_msg->local_comm_id),
  2058. be32_to_cpu(rep_msg->remote_comm_id));
  2059. if (cur_cm_id_priv) {
  2060. cm_id = &cur_cm_id_priv->id;
  2061. ib_send_cm_dreq(cm_id, NULL, 0);
  2062. cm_deref_id(cur_cm_id_priv);
  2063. }
  2064. goto error;
  2065. }
  2066. spin_unlock(&cm.lock);
  2067. cm_id_priv->id.state = IB_CM_REP_RCVD;
  2068. cm_id_priv->id.remote_id = rep_msg->local_comm_id;
  2069. cm_id_priv->remote_qpn = cm_rep_get_qpn(rep_msg, cm_id_priv->qp_type);
  2070. cm_id_priv->initiator_depth = rep_msg->resp_resources;
  2071. cm_id_priv->responder_resources = rep_msg->initiator_depth;
  2072. cm_id_priv->sq_psn = cm_rep_get_starting_psn(rep_msg);
  2073. cm_id_priv->rnr_retry_count = cm_rep_get_rnr_retry_count(rep_msg);
  2074. cm_id_priv->target_ack_delay = cm_rep_get_target_ack_delay(rep_msg);
  2075. cm_id_priv->av.timeout =
  2076. cm_ack_timeout(cm_id_priv->target_ack_delay,
  2077. cm_id_priv->av.timeout - 1);
  2078. cm_id_priv->alt_av.timeout =
  2079. cm_ack_timeout(cm_id_priv->target_ack_delay,
  2080. cm_id_priv->alt_av.timeout - 1);
  2081. /* todo: handle peer_to_peer */
  2082. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2083. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2084. if (!ret)
  2085. list_add_tail(&work->list, &cm_id_priv->work_list);
  2086. spin_unlock_irq(&cm_id_priv->lock);
  2087. if (ret)
  2088. cm_process_work(cm_id_priv, work);
  2089. else
  2090. cm_deref_id(cm_id_priv);
  2091. return 0;
  2092. error:
  2093. cm_deref_id(cm_id_priv);
  2094. return ret;
  2095. }
  2096. static int cm_establish_handler(struct cm_work *work)
  2097. {
  2098. struct cm_id_private *cm_id_priv;
  2099. int ret;
  2100. /* See comment in cm_establish about lookup. */
  2101. cm_id_priv = cm_acquire_id(work->local_id, work->remote_id);
  2102. if (!cm_id_priv)
  2103. return -EINVAL;
  2104. spin_lock_irq(&cm_id_priv->lock);
  2105. if (cm_id_priv->id.state != IB_CM_ESTABLISHED) {
  2106. spin_unlock_irq(&cm_id_priv->lock);
  2107. goto out;
  2108. }
  2109. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2110. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2111. if (!ret)
  2112. list_add_tail(&work->list, &cm_id_priv->work_list);
  2113. spin_unlock_irq(&cm_id_priv->lock);
  2114. if (ret)
  2115. cm_process_work(cm_id_priv, work);
  2116. else
  2117. cm_deref_id(cm_id_priv);
  2118. return 0;
  2119. out:
  2120. cm_deref_id(cm_id_priv);
  2121. return -EINVAL;
  2122. }
  2123. static int cm_rtu_handler(struct cm_work *work)
  2124. {
  2125. struct cm_id_private *cm_id_priv;
  2126. struct cm_rtu_msg *rtu_msg;
  2127. int ret;
  2128. rtu_msg = (struct cm_rtu_msg *)work->mad_recv_wc->recv_buf.mad;
  2129. cm_id_priv = cm_acquire_id(rtu_msg->remote_comm_id,
  2130. rtu_msg->local_comm_id);
  2131. if (!cm_id_priv)
  2132. return -EINVAL;
  2133. work->cm_event.private_data = &rtu_msg->private_data;
  2134. spin_lock_irq(&cm_id_priv->lock);
  2135. if (cm_id_priv->id.state != IB_CM_REP_SENT &&
  2136. cm_id_priv->id.state != IB_CM_MRA_REP_RCVD) {
  2137. spin_unlock_irq(&cm_id_priv->lock);
  2138. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2139. counter[CM_RTU_COUNTER]);
  2140. goto out;
  2141. }
  2142. cm_id_priv->id.state = IB_CM_ESTABLISHED;
  2143. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2144. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2145. if (!ret)
  2146. list_add_tail(&work->list, &cm_id_priv->work_list);
  2147. spin_unlock_irq(&cm_id_priv->lock);
  2148. if (ret)
  2149. cm_process_work(cm_id_priv, work);
  2150. else
  2151. cm_deref_id(cm_id_priv);
  2152. return 0;
  2153. out:
  2154. cm_deref_id(cm_id_priv);
  2155. return -EINVAL;
  2156. }
  2157. static void cm_format_dreq(struct cm_dreq_msg *dreq_msg,
  2158. struct cm_id_private *cm_id_priv,
  2159. const void *private_data,
  2160. u8 private_data_len)
  2161. {
  2162. cm_format_mad_hdr(&dreq_msg->hdr, CM_DREQ_ATTR_ID,
  2163. cm_form_tid(cm_id_priv));
  2164. dreq_msg->local_comm_id = cm_id_priv->id.local_id;
  2165. dreq_msg->remote_comm_id = cm_id_priv->id.remote_id;
  2166. cm_dreq_set_remote_qpn(dreq_msg, cm_id_priv->remote_qpn);
  2167. if (private_data && private_data_len)
  2168. memcpy(dreq_msg->private_data, private_data, private_data_len);
  2169. }
  2170. int ib_send_cm_dreq(struct ib_cm_id *cm_id,
  2171. const void *private_data,
  2172. u8 private_data_len)
  2173. {
  2174. struct cm_id_private *cm_id_priv;
  2175. struct ib_mad_send_buf *msg;
  2176. unsigned long flags;
  2177. int ret;
  2178. if (private_data && private_data_len > IB_CM_DREQ_PRIVATE_DATA_SIZE)
  2179. return -EINVAL;
  2180. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2181. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2182. if (cm_id->state != IB_CM_ESTABLISHED) {
  2183. pr_debug("%s: local_id %d, cm_id->state: %d\n", __func__,
  2184. be32_to_cpu(cm_id->local_id), cm_id->state);
  2185. ret = -EINVAL;
  2186. goto out;
  2187. }
  2188. if (cm_id->lap_state == IB_CM_LAP_SENT ||
  2189. cm_id->lap_state == IB_CM_MRA_LAP_RCVD)
  2190. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2191. ret = cm_alloc_msg(cm_id_priv, &msg);
  2192. if (ret) {
  2193. cm_enter_timewait(cm_id_priv);
  2194. goto out;
  2195. }
  2196. cm_format_dreq((struct cm_dreq_msg *) msg->mad, cm_id_priv,
  2197. private_data, private_data_len);
  2198. msg->timeout_ms = cm_id_priv->timeout_ms;
  2199. msg->context[1] = (void *) (unsigned long) IB_CM_DREQ_SENT;
  2200. ret = ib_post_send_mad(msg, NULL);
  2201. if (ret) {
  2202. cm_enter_timewait(cm_id_priv);
  2203. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2204. cm_free_msg(msg);
  2205. return ret;
  2206. }
  2207. cm_id->state = IB_CM_DREQ_SENT;
  2208. cm_id_priv->msg = msg;
  2209. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2210. return ret;
  2211. }
  2212. EXPORT_SYMBOL(ib_send_cm_dreq);
  2213. static void cm_format_drep(struct cm_drep_msg *drep_msg,
  2214. struct cm_id_private *cm_id_priv,
  2215. const void *private_data,
  2216. u8 private_data_len)
  2217. {
  2218. cm_format_mad_hdr(&drep_msg->hdr, CM_DREP_ATTR_ID, cm_id_priv->tid);
  2219. drep_msg->local_comm_id = cm_id_priv->id.local_id;
  2220. drep_msg->remote_comm_id = cm_id_priv->id.remote_id;
  2221. if (private_data && private_data_len)
  2222. memcpy(drep_msg->private_data, private_data, private_data_len);
  2223. }
  2224. int ib_send_cm_drep(struct ib_cm_id *cm_id,
  2225. const void *private_data,
  2226. u8 private_data_len)
  2227. {
  2228. struct cm_id_private *cm_id_priv;
  2229. struct ib_mad_send_buf *msg;
  2230. unsigned long flags;
  2231. void *data;
  2232. int ret;
  2233. if (private_data && private_data_len > IB_CM_DREP_PRIVATE_DATA_SIZE)
  2234. return -EINVAL;
  2235. data = cm_copy_private_data(private_data, private_data_len);
  2236. if (IS_ERR(data))
  2237. return PTR_ERR(data);
  2238. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2239. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2240. if (cm_id->state != IB_CM_DREQ_RCVD) {
  2241. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2242. kfree(data);
  2243. pr_debug("%s: local_id %d, cm_idcm_id->state(%d) != IB_CM_DREQ_RCVD\n",
  2244. __func__, be32_to_cpu(cm_id->local_id), cm_id->state);
  2245. return -EINVAL;
  2246. }
  2247. cm_set_private_data(cm_id_priv, data, private_data_len);
  2248. cm_enter_timewait(cm_id_priv);
  2249. ret = cm_alloc_msg(cm_id_priv, &msg);
  2250. if (ret)
  2251. goto out;
  2252. cm_format_drep((struct cm_drep_msg *) msg->mad, cm_id_priv,
  2253. private_data, private_data_len);
  2254. ret = ib_post_send_mad(msg, NULL);
  2255. if (ret) {
  2256. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2257. cm_free_msg(msg);
  2258. return ret;
  2259. }
  2260. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2261. return ret;
  2262. }
  2263. EXPORT_SYMBOL(ib_send_cm_drep);
  2264. static int cm_issue_drep(struct cm_port *port,
  2265. struct ib_mad_recv_wc *mad_recv_wc)
  2266. {
  2267. struct ib_mad_send_buf *msg = NULL;
  2268. struct cm_dreq_msg *dreq_msg;
  2269. struct cm_drep_msg *drep_msg;
  2270. int ret;
  2271. ret = cm_alloc_response_msg(port, mad_recv_wc, &msg);
  2272. if (ret)
  2273. return ret;
  2274. dreq_msg = (struct cm_dreq_msg *) mad_recv_wc->recv_buf.mad;
  2275. drep_msg = (struct cm_drep_msg *) msg->mad;
  2276. cm_format_mad_hdr(&drep_msg->hdr, CM_DREP_ATTR_ID, dreq_msg->hdr.tid);
  2277. drep_msg->remote_comm_id = dreq_msg->local_comm_id;
  2278. drep_msg->local_comm_id = dreq_msg->remote_comm_id;
  2279. ret = ib_post_send_mad(msg, NULL);
  2280. if (ret)
  2281. cm_free_msg(msg);
  2282. return ret;
  2283. }
  2284. static int cm_dreq_handler(struct cm_work *work)
  2285. {
  2286. struct cm_id_private *cm_id_priv;
  2287. struct cm_dreq_msg *dreq_msg;
  2288. struct ib_mad_send_buf *msg = NULL;
  2289. int ret;
  2290. dreq_msg = (struct cm_dreq_msg *)work->mad_recv_wc->recv_buf.mad;
  2291. cm_id_priv = cm_acquire_id(dreq_msg->remote_comm_id,
  2292. dreq_msg->local_comm_id);
  2293. if (!cm_id_priv) {
  2294. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2295. counter[CM_DREQ_COUNTER]);
  2296. cm_issue_drep(work->port, work->mad_recv_wc);
  2297. pr_debug("%s: no cm_id_priv, local_comm_id %d, remote_comm_id %d\n",
  2298. __func__, be32_to_cpu(dreq_msg->local_comm_id),
  2299. be32_to_cpu(dreq_msg->remote_comm_id));
  2300. return -EINVAL;
  2301. }
  2302. work->cm_event.private_data = &dreq_msg->private_data;
  2303. spin_lock_irq(&cm_id_priv->lock);
  2304. if (cm_id_priv->local_qpn != cm_dreq_get_remote_qpn(dreq_msg))
  2305. goto unlock;
  2306. switch (cm_id_priv->id.state) {
  2307. case IB_CM_REP_SENT:
  2308. case IB_CM_DREQ_SENT:
  2309. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2310. break;
  2311. case IB_CM_ESTABLISHED:
  2312. if (cm_id_priv->id.lap_state == IB_CM_LAP_SENT ||
  2313. cm_id_priv->id.lap_state == IB_CM_MRA_LAP_RCVD)
  2314. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2315. break;
  2316. case IB_CM_MRA_REP_RCVD:
  2317. break;
  2318. case IB_CM_TIMEWAIT:
  2319. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2320. counter[CM_DREQ_COUNTER]);
  2321. msg = cm_alloc_response_msg_no_ah(work->port, work->mad_recv_wc);
  2322. if (IS_ERR(msg))
  2323. goto unlock;
  2324. cm_format_drep((struct cm_drep_msg *) msg->mad, cm_id_priv,
  2325. cm_id_priv->private_data,
  2326. cm_id_priv->private_data_len);
  2327. spin_unlock_irq(&cm_id_priv->lock);
  2328. if (cm_create_response_msg_ah(work->port, work->mad_recv_wc, msg) ||
  2329. ib_post_send_mad(msg, NULL))
  2330. cm_free_msg(msg);
  2331. goto deref;
  2332. case IB_CM_DREQ_RCVD:
  2333. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2334. counter[CM_DREQ_COUNTER]);
  2335. goto unlock;
  2336. default:
  2337. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  2338. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  2339. cm_id_priv->id.state);
  2340. goto unlock;
  2341. }
  2342. cm_id_priv->id.state = IB_CM_DREQ_RCVD;
  2343. cm_id_priv->tid = dreq_msg->hdr.tid;
  2344. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2345. if (!ret)
  2346. list_add_tail(&work->list, &cm_id_priv->work_list);
  2347. spin_unlock_irq(&cm_id_priv->lock);
  2348. if (ret)
  2349. cm_process_work(cm_id_priv, work);
  2350. else
  2351. cm_deref_id(cm_id_priv);
  2352. return 0;
  2353. unlock: spin_unlock_irq(&cm_id_priv->lock);
  2354. deref: cm_deref_id(cm_id_priv);
  2355. return -EINVAL;
  2356. }
  2357. static int cm_drep_handler(struct cm_work *work)
  2358. {
  2359. struct cm_id_private *cm_id_priv;
  2360. struct cm_drep_msg *drep_msg;
  2361. int ret;
  2362. drep_msg = (struct cm_drep_msg *)work->mad_recv_wc->recv_buf.mad;
  2363. cm_id_priv = cm_acquire_id(drep_msg->remote_comm_id,
  2364. drep_msg->local_comm_id);
  2365. if (!cm_id_priv)
  2366. return -EINVAL;
  2367. work->cm_event.private_data = &drep_msg->private_data;
  2368. spin_lock_irq(&cm_id_priv->lock);
  2369. if (cm_id_priv->id.state != IB_CM_DREQ_SENT &&
  2370. cm_id_priv->id.state != IB_CM_DREQ_RCVD) {
  2371. spin_unlock_irq(&cm_id_priv->lock);
  2372. goto out;
  2373. }
  2374. cm_enter_timewait(cm_id_priv);
  2375. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2376. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2377. if (!ret)
  2378. list_add_tail(&work->list, &cm_id_priv->work_list);
  2379. spin_unlock_irq(&cm_id_priv->lock);
  2380. if (ret)
  2381. cm_process_work(cm_id_priv, work);
  2382. else
  2383. cm_deref_id(cm_id_priv);
  2384. return 0;
  2385. out:
  2386. cm_deref_id(cm_id_priv);
  2387. return -EINVAL;
  2388. }
  2389. int ib_send_cm_rej(struct ib_cm_id *cm_id,
  2390. enum ib_cm_rej_reason reason,
  2391. void *ari,
  2392. u8 ari_length,
  2393. const void *private_data,
  2394. u8 private_data_len)
  2395. {
  2396. struct cm_id_private *cm_id_priv;
  2397. struct ib_mad_send_buf *msg;
  2398. unsigned long flags;
  2399. int ret;
  2400. if ((private_data && private_data_len > IB_CM_REJ_PRIVATE_DATA_SIZE) ||
  2401. (ari && ari_length > IB_CM_REJ_ARI_LENGTH))
  2402. return -EINVAL;
  2403. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2404. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2405. switch (cm_id->state) {
  2406. case IB_CM_REQ_SENT:
  2407. case IB_CM_MRA_REQ_RCVD:
  2408. case IB_CM_REQ_RCVD:
  2409. case IB_CM_MRA_REQ_SENT:
  2410. case IB_CM_REP_RCVD:
  2411. case IB_CM_MRA_REP_SENT:
  2412. ret = cm_alloc_msg(cm_id_priv, &msg);
  2413. if (!ret)
  2414. cm_format_rej((struct cm_rej_msg *) msg->mad,
  2415. cm_id_priv, reason, ari, ari_length,
  2416. private_data, private_data_len);
  2417. cm_reset_to_idle(cm_id_priv);
  2418. break;
  2419. case IB_CM_REP_SENT:
  2420. case IB_CM_MRA_REP_RCVD:
  2421. ret = cm_alloc_msg(cm_id_priv, &msg);
  2422. if (!ret)
  2423. cm_format_rej((struct cm_rej_msg *) msg->mad,
  2424. cm_id_priv, reason, ari, ari_length,
  2425. private_data, private_data_len);
  2426. cm_enter_timewait(cm_id_priv);
  2427. break;
  2428. default:
  2429. pr_debug("%s: local_id %d, cm_id->state: %d\n", __func__,
  2430. be32_to_cpu(cm_id_priv->id.local_id), cm_id->state);
  2431. ret = -EINVAL;
  2432. goto out;
  2433. }
  2434. if (ret)
  2435. goto out;
  2436. ret = ib_post_send_mad(msg, NULL);
  2437. if (ret)
  2438. cm_free_msg(msg);
  2439. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2440. return ret;
  2441. }
  2442. EXPORT_SYMBOL(ib_send_cm_rej);
  2443. static void cm_format_rej_event(struct cm_work *work)
  2444. {
  2445. struct cm_rej_msg *rej_msg;
  2446. struct ib_cm_rej_event_param *param;
  2447. rej_msg = (struct cm_rej_msg *)work->mad_recv_wc->recv_buf.mad;
  2448. param = &work->cm_event.param.rej_rcvd;
  2449. param->ari = rej_msg->ari;
  2450. param->ari_length = cm_rej_get_reject_info_len(rej_msg);
  2451. param->reason = __be16_to_cpu(rej_msg->reason);
  2452. work->cm_event.private_data = &rej_msg->private_data;
  2453. }
  2454. static struct cm_id_private * cm_acquire_rejected_id(struct cm_rej_msg *rej_msg)
  2455. {
  2456. struct cm_timewait_info *timewait_info;
  2457. struct cm_id_private *cm_id_priv;
  2458. __be32 remote_id;
  2459. remote_id = rej_msg->local_comm_id;
  2460. if (__be16_to_cpu(rej_msg->reason) == IB_CM_REJ_TIMEOUT) {
  2461. spin_lock_irq(&cm.lock);
  2462. timewait_info = cm_find_remote_id( *((__be64 *) rej_msg->ari),
  2463. remote_id);
  2464. if (!timewait_info) {
  2465. spin_unlock_irq(&cm.lock);
  2466. return NULL;
  2467. }
  2468. cm_id_priv = idr_find(&cm.local_id_table, (__force int)
  2469. (timewait_info->work.local_id ^
  2470. cm.random_id_operand));
  2471. if (cm_id_priv) {
  2472. if (cm_id_priv->id.remote_id == remote_id)
  2473. atomic_inc(&cm_id_priv->refcount);
  2474. else
  2475. cm_id_priv = NULL;
  2476. }
  2477. spin_unlock_irq(&cm.lock);
  2478. } else if (cm_rej_get_msg_rejected(rej_msg) == CM_MSG_RESPONSE_REQ)
  2479. cm_id_priv = cm_acquire_id(rej_msg->remote_comm_id, 0);
  2480. else
  2481. cm_id_priv = cm_acquire_id(rej_msg->remote_comm_id, remote_id);
  2482. return cm_id_priv;
  2483. }
  2484. static int cm_rej_handler(struct cm_work *work)
  2485. {
  2486. struct cm_id_private *cm_id_priv;
  2487. struct cm_rej_msg *rej_msg;
  2488. int ret;
  2489. rej_msg = (struct cm_rej_msg *)work->mad_recv_wc->recv_buf.mad;
  2490. cm_id_priv = cm_acquire_rejected_id(rej_msg);
  2491. if (!cm_id_priv)
  2492. return -EINVAL;
  2493. cm_format_rej_event(work);
  2494. spin_lock_irq(&cm_id_priv->lock);
  2495. switch (cm_id_priv->id.state) {
  2496. case IB_CM_REQ_SENT:
  2497. case IB_CM_MRA_REQ_RCVD:
  2498. case IB_CM_REP_SENT:
  2499. case IB_CM_MRA_REP_RCVD:
  2500. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2501. /* fall through */
  2502. case IB_CM_REQ_RCVD:
  2503. case IB_CM_MRA_REQ_SENT:
  2504. if (__be16_to_cpu(rej_msg->reason) == IB_CM_REJ_STALE_CONN)
  2505. cm_enter_timewait(cm_id_priv);
  2506. else
  2507. cm_reset_to_idle(cm_id_priv);
  2508. break;
  2509. case IB_CM_DREQ_SENT:
  2510. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2511. /* fall through */
  2512. case IB_CM_REP_RCVD:
  2513. case IB_CM_MRA_REP_SENT:
  2514. cm_enter_timewait(cm_id_priv);
  2515. break;
  2516. case IB_CM_ESTABLISHED:
  2517. if (cm_id_priv->id.lap_state == IB_CM_LAP_UNINIT ||
  2518. cm_id_priv->id.lap_state == IB_CM_LAP_SENT) {
  2519. if (cm_id_priv->id.lap_state == IB_CM_LAP_SENT)
  2520. ib_cancel_mad(cm_id_priv->av.port->mad_agent,
  2521. cm_id_priv->msg);
  2522. cm_enter_timewait(cm_id_priv);
  2523. break;
  2524. }
  2525. /* fall through */
  2526. default:
  2527. spin_unlock_irq(&cm_id_priv->lock);
  2528. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  2529. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  2530. cm_id_priv->id.state);
  2531. ret = -EINVAL;
  2532. goto out;
  2533. }
  2534. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2535. if (!ret)
  2536. list_add_tail(&work->list, &cm_id_priv->work_list);
  2537. spin_unlock_irq(&cm_id_priv->lock);
  2538. if (ret)
  2539. cm_process_work(cm_id_priv, work);
  2540. else
  2541. cm_deref_id(cm_id_priv);
  2542. return 0;
  2543. out:
  2544. cm_deref_id(cm_id_priv);
  2545. return -EINVAL;
  2546. }
  2547. int ib_send_cm_mra(struct ib_cm_id *cm_id,
  2548. u8 service_timeout,
  2549. const void *private_data,
  2550. u8 private_data_len)
  2551. {
  2552. struct cm_id_private *cm_id_priv;
  2553. struct ib_mad_send_buf *msg;
  2554. enum ib_cm_state cm_state;
  2555. enum ib_cm_lap_state lap_state;
  2556. enum cm_msg_response msg_response;
  2557. void *data;
  2558. unsigned long flags;
  2559. int ret;
  2560. if (private_data && private_data_len > IB_CM_MRA_PRIVATE_DATA_SIZE)
  2561. return -EINVAL;
  2562. data = cm_copy_private_data(private_data, private_data_len);
  2563. if (IS_ERR(data))
  2564. return PTR_ERR(data);
  2565. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2566. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2567. switch(cm_id_priv->id.state) {
  2568. case IB_CM_REQ_RCVD:
  2569. cm_state = IB_CM_MRA_REQ_SENT;
  2570. lap_state = cm_id->lap_state;
  2571. msg_response = CM_MSG_RESPONSE_REQ;
  2572. break;
  2573. case IB_CM_REP_RCVD:
  2574. cm_state = IB_CM_MRA_REP_SENT;
  2575. lap_state = cm_id->lap_state;
  2576. msg_response = CM_MSG_RESPONSE_REP;
  2577. break;
  2578. case IB_CM_ESTABLISHED:
  2579. if (cm_id->lap_state == IB_CM_LAP_RCVD) {
  2580. cm_state = cm_id->state;
  2581. lap_state = IB_CM_MRA_LAP_SENT;
  2582. msg_response = CM_MSG_RESPONSE_OTHER;
  2583. break;
  2584. }
  2585. /* fall through */
  2586. default:
  2587. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  2588. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  2589. cm_id_priv->id.state);
  2590. ret = -EINVAL;
  2591. goto error1;
  2592. }
  2593. if (!(service_timeout & IB_CM_MRA_FLAG_DELAY)) {
  2594. ret = cm_alloc_msg(cm_id_priv, &msg);
  2595. if (ret)
  2596. goto error1;
  2597. cm_format_mra((struct cm_mra_msg *) msg->mad, cm_id_priv,
  2598. msg_response, service_timeout,
  2599. private_data, private_data_len);
  2600. ret = ib_post_send_mad(msg, NULL);
  2601. if (ret)
  2602. goto error2;
  2603. }
  2604. cm_id->state = cm_state;
  2605. cm_id->lap_state = lap_state;
  2606. cm_id_priv->service_timeout = service_timeout;
  2607. cm_set_private_data(cm_id_priv, data, private_data_len);
  2608. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2609. return 0;
  2610. error1: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2611. kfree(data);
  2612. return ret;
  2613. error2: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2614. kfree(data);
  2615. cm_free_msg(msg);
  2616. return ret;
  2617. }
  2618. EXPORT_SYMBOL(ib_send_cm_mra);
  2619. static struct cm_id_private * cm_acquire_mraed_id(struct cm_mra_msg *mra_msg)
  2620. {
  2621. switch (cm_mra_get_msg_mraed(mra_msg)) {
  2622. case CM_MSG_RESPONSE_REQ:
  2623. return cm_acquire_id(mra_msg->remote_comm_id, 0);
  2624. case CM_MSG_RESPONSE_REP:
  2625. case CM_MSG_RESPONSE_OTHER:
  2626. return cm_acquire_id(mra_msg->remote_comm_id,
  2627. mra_msg->local_comm_id);
  2628. default:
  2629. return NULL;
  2630. }
  2631. }
  2632. static int cm_mra_handler(struct cm_work *work)
  2633. {
  2634. struct cm_id_private *cm_id_priv;
  2635. struct cm_mra_msg *mra_msg;
  2636. int timeout, ret;
  2637. mra_msg = (struct cm_mra_msg *)work->mad_recv_wc->recv_buf.mad;
  2638. cm_id_priv = cm_acquire_mraed_id(mra_msg);
  2639. if (!cm_id_priv)
  2640. return -EINVAL;
  2641. work->cm_event.private_data = &mra_msg->private_data;
  2642. work->cm_event.param.mra_rcvd.service_timeout =
  2643. cm_mra_get_service_timeout(mra_msg);
  2644. timeout = cm_convert_to_ms(cm_mra_get_service_timeout(mra_msg)) +
  2645. cm_convert_to_ms(cm_id_priv->av.timeout);
  2646. spin_lock_irq(&cm_id_priv->lock);
  2647. switch (cm_id_priv->id.state) {
  2648. case IB_CM_REQ_SENT:
  2649. if (cm_mra_get_msg_mraed(mra_msg) != CM_MSG_RESPONSE_REQ ||
  2650. ib_modify_mad(cm_id_priv->av.port->mad_agent,
  2651. cm_id_priv->msg, timeout))
  2652. goto out;
  2653. cm_id_priv->id.state = IB_CM_MRA_REQ_RCVD;
  2654. break;
  2655. case IB_CM_REP_SENT:
  2656. if (cm_mra_get_msg_mraed(mra_msg) != CM_MSG_RESPONSE_REP ||
  2657. ib_modify_mad(cm_id_priv->av.port->mad_agent,
  2658. cm_id_priv->msg, timeout))
  2659. goto out;
  2660. cm_id_priv->id.state = IB_CM_MRA_REP_RCVD;
  2661. break;
  2662. case IB_CM_ESTABLISHED:
  2663. if (cm_mra_get_msg_mraed(mra_msg) != CM_MSG_RESPONSE_OTHER ||
  2664. cm_id_priv->id.lap_state != IB_CM_LAP_SENT ||
  2665. ib_modify_mad(cm_id_priv->av.port->mad_agent,
  2666. cm_id_priv->msg, timeout)) {
  2667. if (cm_id_priv->id.lap_state == IB_CM_MRA_LAP_RCVD)
  2668. atomic_long_inc(&work->port->
  2669. counter_group[CM_RECV_DUPLICATES].
  2670. counter[CM_MRA_COUNTER]);
  2671. goto out;
  2672. }
  2673. cm_id_priv->id.lap_state = IB_CM_MRA_LAP_RCVD;
  2674. break;
  2675. case IB_CM_MRA_REQ_RCVD:
  2676. case IB_CM_MRA_REP_RCVD:
  2677. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2678. counter[CM_MRA_COUNTER]);
  2679. /* fall through */
  2680. default:
  2681. pr_debug("%s local_id %d, cm_id_priv->id.state: %d\n",
  2682. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  2683. cm_id_priv->id.state);
  2684. goto out;
  2685. }
  2686. cm_id_priv->msg->context[1] = (void *) (unsigned long)
  2687. cm_id_priv->id.state;
  2688. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2689. if (!ret)
  2690. list_add_tail(&work->list, &cm_id_priv->work_list);
  2691. spin_unlock_irq(&cm_id_priv->lock);
  2692. if (ret)
  2693. cm_process_work(cm_id_priv, work);
  2694. else
  2695. cm_deref_id(cm_id_priv);
  2696. return 0;
  2697. out:
  2698. spin_unlock_irq(&cm_id_priv->lock);
  2699. cm_deref_id(cm_id_priv);
  2700. return -EINVAL;
  2701. }
  2702. static void cm_format_lap(struct cm_lap_msg *lap_msg,
  2703. struct cm_id_private *cm_id_priv,
  2704. struct sa_path_rec *alternate_path,
  2705. const void *private_data,
  2706. u8 private_data_len)
  2707. {
  2708. bool alt_ext = false;
  2709. if (alternate_path->rec_type == SA_PATH_REC_TYPE_OPA)
  2710. alt_ext = opa_is_extended_lid(alternate_path->opa.dlid,
  2711. alternate_path->opa.slid);
  2712. cm_format_mad_hdr(&lap_msg->hdr, CM_LAP_ATTR_ID,
  2713. cm_form_tid(cm_id_priv));
  2714. lap_msg->local_comm_id = cm_id_priv->id.local_id;
  2715. lap_msg->remote_comm_id = cm_id_priv->id.remote_id;
  2716. cm_lap_set_remote_qpn(lap_msg, cm_id_priv->remote_qpn);
  2717. /* todo: need remote CM response timeout */
  2718. cm_lap_set_remote_resp_timeout(lap_msg, 0x1F);
  2719. lap_msg->alt_local_lid =
  2720. htons(ntohl(sa_path_get_slid(alternate_path)));
  2721. lap_msg->alt_remote_lid =
  2722. htons(ntohl(sa_path_get_dlid(alternate_path)));
  2723. lap_msg->alt_local_gid = alternate_path->sgid;
  2724. lap_msg->alt_remote_gid = alternate_path->dgid;
  2725. if (alt_ext) {
  2726. lap_msg->alt_local_gid.global.interface_id
  2727. = OPA_MAKE_ID(be32_to_cpu(alternate_path->opa.slid));
  2728. lap_msg->alt_remote_gid.global.interface_id
  2729. = OPA_MAKE_ID(be32_to_cpu(alternate_path->opa.dlid));
  2730. }
  2731. cm_lap_set_flow_label(lap_msg, alternate_path->flow_label);
  2732. cm_lap_set_traffic_class(lap_msg, alternate_path->traffic_class);
  2733. lap_msg->alt_hop_limit = alternate_path->hop_limit;
  2734. cm_lap_set_packet_rate(lap_msg, alternate_path->rate);
  2735. cm_lap_set_sl(lap_msg, alternate_path->sl);
  2736. cm_lap_set_subnet_local(lap_msg, 1); /* local only... */
  2737. cm_lap_set_local_ack_timeout(lap_msg,
  2738. cm_ack_timeout(cm_id_priv->av.port->cm_dev->ack_delay,
  2739. alternate_path->packet_life_time));
  2740. if (private_data && private_data_len)
  2741. memcpy(lap_msg->private_data, private_data, private_data_len);
  2742. }
  2743. int ib_send_cm_lap(struct ib_cm_id *cm_id,
  2744. struct sa_path_rec *alternate_path,
  2745. const void *private_data,
  2746. u8 private_data_len)
  2747. {
  2748. struct cm_id_private *cm_id_priv;
  2749. struct ib_mad_send_buf *msg;
  2750. unsigned long flags;
  2751. int ret;
  2752. if (private_data && private_data_len > IB_CM_LAP_PRIVATE_DATA_SIZE)
  2753. return -EINVAL;
  2754. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2755. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2756. if (cm_id->state != IB_CM_ESTABLISHED ||
  2757. (cm_id->lap_state != IB_CM_LAP_UNINIT &&
  2758. cm_id->lap_state != IB_CM_LAP_IDLE)) {
  2759. ret = -EINVAL;
  2760. goto out;
  2761. }
  2762. ret = cm_init_av_by_path(alternate_path, NULL, &cm_id_priv->alt_av,
  2763. cm_id_priv);
  2764. if (ret)
  2765. goto out;
  2766. cm_id_priv->alt_av.timeout =
  2767. cm_ack_timeout(cm_id_priv->target_ack_delay,
  2768. cm_id_priv->alt_av.timeout - 1);
  2769. ret = cm_alloc_msg(cm_id_priv, &msg);
  2770. if (ret)
  2771. goto out;
  2772. cm_format_lap((struct cm_lap_msg *) msg->mad, cm_id_priv,
  2773. alternate_path, private_data, private_data_len);
  2774. msg->timeout_ms = cm_id_priv->timeout_ms;
  2775. msg->context[1] = (void *) (unsigned long) IB_CM_ESTABLISHED;
  2776. ret = ib_post_send_mad(msg, NULL);
  2777. if (ret) {
  2778. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2779. cm_free_msg(msg);
  2780. return ret;
  2781. }
  2782. cm_id->lap_state = IB_CM_LAP_SENT;
  2783. cm_id_priv->msg = msg;
  2784. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2785. return ret;
  2786. }
  2787. EXPORT_SYMBOL(ib_send_cm_lap);
  2788. static void cm_format_path_lid_from_lap(struct cm_lap_msg *lap_msg,
  2789. struct sa_path_rec *path)
  2790. {
  2791. u32 lid;
  2792. if (path->rec_type != SA_PATH_REC_TYPE_OPA) {
  2793. sa_path_set_dlid(path, ntohs(lap_msg->alt_local_lid));
  2794. sa_path_set_slid(path, ntohs(lap_msg->alt_remote_lid));
  2795. } else {
  2796. lid = opa_get_lid_from_gid(&lap_msg->alt_local_gid);
  2797. sa_path_set_dlid(path, lid);
  2798. lid = opa_get_lid_from_gid(&lap_msg->alt_remote_gid);
  2799. sa_path_set_slid(path, lid);
  2800. }
  2801. }
  2802. static void cm_format_path_from_lap(struct cm_id_private *cm_id_priv,
  2803. struct sa_path_rec *path,
  2804. struct cm_lap_msg *lap_msg)
  2805. {
  2806. path->dgid = lap_msg->alt_local_gid;
  2807. path->sgid = lap_msg->alt_remote_gid;
  2808. path->flow_label = cm_lap_get_flow_label(lap_msg);
  2809. path->hop_limit = lap_msg->alt_hop_limit;
  2810. path->traffic_class = cm_lap_get_traffic_class(lap_msg);
  2811. path->reversible = 1;
  2812. path->pkey = cm_id_priv->pkey;
  2813. path->sl = cm_lap_get_sl(lap_msg);
  2814. path->mtu_selector = IB_SA_EQ;
  2815. path->mtu = cm_id_priv->path_mtu;
  2816. path->rate_selector = IB_SA_EQ;
  2817. path->rate = cm_lap_get_packet_rate(lap_msg);
  2818. path->packet_life_time_selector = IB_SA_EQ;
  2819. path->packet_life_time = cm_lap_get_local_ack_timeout(lap_msg);
  2820. path->packet_life_time -= (path->packet_life_time > 0);
  2821. cm_format_path_lid_from_lap(lap_msg, path);
  2822. }
  2823. static int cm_lap_handler(struct cm_work *work)
  2824. {
  2825. struct cm_id_private *cm_id_priv;
  2826. struct cm_lap_msg *lap_msg;
  2827. struct ib_cm_lap_event_param *param;
  2828. struct ib_mad_send_buf *msg = NULL;
  2829. int ret;
  2830. /* Currently Alternate path messages are not supported for
  2831. * RoCE link layer.
  2832. */
  2833. if (rdma_protocol_roce(work->port->cm_dev->ib_device,
  2834. work->port->port_num))
  2835. return -EINVAL;
  2836. /* todo: verify LAP request and send reject APR if invalid. */
  2837. lap_msg = (struct cm_lap_msg *)work->mad_recv_wc->recv_buf.mad;
  2838. cm_id_priv = cm_acquire_id(lap_msg->remote_comm_id,
  2839. lap_msg->local_comm_id);
  2840. if (!cm_id_priv)
  2841. return -EINVAL;
  2842. param = &work->cm_event.param.lap_rcvd;
  2843. memset(&work->path[0], 0, sizeof(work->path[1]));
  2844. cm_path_set_rec_type(work->port->cm_dev->ib_device,
  2845. work->port->port_num,
  2846. &work->path[0],
  2847. &lap_msg->alt_local_gid);
  2848. param->alternate_path = &work->path[0];
  2849. cm_format_path_from_lap(cm_id_priv, param->alternate_path, lap_msg);
  2850. work->cm_event.private_data = &lap_msg->private_data;
  2851. spin_lock_irq(&cm_id_priv->lock);
  2852. if (cm_id_priv->id.state != IB_CM_ESTABLISHED)
  2853. goto unlock;
  2854. switch (cm_id_priv->id.lap_state) {
  2855. case IB_CM_LAP_UNINIT:
  2856. case IB_CM_LAP_IDLE:
  2857. break;
  2858. case IB_CM_MRA_LAP_SENT:
  2859. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2860. counter[CM_LAP_COUNTER]);
  2861. msg = cm_alloc_response_msg_no_ah(work->port, work->mad_recv_wc);
  2862. if (IS_ERR(msg))
  2863. goto unlock;
  2864. cm_format_mra((struct cm_mra_msg *) msg->mad, cm_id_priv,
  2865. CM_MSG_RESPONSE_OTHER,
  2866. cm_id_priv->service_timeout,
  2867. cm_id_priv->private_data,
  2868. cm_id_priv->private_data_len);
  2869. spin_unlock_irq(&cm_id_priv->lock);
  2870. if (cm_create_response_msg_ah(work->port, work->mad_recv_wc, msg) ||
  2871. ib_post_send_mad(msg, NULL))
  2872. cm_free_msg(msg);
  2873. goto deref;
  2874. case IB_CM_LAP_RCVD:
  2875. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  2876. counter[CM_LAP_COUNTER]);
  2877. goto unlock;
  2878. default:
  2879. goto unlock;
  2880. }
  2881. ret = cm_init_av_for_lap(work->port, work->mad_recv_wc->wc,
  2882. work->mad_recv_wc->recv_buf.grh,
  2883. &cm_id_priv->av);
  2884. if (ret)
  2885. goto unlock;
  2886. ret = cm_init_av_by_path(param->alternate_path, NULL,
  2887. &cm_id_priv->alt_av, cm_id_priv);
  2888. if (ret)
  2889. goto unlock;
  2890. cm_id_priv->id.lap_state = IB_CM_LAP_RCVD;
  2891. cm_id_priv->tid = lap_msg->hdr.tid;
  2892. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2893. if (!ret)
  2894. list_add_tail(&work->list, &cm_id_priv->work_list);
  2895. spin_unlock_irq(&cm_id_priv->lock);
  2896. if (ret)
  2897. cm_process_work(cm_id_priv, work);
  2898. else
  2899. cm_deref_id(cm_id_priv);
  2900. return 0;
  2901. unlock: spin_unlock_irq(&cm_id_priv->lock);
  2902. deref: cm_deref_id(cm_id_priv);
  2903. return -EINVAL;
  2904. }
  2905. static void cm_format_apr(struct cm_apr_msg *apr_msg,
  2906. struct cm_id_private *cm_id_priv,
  2907. enum ib_cm_apr_status status,
  2908. void *info,
  2909. u8 info_length,
  2910. const void *private_data,
  2911. u8 private_data_len)
  2912. {
  2913. cm_format_mad_hdr(&apr_msg->hdr, CM_APR_ATTR_ID, cm_id_priv->tid);
  2914. apr_msg->local_comm_id = cm_id_priv->id.local_id;
  2915. apr_msg->remote_comm_id = cm_id_priv->id.remote_id;
  2916. apr_msg->ap_status = (u8) status;
  2917. if (info && info_length) {
  2918. apr_msg->info_length = info_length;
  2919. memcpy(apr_msg->info, info, info_length);
  2920. }
  2921. if (private_data && private_data_len)
  2922. memcpy(apr_msg->private_data, private_data, private_data_len);
  2923. }
  2924. int ib_send_cm_apr(struct ib_cm_id *cm_id,
  2925. enum ib_cm_apr_status status,
  2926. void *info,
  2927. u8 info_length,
  2928. const void *private_data,
  2929. u8 private_data_len)
  2930. {
  2931. struct cm_id_private *cm_id_priv;
  2932. struct ib_mad_send_buf *msg;
  2933. unsigned long flags;
  2934. int ret;
  2935. if ((private_data && private_data_len > IB_CM_APR_PRIVATE_DATA_SIZE) ||
  2936. (info && info_length > IB_CM_APR_INFO_LENGTH))
  2937. return -EINVAL;
  2938. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  2939. spin_lock_irqsave(&cm_id_priv->lock, flags);
  2940. if (cm_id->state != IB_CM_ESTABLISHED ||
  2941. (cm_id->lap_state != IB_CM_LAP_RCVD &&
  2942. cm_id->lap_state != IB_CM_MRA_LAP_SENT)) {
  2943. ret = -EINVAL;
  2944. goto out;
  2945. }
  2946. ret = cm_alloc_msg(cm_id_priv, &msg);
  2947. if (ret)
  2948. goto out;
  2949. cm_format_apr((struct cm_apr_msg *) msg->mad, cm_id_priv, status,
  2950. info, info_length, private_data, private_data_len);
  2951. ret = ib_post_send_mad(msg, NULL);
  2952. if (ret) {
  2953. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2954. cm_free_msg(msg);
  2955. return ret;
  2956. }
  2957. cm_id->lap_state = IB_CM_LAP_IDLE;
  2958. out: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  2959. return ret;
  2960. }
  2961. EXPORT_SYMBOL(ib_send_cm_apr);
  2962. static int cm_apr_handler(struct cm_work *work)
  2963. {
  2964. struct cm_id_private *cm_id_priv;
  2965. struct cm_apr_msg *apr_msg;
  2966. int ret;
  2967. /* Currently Alternate path messages are not supported for
  2968. * RoCE link layer.
  2969. */
  2970. if (rdma_protocol_roce(work->port->cm_dev->ib_device,
  2971. work->port->port_num))
  2972. return -EINVAL;
  2973. apr_msg = (struct cm_apr_msg *)work->mad_recv_wc->recv_buf.mad;
  2974. cm_id_priv = cm_acquire_id(apr_msg->remote_comm_id,
  2975. apr_msg->local_comm_id);
  2976. if (!cm_id_priv)
  2977. return -EINVAL; /* Unmatched reply. */
  2978. work->cm_event.param.apr_rcvd.ap_status = apr_msg->ap_status;
  2979. work->cm_event.param.apr_rcvd.apr_info = &apr_msg->info;
  2980. work->cm_event.param.apr_rcvd.info_len = apr_msg->info_length;
  2981. work->cm_event.private_data = &apr_msg->private_data;
  2982. spin_lock_irq(&cm_id_priv->lock);
  2983. if (cm_id_priv->id.state != IB_CM_ESTABLISHED ||
  2984. (cm_id_priv->id.lap_state != IB_CM_LAP_SENT &&
  2985. cm_id_priv->id.lap_state != IB_CM_MRA_LAP_RCVD)) {
  2986. spin_unlock_irq(&cm_id_priv->lock);
  2987. goto out;
  2988. }
  2989. cm_id_priv->id.lap_state = IB_CM_LAP_IDLE;
  2990. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  2991. cm_id_priv->msg = NULL;
  2992. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  2993. if (!ret)
  2994. list_add_tail(&work->list, &cm_id_priv->work_list);
  2995. spin_unlock_irq(&cm_id_priv->lock);
  2996. if (ret)
  2997. cm_process_work(cm_id_priv, work);
  2998. else
  2999. cm_deref_id(cm_id_priv);
  3000. return 0;
  3001. out:
  3002. cm_deref_id(cm_id_priv);
  3003. return -EINVAL;
  3004. }
  3005. static int cm_timewait_handler(struct cm_work *work)
  3006. {
  3007. struct cm_timewait_info *timewait_info;
  3008. struct cm_id_private *cm_id_priv;
  3009. int ret;
  3010. timewait_info = (struct cm_timewait_info *)work;
  3011. spin_lock_irq(&cm.lock);
  3012. list_del(&timewait_info->list);
  3013. spin_unlock_irq(&cm.lock);
  3014. cm_id_priv = cm_acquire_id(timewait_info->work.local_id,
  3015. timewait_info->work.remote_id);
  3016. if (!cm_id_priv)
  3017. return -EINVAL;
  3018. spin_lock_irq(&cm_id_priv->lock);
  3019. if (cm_id_priv->id.state != IB_CM_TIMEWAIT ||
  3020. cm_id_priv->remote_qpn != timewait_info->remote_qpn) {
  3021. spin_unlock_irq(&cm_id_priv->lock);
  3022. goto out;
  3023. }
  3024. cm_id_priv->id.state = IB_CM_IDLE;
  3025. ret = atomic_inc_and_test(&cm_id_priv->work_count);
  3026. if (!ret)
  3027. list_add_tail(&work->list, &cm_id_priv->work_list);
  3028. spin_unlock_irq(&cm_id_priv->lock);
  3029. if (ret)
  3030. cm_process_work(cm_id_priv, work);
  3031. else
  3032. cm_deref_id(cm_id_priv);
  3033. return 0;
  3034. out:
  3035. cm_deref_id(cm_id_priv);
  3036. return -EINVAL;
  3037. }
  3038. static void cm_format_sidr_req(struct cm_sidr_req_msg *sidr_req_msg,
  3039. struct cm_id_private *cm_id_priv,
  3040. struct ib_cm_sidr_req_param *param)
  3041. {
  3042. cm_format_mad_hdr(&sidr_req_msg->hdr, CM_SIDR_REQ_ATTR_ID,
  3043. cm_form_tid(cm_id_priv));
  3044. sidr_req_msg->request_id = cm_id_priv->id.local_id;
  3045. sidr_req_msg->pkey = param->path->pkey;
  3046. sidr_req_msg->service_id = param->service_id;
  3047. if (param->private_data && param->private_data_len)
  3048. memcpy(sidr_req_msg->private_data, param->private_data,
  3049. param->private_data_len);
  3050. }
  3051. int ib_send_cm_sidr_req(struct ib_cm_id *cm_id,
  3052. struct ib_cm_sidr_req_param *param)
  3053. {
  3054. struct cm_id_private *cm_id_priv;
  3055. struct ib_mad_send_buf *msg;
  3056. unsigned long flags;
  3057. int ret;
  3058. if (!param->path || (param->private_data &&
  3059. param->private_data_len > IB_CM_SIDR_REQ_PRIVATE_DATA_SIZE))
  3060. return -EINVAL;
  3061. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3062. ret = cm_init_av_by_path(param->path, param->sgid_attr,
  3063. &cm_id_priv->av,
  3064. cm_id_priv);
  3065. if (ret)
  3066. goto out;
  3067. cm_id->service_id = param->service_id;
  3068. cm_id->service_mask = ~cpu_to_be64(0);
  3069. cm_id_priv->timeout_ms = param->timeout_ms;
  3070. cm_id_priv->max_cm_retries = param->max_cm_retries;
  3071. ret = cm_alloc_msg(cm_id_priv, &msg);
  3072. if (ret)
  3073. goto out;
  3074. cm_format_sidr_req((struct cm_sidr_req_msg *) msg->mad, cm_id_priv,
  3075. param);
  3076. msg->timeout_ms = cm_id_priv->timeout_ms;
  3077. msg->context[1] = (void *) (unsigned long) IB_CM_SIDR_REQ_SENT;
  3078. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3079. if (cm_id->state == IB_CM_IDLE)
  3080. ret = ib_post_send_mad(msg, NULL);
  3081. else
  3082. ret = -EINVAL;
  3083. if (ret) {
  3084. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3085. cm_free_msg(msg);
  3086. goto out;
  3087. }
  3088. cm_id->state = IB_CM_SIDR_REQ_SENT;
  3089. cm_id_priv->msg = msg;
  3090. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3091. out:
  3092. return ret;
  3093. }
  3094. EXPORT_SYMBOL(ib_send_cm_sidr_req);
  3095. static void cm_format_sidr_req_event(struct cm_work *work,
  3096. const struct cm_id_private *rx_cm_id,
  3097. struct ib_cm_id *listen_id)
  3098. {
  3099. struct cm_sidr_req_msg *sidr_req_msg;
  3100. struct ib_cm_sidr_req_event_param *param;
  3101. sidr_req_msg = (struct cm_sidr_req_msg *)
  3102. work->mad_recv_wc->recv_buf.mad;
  3103. param = &work->cm_event.param.sidr_req_rcvd;
  3104. param->pkey = __be16_to_cpu(sidr_req_msg->pkey);
  3105. param->listen_id = listen_id;
  3106. param->service_id = sidr_req_msg->service_id;
  3107. param->bth_pkey = cm_get_bth_pkey(work);
  3108. param->port = work->port->port_num;
  3109. param->sgid_attr = rx_cm_id->av.ah_attr.grh.sgid_attr;
  3110. work->cm_event.private_data = &sidr_req_msg->private_data;
  3111. }
  3112. static int cm_sidr_req_handler(struct cm_work *work)
  3113. {
  3114. struct ib_cm_id *cm_id;
  3115. struct cm_id_private *cm_id_priv, *cur_cm_id_priv;
  3116. struct cm_sidr_req_msg *sidr_req_msg;
  3117. struct ib_wc *wc;
  3118. int ret;
  3119. cm_id = ib_create_cm_id(work->port->cm_dev->ib_device, NULL, NULL);
  3120. if (IS_ERR(cm_id))
  3121. return PTR_ERR(cm_id);
  3122. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3123. /* Record SGID/SLID and request ID for lookup. */
  3124. sidr_req_msg = (struct cm_sidr_req_msg *)
  3125. work->mad_recv_wc->recv_buf.mad;
  3126. wc = work->mad_recv_wc->wc;
  3127. cm_id_priv->av.dgid.global.subnet_prefix = cpu_to_be64(wc->slid);
  3128. cm_id_priv->av.dgid.global.interface_id = 0;
  3129. ret = cm_init_av_for_response(work->port, work->mad_recv_wc->wc,
  3130. work->mad_recv_wc->recv_buf.grh,
  3131. &cm_id_priv->av);
  3132. if (ret)
  3133. goto out;
  3134. cm_id_priv->id.remote_id = sidr_req_msg->request_id;
  3135. cm_id_priv->tid = sidr_req_msg->hdr.tid;
  3136. atomic_inc(&cm_id_priv->work_count);
  3137. spin_lock_irq(&cm.lock);
  3138. cur_cm_id_priv = cm_insert_remote_sidr(cm_id_priv);
  3139. if (cur_cm_id_priv) {
  3140. spin_unlock_irq(&cm.lock);
  3141. atomic_long_inc(&work->port->counter_group[CM_RECV_DUPLICATES].
  3142. counter[CM_SIDR_REQ_COUNTER]);
  3143. goto out; /* Duplicate message. */
  3144. }
  3145. cm_id_priv->id.state = IB_CM_SIDR_REQ_RCVD;
  3146. cur_cm_id_priv = cm_find_listen(cm_id->device,
  3147. sidr_req_msg->service_id);
  3148. if (!cur_cm_id_priv) {
  3149. spin_unlock_irq(&cm.lock);
  3150. cm_reject_sidr_req(cm_id_priv, IB_SIDR_UNSUPPORTED);
  3151. goto out; /* No match. */
  3152. }
  3153. atomic_inc(&cur_cm_id_priv->refcount);
  3154. atomic_inc(&cm_id_priv->refcount);
  3155. spin_unlock_irq(&cm.lock);
  3156. cm_id_priv->id.cm_handler = cur_cm_id_priv->id.cm_handler;
  3157. cm_id_priv->id.context = cur_cm_id_priv->id.context;
  3158. cm_id_priv->id.service_id = sidr_req_msg->service_id;
  3159. cm_id_priv->id.service_mask = ~cpu_to_be64(0);
  3160. cm_format_sidr_req_event(work, cm_id_priv, &cur_cm_id_priv->id);
  3161. cm_process_work(cm_id_priv, work);
  3162. cm_deref_id(cur_cm_id_priv);
  3163. return 0;
  3164. out:
  3165. ib_destroy_cm_id(&cm_id_priv->id);
  3166. return -EINVAL;
  3167. }
  3168. static void cm_format_sidr_rep(struct cm_sidr_rep_msg *sidr_rep_msg,
  3169. struct cm_id_private *cm_id_priv,
  3170. struct ib_cm_sidr_rep_param *param)
  3171. {
  3172. cm_format_mad_hdr(&sidr_rep_msg->hdr, CM_SIDR_REP_ATTR_ID,
  3173. cm_id_priv->tid);
  3174. sidr_rep_msg->request_id = cm_id_priv->id.remote_id;
  3175. sidr_rep_msg->status = param->status;
  3176. cm_sidr_rep_set_qpn(sidr_rep_msg, cpu_to_be32(param->qp_num));
  3177. sidr_rep_msg->service_id = cm_id_priv->id.service_id;
  3178. sidr_rep_msg->qkey = cpu_to_be32(param->qkey);
  3179. if (param->info && param->info_length)
  3180. memcpy(sidr_rep_msg->info, param->info, param->info_length);
  3181. if (param->private_data && param->private_data_len)
  3182. memcpy(sidr_rep_msg->private_data, param->private_data,
  3183. param->private_data_len);
  3184. }
  3185. int ib_send_cm_sidr_rep(struct ib_cm_id *cm_id,
  3186. struct ib_cm_sidr_rep_param *param)
  3187. {
  3188. struct cm_id_private *cm_id_priv;
  3189. struct ib_mad_send_buf *msg;
  3190. unsigned long flags;
  3191. int ret;
  3192. if ((param->info && param->info_length > IB_CM_SIDR_REP_INFO_LENGTH) ||
  3193. (param->private_data &&
  3194. param->private_data_len > IB_CM_SIDR_REP_PRIVATE_DATA_SIZE))
  3195. return -EINVAL;
  3196. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3197. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3198. if (cm_id->state != IB_CM_SIDR_REQ_RCVD) {
  3199. ret = -EINVAL;
  3200. goto error;
  3201. }
  3202. ret = cm_alloc_msg(cm_id_priv, &msg);
  3203. if (ret)
  3204. goto error;
  3205. cm_format_sidr_rep((struct cm_sidr_rep_msg *) msg->mad, cm_id_priv,
  3206. param);
  3207. ret = ib_post_send_mad(msg, NULL);
  3208. if (ret) {
  3209. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3210. cm_free_msg(msg);
  3211. return ret;
  3212. }
  3213. cm_id->state = IB_CM_IDLE;
  3214. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3215. spin_lock_irqsave(&cm.lock, flags);
  3216. if (!RB_EMPTY_NODE(&cm_id_priv->sidr_id_node)) {
  3217. rb_erase(&cm_id_priv->sidr_id_node, &cm.remote_sidr_table);
  3218. RB_CLEAR_NODE(&cm_id_priv->sidr_id_node);
  3219. }
  3220. spin_unlock_irqrestore(&cm.lock, flags);
  3221. return 0;
  3222. error: spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3223. return ret;
  3224. }
  3225. EXPORT_SYMBOL(ib_send_cm_sidr_rep);
  3226. static void cm_format_sidr_rep_event(struct cm_work *work,
  3227. const struct cm_id_private *cm_id_priv)
  3228. {
  3229. struct cm_sidr_rep_msg *sidr_rep_msg;
  3230. struct ib_cm_sidr_rep_event_param *param;
  3231. sidr_rep_msg = (struct cm_sidr_rep_msg *)
  3232. work->mad_recv_wc->recv_buf.mad;
  3233. param = &work->cm_event.param.sidr_rep_rcvd;
  3234. param->status = sidr_rep_msg->status;
  3235. param->qkey = be32_to_cpu(sidr_rep_msg->qkey);
  3236. param->qpn = be32_to_cpu(cm_sidr_rep_get_qpn(sidr_rep_msg));
  3237. param->info = &sidr_rep_msg->info;
  3238. param->info_len = sidr_rep_msg->info_length;
  3239. param->sgid_attr = cm_id_priv->av.ah_attr.grh.sgid_attr;
  3240. work->cm_event.private_data = &sidr_rep_msg->private_data;
  3241. }
  3242. static int cm_sidr_rep_handler(struct cm_work *work)
  3243. {
  3244. struct cm_sidr_rep_msg *sidr_rep_msg;
  3245. struct cm_id_private *cm_id_priv;
  3246. sidr_rep_msg = (struct cm_sidr_rep_msg *)
  3247. work->mad_recv_wc->recv_buf.mad;
  3248. cm_id_priv = cm_acquire_id(sidr_rep_msg->request_id, 0);
  3249. if (!cm_id_priv)
  3250. return -EINVAL; /* Unmatched reply. */
  3251. spin_lock_irq(&cm_id_priv->lock);
  3252. if (cm_id_priv->id.state != IB_CM_SIDR_REQ_SENT) {
  3253. spin_unlock_irq(&cm_id_priv->lock);
  3254. goto out;
  3255. }
  3256. cm_id_priv->id.state = IB_CM_IDLE;
  3257. ib_cancel_mad(cm_id_priv->av.port->mad_agent, cm_id_priv->msg);
  3258. spin_unlock_irq(&cm_id_priv->lock);
  3259. cm_format_sidr_rep_event(work, cm_id_priv);
  3260. cm_process_work(cm_id_priv, work);
  3261. return 0;
  3262. out:
  3263. cm_deref_id(cm_id_priv);
  3264. return -EINVAL;
  3265. }
  3266. static void cm_process_send_error(struct ib_mad_send_buf *msg,
  3267. enum ib_wc_status wc_status)
  3268. {
  3269. struct cm_id_private *cm_id_priv;
  3270. struct ib_cm_event cm_event;
  3271. enum ib_cm_state state;
  3272. int ret;
  3273. memset(&cm_event, 0, sizeof cm_event);
  3274. cm_id_priv = msg->context[0];
  3275. /* Discard old sends or ones without a response. */
  3276. spin_lock_irq(&cm_id_priv->lock);
  3277. state = (enum ib_cm_state) (unsigned long) msg->context[1];
  3278. if (msg != cm_id_priv->msg || state != cm_id_priv->id.state)
  3279. goto discard;
  3280. pr_debug_ratelimited("CM: failed sending MAD in state %d. (%s)\n",
  3281. state, ib_wc_status_msg(wc_status));
  3282. switch (state) {
  3283. case IB_CM_REQ_SENT:
  3284. case IB_CM_MRA_REQ_RCVD:
  3285. cm_reset_to_idle(cm_id_priv);
  3286. cm_event.event = IB_CM_REQ_ERROR;
  3287. break;
  3288. case IB_CM_REP_SENT:
  3289. case IB_CM_MRA_REP_RCVD:
  3290. cm_reset_to_idle(cm_id_priv);
  3291. cm_event.event = IB_CM_REP_ERROR;
  3292. break;
  3293. case IB_CM_DREQ_SENT:
  3294. cm_enter_timewait(cm_id_priv);
  3295. cm_event.event = IB_CM_DREQ_ERROR;
  3296. break;
  3297. case IB_CM_SIDR_REQ_SENT:
  3298. cm_id_priv->id.state = IB_CM_IDLE;
  3299. cm_event.event = IB_CM_SIDR_REQ_ERROR;
  3300. break;
  3301. default:
  3302. goto discard;
  3303. }
  3304. spin_unlock_irq(&cm_id_priv->lock);
  3305. cm_event.param.send_status = wc_status;
  3306. /* No other events can occur on the cm_id at this point. */
  3307. ret = cm_id_priv->id.cm_handler(&cm_id_priv->id, &cm_event);
  3308. cm_free_msg(msg);
  3309. if (ret)
  3310. ib_destroy_cm_id(&cm_id_priv->id);
  3311. return;
  3312. discard:
  3313. spin_unlock_irq(&cm_id_priv->lock);
  3314. cm_free_msg(msg);
  3315. }
  3316. static void cm_send_handler(struct ib_mad_agent *mad_agent,
  3317. struct ib_mad_send_wc *mad_send_wc)
  3318. {
  3319. struct ib_mad_send_buf *msg = mad_send_wc->send_buf;
  3320. struct cm_port *port;
  3321. u16 attr_index;
  3322. port = mad_agent->context;
  3323. attr_index = be16_to_cpu(((struct ib_mad_hdr *)
  3324. msg->mad)->attr_id) - CM_ATTR_ID_OFFSET;
  3325. /*
  3326. * If the send was in response to a received message (context[0] is not
  3327. * set to a cm_id), and is not a REJ, then it is a send that was
  3328. * manually retried.
  3329. */
  3330. if (!msg->context[0] && (attr_index != CM_REJ_COUNTER))
  3331. msg->retries = 1;
  3332. atomic_long_add(1 + msg->retries,
  3333. &port->counter_group[CM_XMIT].counter[attr_index]);
  3334. if (msg->retries)
  3335. atomic_long_add(msg->retries,
  3336. &port->counter_group[CM_XMIT_RETRIES].
  3337. counter[attr_index]);
  3338. switch (mad_send_wc->status) {
  3339. case IB_WC_SUCCESS:
  3340. case IB_WC_WR_FLUSH_ERR:
  3341. cm_free_msg(msg);
  3342. break;
  3343. default:
  3344. if (msg->context[0] && msg->context[1])
  3345. cm_process_send_error(msg, mad_send_wc->status);
  3346. else
  3347. cm_free_msg(msg);
  3348. break;
  3349. }
  3350. }
  3351. static void cm_work_handler(struct work_struct *_work)
  3352. {
  3353. struct cm_work *work = container_of(_work, struct cm_work, work.work);
  3354. int ret;
  3355. switch (work->cm_event.event) {
  3356. case IB_CM_REQ_RECEIVED:
  3357. ret = cm_req_handler(work);
  3358. break;
  3359. case IB_CM_MRA_RECEIVED:
  3360. ret = cm_mra_handler(work);
  3361. break;
  3362. case IB_CM_REJ_RECEIVED:
  3363. ret = cm_rej_handler(work);
  3364. break;
  3365. case IB_CM_REP_RECEIVED:
  3366. ret = cm_rep_handler(work);
  3367. break;
  3368. case IB_CM_RTU_RECEIVED:
  3369. ret = cm_rtu_handler(work);
  3370. break;
  3371. case IB_CM_USER_ESTABLISHED:
  3372. ret = cm_establish_handler(work);
  3373. break;
  3374. case IB_CM_DREQ_RECEIVED:
  3375. ret = cm_dreq_handler(work);
  3376. break;
  3377. case IB_CM_DREP_RECEIVED:
  3378. ret = cm_drep_handler(work);
  3379. break;
  3380. case IB_CM_SIDR_REQ_RECEIVED:
  3381. ret = cm_sidr_req_handler(work);
  3382. break;
  3383. case IB_CM_SIDR_REP_RECEIVED:
  3384. ret = cm_sidr_rep_handler(work);
  3385. break;
  3386. case IB_CM_LAP_RECEIVED:
  3387. ret = cm_lap_handler(work);
  3388. break;
  3389. case IB_CM_APR_RECEIVED:
  3390. ret = cm_apr_handler(work);
  3391. break;
  3392. case IB_CM_TIMEWAIT_EXIT:
  3393. ret = cm_timewait_handler(work);
  3394. break;
  3395. default:
  3396. pr_debug("cm_event.event: 0x%x\n", work->cm_event.event);
  3397. ret = -EINVAL;
  3398. break;
  3399. }
  3400. if (ret)
  3401. cm_free_work(work);
  3402. }
  3403. static int cm_establish(struct ib_cm_id *cm_id)
  3404. {
  3405. struct cm_id_private *cm_id_priv;
  3406. struct cm_work *work;
  3407. unsigned long flags;
  3408. int ret = 0;
  3409. struct cm_device *cm_dev;
  3410. cm_dev = ib_get_client_data(cm_id->device, &cm_client);
  3411. if (!cm_dev)
  3412. return -ENODEV;
  3413. work = kmalloc(sizeof *work, GFP_ATOMIC);
  3414. if (!work)
  3415. return -ENOMEM;
  3416. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3417. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3418. switch (cm_id->state)
  3419. {
  3420. case IB_CM_REP_SENT:
  3421. case IB_CM_MRA_REP_RCVD:
  3422. cm_id->state = IB_CM_ESTABLISHED;
  3423. break;
  3424. case IB_CM_ESTABLISHED:
  3425. ret = -EISCONN;
  3426. break;
  3427. default:
  3428. pr_debug("%s: local_id %d, cm_id->state: %d\n", __func__,
  3429. be32_to_cpu(cm_id->local_id), cm_id->state);
  3430. ret = -EINVAL;
  3431. break;
  3432. }
  3433. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3434. if (ret) {
  3435. kfree(work);
  3436. goto out;
  3437. }
  3438. /*
  3439. * The CM worker thread may try to destroy the cm_id before it
  3440. * can execute this work item. To prevent potential deadlock,
  3441. * we need to find the cm_id once we're in the context of the
  3442. * worker thread, rather than holding a reference on it.
  3443. */
  3444. INIT_DELAYED_WORK(&work->work, cm_work_handler);
  3445. work->local_id = cm_id->local_id;
  3446. work->remote_id = cm_id->remote_id;
  3447. work->mad_recv_wc = NULL;
  3448. work->cm_event.event = IB_CM_USER_ESTABLISHED;
  3449. /* Check if the device started its remove_one */
  3450. spin_lock_irqsave(&cm.lock, flags);
  3451. if (!cm_dev->going_down) {
  3452. queue_delayed_work(cm.wq, &work->work, 0);
  3453. } else {
  3454. kfree(work);
  3455. ret = -ENODEV;
  3456. }
  3457. spin_unlock_irqrestore(&cm.lock, flags);
  3458. out:
  3459. return ret;
  3460. }
  3461. static int cm_migrate(struct ib_cm_id *cm_id)
  3462. {
  3463. struct cm_id_private *cm_id_priv;
  3464. struct cm_av tmp_av;
  3465. unsigned long flags;
  3466. int tmp_send_port_not_ready;
  3467. int ret = 0;
  3468. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3469. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3470. if (cm_id->state == IB_CM_ESTABLISHED &&
  3471. (cm_id->lap_state == IB_CM_LAP_UNINIT ||
  3472. cm_id->lap_state == IB_CM_LAP_IDLE)) {
  3473. cm_id->lap_state = IB_CM_LAP_IDLE;
  3474. /* Swap address vector */
  3475. tmp_av = cm_id_priv->av;
  3476. cm_id_priv->av = cm_id_priv->alt_av;
  3477. cm_id_priv->alt_av = tmp_av;
  3478. /* Swap port send ready state */
  3479. tmp_send_port_not_ready = cm_id_priv->prim_send_port_not_ready;
  3480. cm_id_priv->prim_send_port_not_ready = cm_id_priv->altr_send_port_not_ready;
  3481. cm_id_priv->altr_send_port_not_ready = tmp_send_port_not_ready;
  3482. } else
  3483. ret = -EINVAL;
  3484. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3485. return ret;
  3486. }
  3487. int ib_cm_notify(struct ib_cm_id *cm_id, enum ib_event_type event)
  3488. {
  3489. int ret;
  3490. switch (event) {
  3491. case IB_EVENT_COMM_EST:
  3492. ret = cm_establish(cm_id);
  3493. break;
  3494. case IB_EVENT_PATH_MIG:
  3495. ret = cm_migrate(cm_id);
  3496. break;
  3497. default:
  3498. ret = -EINVAL;
  3499. }
  3500. return ret;
  3501. }
  3502. EXPORT_SYMBOL(ib_cm_notify);
  3503. static void cm_recv_handler(struct ib_mad_agent *mad_agent,
  3504. struct ib_mad_send_buf *send_buf,
  3505. struct ib_mad_recv_wc *mad_recv_wc)
  3506. {
  3507. struct cm_port *port = mad_agent->context;
  3508. struct cm_work *work;
  3509. enum ib_cm_event_type event;
  3510. bool alt_path = false;
  3511. u16 attr_id;
  3512. int paths = 0;
  3513. int going_down = 0;
  3514. switch (mad_recv_wc->recv_buf.mad->mad_hdr.attr_id) {
  3515. case CM_REQ_ATTR_ID:
  3516. alt_path = cm_req_has_alt_path((struct cm_req_msg *)
  3517. mad_recv_wc->recv_buf.mad);
  3518. paths = 1 + (alt_path != 0);
  3519. event = IB_CM_REQ_RECEIVED;
  3520. break;
  3521. case CM_MRA_ATTR_ID:
  3522. event = IB_CM_MRA_RECEIVED;
  3523. break;
  3524. case CM_REJ_ATTR_ID:
  3525. event = IB_CM_REJ_RECEIVED;
  3526. break;
  3527. case CM_REP_ATTR_ID:
  3528. event = IB_CM_REP_RECEIVED;
  3529. break;
  3530. case CM_RTU_ATTR_ID:
  3531. event = IB_CM_RTU_RECEIVED;
  3532. break;
  3533. case CM_DREQ_ATTR_ID:
  3534. event = IB_CM_DREQ_RECEIVED;
  3535. break;
  3536. case CM_DREP_ATTR_ID:
  3537. event = IB_CM_DREP_RECEIVED;
  3538. break;
  3539. case CM_SIDR_REQ_ATTR_ID:
  3540. event = IB_CM_SIDR_REQ_RECEIVED;
  3541. break;
  3542. case CM_SIDR_REP_ATTR_ID:
  3543. event = IB_CM_SIDR_REP_RECEIVED;
  3544. break;
  3545. case CM_LAP_ATTR_ID:
  3546. paths = 1;
  3547. event = IB_CM_LAP_RECEIVED;
  3548. break;
  3549. case CM_APR_ATTR_ID:
  3550. event = IB_CM_APR_RECEIVED;
  3551. break;
  3552. default:
  3553. ib_free_recv_mad(mad_recv_wc);
  3554. return;
  3555. }
  3556. attr_id = be16_to_cpu(mad_recv_wc->recv_buf.mad->mad_hdr.attr_id);
  3557. atomic_long_inc(&port->counter_group[CM_RECV].
  3558. counter[attr_id - CM_ATTR_ID_OFFSET]);
  3559. work = kmalloc(sizeof(*work) + sizeof(struct sa_path_rec) * paths,
  3560. GFP_KERNEL);
  3561. if (!work) {
  3562. ib_free_recv_mad(mad_recv_wc);
  3563. return;
  3564. }
  3565. INIT_DELAYED_WORK(&work->work, cm_work_handler);
  3566. work->cm_event.event = event;
  3567. work->mad_recv_wc = mad_recv_wc;
  3568. work->port = port;
  3569. /* Check if the device started its remove_one */
  3570. spin_lock_irq(&cm.lock);
  3571. if (!port->cm_dev->going_down)
  3572. queue_delayed_work(cm.wq, &work->work, 0);
  3573. else
  3574. going_down = 1;
  3575. spin_unlock_irq(&cm.lock);
  3576. if (going_down) {
  3577. kfree(work);
  3578. ib_free_recv_mad(mad_recv_wc);
  3579. }
  3580. }
  3581. static int cm_init_qp_init_attr(struct cm_id_private *cm_id_priv,
  3582. struct ib_qp_attr *qp_attr,
  3583. int *qp_attr_mask)
  3584. {
  3585. unsigned long flags;
  3586. int ret;
  3587. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3588. switch (cm_id_priv->id.state) {
  3589. case IB_CM_REQ_SENT:
  3590. case IB_CM_MRA_REQ_RCVD:
  3591. case IB_CM_REQ_RCVD:
  3592. case IB_CM_MRA_REQ_SENT:
  3593. case IB_CM_REP_RCVD:
  3594. case IB_CM_MRA_REP_SENT:
  3595. case IB_CM_REP_SENT:
  3596. case IB_CM_MRA_REP_RCVD:
  3597. case IB_CM_ESTABLISHED:
  3598. *qp_attr_mask = IB_QP_STATE | IB_QP_ACCESS_FLAGS |
  3599. IB_QP_PKEY_INDEX | IB_QP_PORT;
  3600. qp_attr->qp_access_flags = IB_ACCESS_REMOTE_WRITE;
  3601. if (cm_id_priv->responder_resources)
  3602. qp_attr->qp_access_flags |= IB_ACCESS_REMOTE_READ |
  3603. IB_ACCESS_REMOTE_ATOMIC;
  3604. qp_attr->pkey_index = cm_id_priv->av.pkey_index;
  3605. qp_attr->port_num = cm_id_priv->av.port->port_num;
  3606. ret = 0;
  3607. break;
  3608. default:
  3609. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  3610. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  3611. cm_id_priv->id.state);
  3612. ret = -EINVAL;
  3613. break;
  3614. }
  3615. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3616. return ret;
  3617. }
  3618. static int cm_init_qp_rtr_attr(struct cm_id_private *cm_id_priv,
  3619. struct ib_qp_attr *qp_attr,
  3620. int *qp_attr_mask)
  3621. {
  3622. unsigned long flags;
  3623. int ret;
  3624. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3625. switch (cm_id_priv->id.state) {
  3626. case IB_CM_REQ_RCVD:
  3627. case IB_CM_MRA_REQ_SENT:
  3628. case IB_CM_REP_RCVD:
  3629. case IB_CM_MRA_REP_SENT:
  3630. case IB_CM_REP_SENT:
  3631. case IB_CM_MRA_REP_RCVD:
  3632. case IB_CM_ESTABLISHED:
  3633. *qp_attr_mask = IB_QP_STATE | IB_QP_AV | IB_QP_PATH_MTU |
  3634. IB_QP_DEST_QPN | IB_QP_RQ_PSN;
  3635. qp_attr->ah_attr = cm_id_priv->av.ah_attr;
  3636. qp_attr->path_mtu = cm_id_priv->path_mtu;
  3637. qp_attr->dest_qp_num = be32_to_cpu(cm_id_priv->remote_qpn);
  3638. qp_attr->rq_psn = be32_to_cpu(cm_id_priv->rq_psn);
  3639. if (cm_id_priv->qp_type == IB_QPT_RC ||
  3640. cm_id_priv->qp_type == IB_QPT_XRC_TGT) {
  3641. *qp_attr_mask |= IB_QP_MAX_DEST_RD_ATOMIC |
  3642. IB_QP_MIN_RNR_TIMER;
  3643. qp_attr->max_dest_rd_atomic =
  3644. cm_id_priv->responder_resources;
  3645. qp_attr->min_rnr_timer = 0;
  3646. }
  3647. if (rdma_ah_get_dlid(&cm_id_priv->alt_av.ah_attr)) {
  3648. *qp_attr_mask |= IB_QP_ALT_PATH;
  3649. qp_attr->alt_port_num = cm_id_priv->alt_av.port->port_num;
  3650. qp_attr->alt_pkey_index = cm_id_priv->alt_av.pkey_index;
  3651. qp_attr->alt_timeout = cm_id_priv->alt_av.timeout;
  3652. qp_attr->alt_ah_attr = cm_id_priv->alt_av.ah_attr;
  3653. }
  3654. ret = 0;
  3655. break;
  3656. default:
  3657. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  3658. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  3659. cm_id_priv->id.state);
  3660. ret = -EINVAL;
  3661. break;
  3662. }
  3663. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3664. return ret;
  3665. }
  3666. static int cm_init_qp_rts_attr(struct cm_id_private *cm_id_priv,
  3667. struct ib_qp_attr *qp_attr,
  3668. int *qp_attr_mask)
  3669. {
  3670. unsigned long flags;
  3671. int ret;
  3672. spin_lock_irqsave(&cm_id_priv->lock, flags);
  3673. switch (cm_id_priv->id.state) {
  3674. /* Allow transition to RTS before sending REP */
  3675. case IB_CM_REQ_RCVD:
  3676. case IB_CM_MRA_REQ_SENT:
  3677. case IB_CM_REP_RCVD:
  3678. case IB_CM_MRA_REP_SENT:
  3679. case IB_CM_REP_SENT:
  3680. case IB_CM_MRA_REP_RCVD:
  3681. case IB_CM_ESTABLISHED:
  3682. if (cm_id_priv->id.lap_state == IB_CM_LAP_UNINIT) {
  3683. *qp_attr_mask = IB_QP_STATE | IB_QP_SQ_PSN;
  3684. qp_attr->sq_psn = be32_to_cpu(cm_id_priv->sq_psn);
  3685. switch (cm_id_priv->qp_type) {
  3686. case IB_QPT_RC:
  3687. case IB_QPT_XRC_INI:
  3688. *qp_attr_mask |= IB_QP_RETRY_CNT | IB_QP_RNR_RETRY |
  3689. IB_QP_MAX_QP_RD_ATOMIC;
  3690. qp_attr->retry_cnt = cm_id_priv->retry_count;
  3691. qp_attr->rnr_retry = cm_id_priv->rnr_retry_count;
  3692. qp_attr->max_rd_atomic = cm_id_priv->initiator_depth;
  3693. /* fall through */
  3694. case IB_QPT_XRC_TGT:
  3695. *qp_attr_mask |= IB_QP_TIMEOUT;
  3696. qp_attr->timeout = cm_id_priv->av.timeout;
  3697. break;
  3698. default:
  3699. break;
  3700. }
  3701. if (rdma_ah_get_dlid(&cm_id_priv->alt_av.ah_attr)) {
  3702. *qp_attr_mask |= IB_QP_PATH_MIG_STATE;
  3703. qp_attr->path_mig_state = IB_MIG_REARM;
  3704. }
  3705. } else {
  3706. *qp_attr_mask = IB_QP_ALT_PATH | IB_QP_PATH_MIG_STATE;
  3707. qp_attr->alt_port_num = cm_id_priv->alt_av.port->port_num;
  3708. qp_attr->alt_pkey_index = cm_id_priv->alt_av.pkey_index;
  3709. qp_attr->alt_timeout = cm_id_priv->alt_av.timeout;
  3710. qp_attr->alt_ah_attr = cm_id_priv->alt_av.ah_attr;
  3711. qp_attr->path_mig_state = IB_MIG_REARM;
  3712. }
  3713. ret = 0;
  3714. break;
  3715. default:
  3716. pr_debug("%s: local_id %d, cm_id_priv->id.state: %d\n",
  3717. __func__, be32_to_cpu(cm_id_priv->id.local_id),
  3718. cm_id_priv->id.state);
  3719. ret = -EINVAL;
  3720. break;
  3721. }
  3722. spin_unlock_irqrestore(&cm_id_priv->lock, flags);
  3723. return ret;
  3724. }
  3725. int ib_cm_init_qp_attr(struct ib_cm_id *cm_id,
  3726. struct ib_qp_attr *qp_attr,
  3727. int *qp_attr_mask)
  3728. {
  3729. struct cm_id_private *cm_id_priv;
  3730. int ret;
  3731. cm_id_priv = container_of(cm_id, struct cm_id_private, id);
  3732. switch (qp_attr->qp_state) {
  3733. case IB_QPS_INIT:
  3734. ret = cm_init_qp_init_attr(cm_id_priv, qp_attr, qp_attr_mask);
  3735. break;
  3736. case IB_QPS_RTR:
  3737. ret = cm_init_qp_rtr_attr(cm_id_priv, qp_attr, qp_attr_mask);
  3738. break;
  3739. case IB_QPS_RTS:
  3740. ret = cm_init_qp_rts_attr(cm_id_priv, qp_attr, qp_attr_mask);
  3741. break;
  3742. default:
  3743. ret = -EINVAL;
  3744. break;
  3745. }
  3746. return ret;
  3747. }
  3748. EXPORT_SYMBOL(ib_cm_init_qp_attr);
  3749. static ssize_t cm_show_counter(struct kobject *obj, struct attribute *attr,
  3750. char *buf)
  3751. {
  3752. struct cm_counter_group *group;
  3753. struct cm_counter_attribute *cm_attr;
  3754. group = container_of(obj, struct cm_counter_group, obj);
  3755. cm_attr = container_of(attr, struct cm_counter_attribute, attr);
  3756. return sprintf(buf, "%ld\n",
  3757. atomic_long_read(&group->counter[cm_attr->index]));
  3758. }
  3759. static const struct sysfs_ops cm_counter_ops = {
  3760. .show = cm_show_counter
  3761. };
  3762. static struct kobj_type cm_counter_obj_type = {
  3763. .sysfs_ops = &cm_counter_ops,
  3764. .default_attrs = cm_counter_default_attrs
  3765. };
  3766. static void cm_release_port_obj(struct kobject *obj)
  3767. {
  3768. struct cm_port *cm_port;
  3769. cm_port = container_of(obj, struct cm_port, port_obj);
  3770. kfree(cm_port);
  3771. }
  3772. static struct kobj_type cm_port_obj_type = {
  3773. .release = cm_release_port_obj
  3774. };
  3775. static char *cm_devnode(struct device *dev, umode_t *mode)
  3776. {
  3777. if (mode)
  3778. *mode = 0666;
  3779. return kasprintf(GFP_KERNEL, "infiniband/%s", dev_name(dev));
  3780. }
  3781. struct class cm_class = {
  3782. .owner = THIS_MODULE,
  3783. .name = "infiniband_cm",
  3784. .devnode = cm_devnode,
  3785. };
  3786. EXPORT_SYMBOL(cm_class);
  3787. static int cm_create_port_fs(struct cm_port *port)
  3788. {
  3789. int i, ret;
  3790. ret = kobject_init_and_add(&port->port_obj, &cm_port_obj_type,
  3791. &port->cm_dev->device->kobj,
  3792. "%d", port->port_num);
  3793. if (ret) {
  3794. kfree(port);
  3795. return ret;
  3796. }
  3797. for (i = 0; i < CM_COUNTER_GROUPS; i++) {
  3798. ret = kobject_init_and_add(&port->counter_group[i].obj,
  3799. &cm_counter_obj_type,
  3800. &port->port_obj,
  3801. "%s", counter_group_names[i]);
  3802. if (ret)
  3803. goto error;
  3804. }
  3805. return 0;
  3806. error:
  3807. while (i--)
  3808. kobject_put(&port->counter_group[i].obj);
  3809. kobject_put(&port->port_obj);
  3810. return ret;
  3811. }
  3812. static void cm_remove_port_fs(struct cm_port *port)
  3813. {
  3814. int i;
  3815. for (i = 0; i < CM_COUNTER_GROUPS; i++)
  3816. kobject_put(&port->counter_group[i].obj);
  3817. kobject_put(&port->port_obj);
  3818. }
  3819. static void cm_add_one(struct ib_device *ib_device)
  3820. {
  3821. struct cm_device *cm_dev;
  3822. struct cm_port *port;
  3823. struct ib_mad_reg_req reg_req = {
  3824. .mgmt_class = IB_MGMT_CLASS_CM,
  3825. .mgmt_class_version = IB_CM_CLASS_VERSION,
  3826. };
  3827. struct ib_port_modify port_modify = {
  3828. .set_port_cap_mask = IB_PORT_CM_SUP
  3829. };
  3830. unsigned long flags;
  3831. int ret;
  3832. int count = 0;
  3833. u8 i;
  3834. cm_dev = kzalloc(struct_size(cm_dev, port, ib_device->phys_port_cnt),
  3835. GFP_KERNEL);
  3836. if (!cm_dev)
  3837. return;
  3838. cm_dev->ib_device = ib_device;
  3839. cm_dev->ack_delay = ib_device->attrs.local_ca_ack_delay;
  3840. cm_dev->going_down = 0;
  3841. cm_dev->device = device_create(&cm_class, &ib_device->dev,
  3842. MKDEV(0, 0), NULL,
  3843. "%s", ib_device->name);
  3844. if (IS_ERR(cm_dev->device)) {
  3845. kfree(cm_dev);
  3846. return;
  3847. }
  3848. set_bit(IB_MGMT_METHOD_SEND, reg_req.method_mask);
  3849. for (i = 1; i <= ib_device->phys_port_cnt; i++) {
  3850. if (!rdma_cap_ib_cm(ib_device, i))
  3851. continue;
  3852. port = kzalloc(sizeof *port, GFP_KERNEL);
  3853. if (!port)
  3854. goto error1;
  3855. cm_dev->port[i-1] = port;
  3856. port->cm_dev = cm_dev;
  3857. port->port_num = i;
  3858. INIT_LIST_HEAD(&port->cm_priv_prim_list);
  3859. INIT_LIST_HEAD(&port->cm_priv_altr_list);
  3860. ret = cm_create_port_fs(port);
  3861. if (ret)
  3862. goto error1;
  3863. port->mad_agent = ib_register_mad_agent(ib_device, i,
  3864. IB_QPT_GSI,
  3865. &reg_req,
  3866. 0,
  3867. cm_send_handler,
  3868. cm_recv_handler,
  3869. port,
  3870. 0);
  3871. if (IS_ERR(port->mad_agent))
  3872. goto error2;
  3873. ret = ib_modify_port(ib_device, i, 0, &port_modify);
  3874. if (ret)
  3875. goto error3;
  3876. count++;
  3877. }
  3878. if (!count)
  3879. goto free;
  3880. ib_set_client_data(ib_device, &cm_client, cm_dev);
  3881. write_lock_irqsave(&cm.device_lock, flags);
  3882. list_add_tail(&cm_dev->list, &cm.device_list);
  3883. write_unlock_irqrestore(&cm.device_lock, flags);
  3884. return;
  3885. error3:
  3886. ib_unregister_mad_agent(port->mad_agent);
  3887. error2:
  3888. cm_remove_port_fs(port);
  3889. error1:
  3890. port_modify.set_port_cap_mask = 0;
  3891. port_modify.clr_port_cap_mask = IB_PORT_CM_SUP;
  3892. while (--i) {
  3893. if (!rdma_cap_ib_cm(ib_device, i))
  3894. continue;
  3895. port = cm_dev->port[i-1];
  3896. ib_modify_port(ib_device, port->port_num, 0, &port_modify);
  3897. ib_unregister_mad_agent(port->mad_agent);
  3898. cm_remove_port_fs(port);
  3899. }
  3900. free:
  3901. device_unregister(cm_dev->device);
  3902. kfree(cm_dev);
  3903. }
  3904. static void cm_remove_one(struct ib_device *ib_device, void *client_data)
  3905. {
  3906. struct cm_device *cm_dev = client_data;
  3907. struct cm_port *port;
  3908. struct cm_id_private *cm_id_priv;
  3909. struct ib_mad_agent *cur_mad_agent;
  3910. struct ib_port_modify port_modify = {
  3911. .clr_port_cap_mask = IB_PORT_CM_SUP
  3912. };
  3913. unsigned long flags;
  3914. int i;
  3915. if (!cm_dev)
  3916. return;
  3917. write_lock_irqsave(&cm.device_lock, flags);
  3918. list_del(&cm_dev->list);
  3919. write_unlock_irqrestore(&cm.device_lock, flags);
  3920. spin_lock_irq(&cm.lock);
  3921. cm_dev->going_down = 1;
  3922. spin_unlock_irq(&cm.lock);
  3923. for (i = 1; i <= ib_device->phys_port_cnt; i++) {
  3924. if (!rdma_cap_ib_cm(ib_device, i))
  3925. continue;
  3926. port = cm_dev->port[i-1];
  3927. ib_modify_port(ib_device, port->port_num, 0, &port_modify);
  3928. /* Mark all the cm_id's as not valid */
  3929. spin_lock_irq(&cm.lock);
  3930. list_for_each_entry(cm_id_priv, &port->cm_priv_altr_list, altr_list)
  3931. cm_id_priv->altr_send_port_not_ready = 1;
  3932. list_for_each_entry(cm_id_priv, &port->cm_priv_prim_list, prim_list)
  3933. cm_id_priv->prim_send_port_not_ready = 1;
  3934. spin_unlock_irq(&cm.lock);
  3935. /*
  3936. * We flush the queue here after the going_down set, this
  3937. * verify that no new works will be queued in the recv handler,
  3938. * after that we can call the unregister_mad_agent
  3939. */
  3940. flush_workqueue(cm.wq);
  3941. spin_lock_irq(&cm.state_lock);
  3942. cur_mad_agent = port->mad_agent;
  3943. port->mad_agent = NULL;
  3944. spin_unlock_irq(&cm.state_lock);
  3945. ib_unregister_mad_agent(cur_mad_agent);
  3946. cm_remove_port_fs(port);
  3947. }
  3948. device_unregister(cm_dev->device);
  3949. kfree(cm_dev);
  3950. }
  3951. static int __init ib_cm_init(void)
  3952. {
  3953. int ret;
  3954. memset(&cm, 0, sizeof cm);
  3955. INIT_LIST_HEAD(&cm.device_list);
  3956. rwlock_init(&cm.device_lock);
  3957. spin_lock_init(&cm.lock);
  3958. spin_lock_init(&cm.state_lock);
  3959. cm.listen_service_table = RB_ROOT;
  3960. cm.listen_service_id = be64_to_cpu(IB_CM_ASSIGN_SERVICE_ID);
  3961. cm.remote_id_table = RB_ROOT;
  3962. cm.remote_qp_table = RB_ROOT;
  3963. cm.remote_sidr_table = RB_ROOT;
  3964. idr_init(&cm.local_id_table);
  3965. get_random_bytes(&cm.random_id_operand, sizeof cm.random_id_operand);
  3966. INIT_LIST_HEAD(&cm.timewait_list);
  3967. ret = class_register(&cm_class);
  3968. if (ret) {
  3969. ret = -ENOMEM;
  3970. goto error1;
  3971. }
  3972. cm.wq = alloc_workqueue("ib_cm", 0, 1);
  3973. if (!cm.wq) {
  3974. ret = -ENOMEM;
  3975. goto error2;
  3976. }
  3977. ret = ib_register_client(&cm_client);
  3978. if (ret)
  3979. goto error3;
  3980. return 0;
  3981. error3:
  3982. destroy_workqueue(cm.wq);
  3983. error2:
  3984. class_unregister(&cm_class);
  3985. error1:
  3986. idr_destroy(&cm.local_id_table);
  3987. return ret;
  3988. }
  3989. static void __exit ib_cm_cleanup(void)
  3990. {
  3991. struct cm_timewait_info *timewait_info, *tmp;
  3992. spin_lock_irq(&cm.lock);
  3993. list_for_each_entry(timewait_info, &cm.timewait_list, list)
  3994. cancel_delayed_work(&timewait_info->work.work);
  3995. spin_unlock_irq(&cm.lock);
  3996. ib_unregister_client(&cm_client);
  3997. destroy_workqueue(cm.wq);
  3998. list_for_each_entry_safe(timewait_info, tmp, &cm.timewait_list, list) {
  3999. list_del(&timewait_info->list);
  4000. kfree(timewait_info);
  4001. }
  4002. class_unregister(&cm_class);
  4003. idr_destroy(&cm.local_id_table);
  4004. }
  /* Module entry and exit points. */
  module_init(ib_cm_init);
  module_exit(ib_cm_cleanup);