cm.c 109 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221322232233224322532263227322832293230323132323233323432353236323732383239324032413242324332443245324632473248324932503251325232533254325532563257325832593260326132623263326432653266326732683269327032713272327332743275327632773278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377737783779378037813782378337843785378637873788378937903791379237933794379537963797379837993800380138023803380438053806380738083809381038113812381338143815381638173818381938203821382238233824382538263827382838293830383138323833383438353836383738383839384038413842384338443845384638473848384938503851385238533854385538563857385838593860386138623863386438653866386738683869387038713872387338743875387638773878387938803881388238833884388538863887388838893890389138923893389438953896389738983899390039013902390339043905390639073908390939103911391239133914391539163917391839193920392139223923392439253926392739283929393039313932393339343935393639373938393939403941394239433944394539463947394839493950395139523953395439553956395739583959396039613962396339643965396639673968396939703971397239733974397539763977397839793980398139823983398439853986398739883989399039913992399339943995399639973998
  1. /*
  2. * Copyright (c) 2009-2014 Chelsio, Inc. All rights reserved.
  3. *
  4. * This software is available to you under a choice of one of two
  5. * licenses. You may choose to be licensed under the terms of the GNU
  6. * General Public License (GPL) Version 2, available from the file
  7. * COPYING in the main directory of this source tree, or the
  8. * OpenIB.org BSD license below:
  9. *
  10. * Redistribution and use in source and binary forms, with or
  11. * without modification, are permitted provided that the following
  12. * conditions are met:
  13. *
  14. * - Redistributions of source code must retain the above
  15. * copyright notice, this list of conditions and the following
  16. * disclaimer.
  17. *
  18. * - Redistributions in binary form must reproduce the above
  19. * copyright notice, this list of conditions and the following
  20. * disclaimer in the documentation and/or other materials
  21. * provided with the distribution.
  22. *
  23. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  24. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  25. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  26. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  27. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  28. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  29. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  30. * SOFTWARE.
  31. */
  32. #include <linux/module.h>
  33. #include <linux/list.h>
  34. #include <linux/workqueue.h>
  35. #include <linux/skbuff.h>
  36. #include <linux/timer.h>
  37. #include <linux/notifier.h>
  38. #include <linux/inetdevice.h>
  39. #include <linux/ip.h>
  40. #include <linux/tcp.h>
  41. #include <linux/if_vlan.h>
  42. #include <net/neighbour.h>
  43. #include <net/netevent.h>
  44. #include <net/route.h>
  45. #include <net/tcp.h>
  46. #include <net/ip6_route.h>
  47. #include <net/addrconf.h>
  48. #include <rdma/ib_addr.h>
  49. #include "iw_cxgb4.h"
  50. static char *states[] = {
  51. "idle",
  52. "listen",
  53. "connecting",
  54. "mpa_wait_req",
  55. "mpa_req_sent",
  56. "mpa_req_rcvd",
  57. "mpa_rep_sent",
  58. "fpdu_mode",
  59. "aborting",
  60. "closing",
  61. "moribund",
  62. "dead",
  63. NULL,
  64. };
  65. static int nocong;
  66. module_param(nocong, int, 0644);
  67. MODULE_PARM_DESC(nocong, "Turn of congestion control (default=0)");
  68. static int enable_ecn;
  69. module_param(enable_ecn, int, 0644);
  70. MODULE_PARM_DESC(enable_ecn, "Enable ECN (default=0/disabled)");
  71. static int dack_mode = 1;
  72. module_param(dack_mode, int, 0644);
  73. MODULE_PARM_DESC(dack_mode, "Delayed ack mode (default=1)");
  74. uint c4iw_max_read_depth = 32;
  75. module_param(c4iw_max_read_depth, int, 0644);
  76. MODULE_PARM_DESC(c4iw_max_read_depth,
  77. "Per-connection max ORD/IRD (default=32)");
  78. static int enable_tcp_timestamps;
  79. module_param(enable_tcp_timestamps, int, 0644);
  80. MODULE_PARM_DESC(enable_tcp_timestamps, "Enable tcp timestamps (default=0)");
  81. static int enable_tcp_sack;
  82. module_param(enable_tcp_sack, int, 0644);
  83. MODULE_PARM_DESC(enable_tcp_sack, "Enable tcp SACK (default=0)");
  84. static int enable_tcp_window_scaling = 1;
  85. module_param(enable_tcp_window_scaling, int, 0644);
  86. MODULE_PARM_DESC(enable_tcp_window_scaling,
  87. "Enable tcp window scaling (default=1)");
  88. int c4iw_debug;
  89. module_param(c4iw_debug, int, 0644);
  90. MODULE_PARM_DESC(c4iw_debug, "Enable debug logging (default=0)");
  91. static int peer2peer = 1;
  92. module_param(peer2peer, int, 0644);
  93. MODULE_PARM_DESC(peer2peer, "Support peer2peer ULPs (default=1)");
  94. static int p2p_type = FW_RI_INIT_P2PTYPE_READ_REQ;
  95. module_param(p2p_type, int, 0644);
  96. MODULE_PARM_DESC(p2p_type, "RDMAP opcode to use for the RTR message: "
  97. "1=RDMA_READ 0=RDMA_WRITE (default 1)");
  98. static int ep_timeout_secs = 60;
  99. module_param(ep_timeout_secs, int, 0644);
  100. MODULE_PARM_DESC(ep_timeout_secs, "CM Endpoint operation timeout "
  101. "in seconds (default=60)");
  102. static int mpa_rev = 1;
  103. module_param(mpa_rev, int, 0644);
  104. MODULE_PARM_DESC(mpa_rev, "MPA Revision, 0 supports amso1100, "
  105. "1 is RFC0544 spec compliant, 2 is IETF MPA Peer Connect Draft"
  106. " compliant (default=1)");
  107. static int markers_enabled;
  108. module_param(markers_enabled, int, 0644);
  109. MODULE_PARM_DESC(markers_enabled, "Enable MPA MARKERS (default(0)=disabled)");
  110. static int crc_enabled = 1;
  111. module_param(crc_enabled, int, 0644);
  112. MODULE_PARM_DESC(crc_enabled, "Enable MPA CRC (default(1)=enabled)");
  113. static int rcv_win = 256 * 1024;
  114. module_param(rcv_win, int, 0644);
  115. MODULE_PARM_DESC(rcv_win, "TCP receive window in bytes (default=256KB)");
  116. static int snd_win = 128 * 1024;
  117. module_param(snd_win, int, 0644);
  118. MODULE_PARM_DESC(snd_win, "TCP send window in bytes (default=128KB)");
  119. static struct workqueue_struct *workq;
  120. static struct sk_buff_head rxq;
  121. static struct sk_buff *get_skb(struct sk_buff *skb, int len, gfp_t gfp);
  122. static void ep_timeout(unsigned long arg);
  123. static void connect_reply_upcall(struct c4iw_ep *ep, int status);
  124. static LIST_HEAD(timeout_list);
  125. static spinlock_t timeout_lock;
  126. static void deref_qp(struct c4iw_ep *ep)
  127. {
  128. c4iw_qp_rem_ref(&ep->com.qp->ibqp);
  129. clear_bit(QP_REFERENCED, &ep->com.flags);
  130. }
  131. static void ref_qp(struct c4iw_ep *ep)
  132. {
  133. set_bit(QP_REFERENCED, &ep->com.flags);
  134. c4iw_qp_add_ref(&ep->com.qp->ibqp);
  135. }
  136. static void start_ep_timer(struct c4iw_ep *ep)
  137. {
  138. PDBG("%s ep %p\n", __func__, ep);
  139. if (timer_pending(&ep->timer)) {
  140. pr_err("%s timer already started! ep %p\n",
  141. __func__, ep);
  142. return;
  143. }
  144. clear_bit(TIMEOUT, &ep->com.flags);
  145. c4iw_get_ep(&ep->com);
  146. ep->timer.expires = jiffies + ep_timeout_secs * HZ;
  147. ep->timer.data = (unsigned long)ep;
  148. ep->timer.function = ep_timeout;
  149. add_timer(&ep->timer);
  150. }
  151. static int stop_ep_timer(struct c4iw_ep *ep)
  152. {
  153. PDBG("%s ep %p stopping\n", __func__, ep);
  154. del_timer_sync(&ep->timer);
  155. if (!test_and_set_bit(TIMEOUT, &ep->com.flags)) {
  156. c4iw_put_ep(&ep->com);
  157. return 0;
  158. }
  159. return 1;
  160. }
  161. static int c4iw_l2t_send(struct c4iw_rdev *rdev, struct sk_buff *skb,
  162. struct l2t_entry *l2e)
  163. {
  164. int error = 0;
  165. if (c4iw_fatal_error(rdev)) {
  166. kfree_skb(skb);
  167. PDBG("%s - device in error state - dropping\n", __func__);
  168. return -EIO;
  169. }
  170. error = cxgb4_l2t_send(rdev->lldi.ports[0], skb, l2e);
  171. if (error < 0)
  172. kfree_skb(skb);
  173. return error < 0 ? error : 0;
  174. }
  175. int c4iw_ofld_send(struct c4iw_rdev *rdev, struct sk_buff *skb)
  176. {
  177. int error = 0;
  178. if (c4iw_fatal_error(rdev)) {
  179. kfree_skb(skb);
  180. PDBG("%s - device in error state - dropping\n", __func__);
  181. return -EIO;
  182. }
  183. error = cxgb4_ofld_send(rdev->lldi.ports[0], skb);
  184. if (error < 0)
  185. kfree_skb(skb);
  186. return error < 0 ? error : 0;
  187. }
  188. static void release_tid(struct c4iw_rdev *rdev, u32 hwtid, struct sk_buff *skb)
  189. {
  190. struct cpl_tid_release *req;
  191. skb = get_skb(skb, sizeof *req, GFP_KERNEL);
  192. if (!skb)
  193. return;
  194. req = (struct cpl_tid_release *) skb_put(skb, sizeof(*req));
  195. INIT_TP_WR(req, hwtid);
  196. OPCODE_TID(req) = cpu_to_be32(MK_OPCODE_TID(CPL_TID_RELEASE, hwtid));
  197. set_wr_txq(skb, CPL_PRIORITY_SETUP, 0);
  198. c4iw_ofld_send(rdev, skb);
  199. return;
  200. }
  201. static void set_emss(struct c4iw_ep *ep, u16 opt)
  202. {
  203. ep->emss = ep->com.dev->rdev.lldi.mtus[GET_TCPOPT_MSS(opt)] -
  204. ((AF_INET == ep->com.remote_addr.ss_family) ?
  205. sizeof(struct iphdr) : sizeof(struct ipv6hdr)) -
  206. sizeof(struct tcphdr);
  207. ep->mss = ep->emss;
  208. if (GET_TCPOPT_TSTAMP(opt))
  209. ep->emss -= round_up(TCPOLEN_TIMESTAMP, 4);
  210. if (ep->emss < 128)
  211. ep->emss = 128;
  212. if (ep->emss & 7)
  213. PDBG("Warning: misaligned mtu idx %u mss %u emss=%u\n",
  214. GET_TCPOPT_MSS(opt), ep->mss, ep->emss);
  215. PDBG("%s mss_idx %u mss %u emss=%u\n", __func__, GET_TCPOPT_MSS(opt),
  216. ep->mss, ep->emss);
  217. }
  218. static enum c4iw_ep_state state_read(struct c4iw_ep_common *epc)
  219. {
  220. enum c4iw_ep_state state;
  221. mutex_lock(&epc->mutex);
  222. state = epc->state;
  223. mutex_unlock(&epc->mutex);
  224. return state;
  225. }
  226. static void __state_set(struct c4iw_ep_common *epc, enum c4iw_ep_state new)
  227. {
  228. epc->state = new;
  229. }
  230. static void state_set(struct c4iw_ep_common *epc, enum c4iw_ep_state new)
  231. {
  232. mutex_lock(&epc->mutex);
  233. PDBG("%s - %s -> %s\n", __func__, states[epc->state], states[new]);
  234. __state_set(epc, new);
  235. mutex_unlock(&epc->mutex);
  236. return;
  237. }
  238. static void *alloc_ep(int size, gfp_t gfp)
  239. {
  240. struct c4iw_ep_common *epc;
  241. epc = kzalloc(size, gfp);
  242. if (epc) {
  243. kref_init(&epc->kref);
  244. mutex_init(&epc->mutex);
  245. c4iw_init_wr_wait(&epc->wr_wait);
  246. }
  247. PDBG("%s alloc ep %p\n", __func__, epc);
  248. return epc;
  249. }
  250. void _c4iw_free_ep(struct kref *kref)
  251. {
  252. struct c4iw_ep *ep;
  253. ep = container_of(kref, struct c4iw_ep, com.kref);
  254. PDBG("%s ep %p state %s\n", __func__, ep, states[state_read(&ep->com)]);
  255. if (test_bit(QP_REFERENCED, &ep->com.flags))
  256. deref_qp(ep);
  257. if (test_bit(RELEASE_RESOURCES, &ep->com.flags)) {
  258. remove_handle(ep->com.dev, &ep->com.dev->hwtid_idr, ep->hwtid);
  259. cxgb4_remove_tid(ep->com.dev->rdev.lldi.tids, 0, ep->hwtid);
  260. dst_release(ep->dst);
  261. cxgb4_l2t_release(ep->l2t);
  262. }
  263. if (test_bit(RELEASE_MAPINFO, &ep->com.flags)) {
  264. print_addr(&ep->com, __func__, "remove_mapinfo/mapping");
  265. iwpm_remove_mapinfo(&ep->com.local_addr,
  266. &ep->com.mapped_local_addr);
  267. iwpm_remove_mapping(&ep->com.local_addr, RDMA_NL_C4IW);
  268. }
  269. kfree(ep);
  270. }
  271. static void release_ep_resources(struct c4iw_ep *ep)
  272. {
  273. set_bit(RELEASE_RESOURCES, &ep->com.flags);
  274. c4iw_put_ep(&ep->com);
  275. }
  276. static int status2errno(int status)
  277. {
  278. switch (status) {
  279. case CPL_ERR_NONE:
  280. return 0;
  281. case CPL_ERR_CONN_RESET:
  282. return -ECONNRESET;
  283. case CPL_ERR_ARP_MISS:
  284. return -EHOSTUNREACH;
  285. case CPL_ERR_CONN_TIMEDOUT:
  286. return -ETIMEDOUT;
  287. case CPL_ERR_TCAM_FULL:
  288. return -ENOMEM;
  289. case CPL_ERR_CONN_EXIST:
  290. return -EADDRINUSE;
  291. default:
  292. return -EIO;
  293. }
  294. }
  295. /*
  296. * Try and reuse skbs already allocated...
  297. */
  298. static struct sk_buff *get_skb(struct sk_buff *skb, int len, gfp_t gfp)
  299. {
  300. if (skb && !skb_is_nonlinear(skb) && !skb_cloned(skb)) {
  301. skb_trim(skb, 0);
  302. skb_get(skb);
  303. skb_reset_transport_header(skb);
  304. } else {
  305. skb = alloc_skb(len, gfp);
  306. }
  307. t4_set_arp_err_handler(skb, NULL, NULL);
  308. return skb;
  309. }
  310. static struct net_device *get_real_dev(struct net_device *egress_dev)
  311. {
  312. return rdma_vlan_dev_real_dev(egress_dev) ? : egress_dev;
  313. }
  314. static int our_interface(struct c4iw_dev *dev, struct net_device *egress_dev)
  315. {
  316. int i;
  317. egress_dev = get_real_dev(egress_dev);
  318. for (i = 0; i < dev->rdev.lldi.nports; i++)
  319. if (dev->rdev.lldi.ports[i] == egress_dev)
  320. return 1;
  321. return 0;
  322. }
  323. static struct dst_entry *find_route6(struct c4iw_dev *dev, __u8 *local_ip,
  324. __u8 *peer_ip, __be16 local_port,
  325. __be16 peer_port, u8 tos,
  326. __u32 sin6_scope_id)
  327. {
  328. struct dst_entry *dst = NULL;
  329. if (IS_ENABLED(CONFIG_IPV6)) {
  330. struct flowi6 fl6;
  331. memset(&fl6, 0, sizeof(fl6));
  332. memcpy(&fl6.daddr, peer_ip, 16);
  333. memcpy(&fl6.saddr, local_ip, 16);
  334. if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
  335. fl6.flowi6_oif = sin6_scope_id;
  336. dst = ip6_route_output(&init_net, NULL, &fl6);
  337. if (!dst)
  338. goto out;
  339. if (!our_interface(dev, ip6_dst_idev(dst)->dev) &&
  340. !(ip6_dst_idev(dst)->dev->flags & IFF_LOOPBACK)) {
  341. dst_release(dst);
  342. dst = NULL;
  343. }
  344. }
  345. out:
  346. return dst;
  347. }
  348. static struct dst_entry *find_route(struct c4iw_dev *dev, __be32 local_ip,
  349. __be32 peer_ip, __be16 local_port,
  350. __be16 peer_port, u8 tos)
  351. {
  352. struct rtable *rt;
  353. struct flowi4 fl4;
  354. struct neighbour *n;
  355. rt = ip_route_output_ports(&init_net, &fl4, NULL, peer_ip, local_ip,
  356. peer_port, local_port, IPPROTO_TCP,
  357. tos, 0);
  358. if (IS_ERR(rt))
  359. return NULL;
  360. n = dst_neigh_lookup(&rt->dst, &peer_ip);
  361. if (!n)
  362. return NULL;
  363. if (!our_interface(dev, n->dev) &&
  364. !(n->dev->flags & IFF_LOOPBACK)) {
  365. neigh_release(n);
  366. dst_release(&rt->dst);
  367. return NULL;
  368. }
  369. neigh_release(n);
  370. return &rt->dst;
  371. }
  372. static void arp_failure_discard(void *handle, struct sk_buff *skb)
  373. {
  374. PDBG("%s c4iw_dev %p\n", __func__, handle);
  375. kfree_skb(skb);
  376. }
  377. /*
  378. * Handle an ARP failure for an active open.
  379. */
  380. static void act_open_req_arp_failure(void *handle, struct sk_buff *skb)
  381. {
  382. struct c4iw_ep *ep = handle;
  383. printk(KERN_ERR MOD "ARP failure duing connect\n");
  384. kfree_skb(skb);
  385. connect_reply_upcall(ep, -EHOSTUNREACH);
  386. state_set(&ep->com, DEAD);
  387. remove_handle(ep->com.dev, &ep->com.dev->atid_idr, ep->atid);
  388. cxgb4_free_atid(ep->com.dev->rdev.lldi.tids, ep->atid);
  389. dst_release(ep->dst);
  390. cxgb4_l2t_release(ep->l2t);
  391. c4iw_put_ep(&ep->com);
  392. }
  393. /*
  394. * Handle an ARP failure for a CPL_ABORT_REQ. Change it into a no RST variant
  395. * and send it along.
  396. */
  397. static void abort_arp_failure(void *handle, struct sk_buff *skb)
  398. {
  399. struct c4iw_rdev *rdev = handle;
  400. struct cpl_abort_req *req = cplhdr(skb);
  401. PDBG("%s rdev %p\n", __func__, rdev);
  402. req->cmd = CPL_ABORT_NO_RST;
  403. c4iw_ofld_send(rdev, skb);
  404. }
  405. static void send_flowc(struct c4iw_ep *ep, struct sk_buff *skb)
  406. {
  407. unsigned int flowclen = 80;
  408. struct fw_flowc_wr *flowc;
  409. int i;
  410. skb = get_skb(skb, flowclen, GFP_KERNEL);
  411. flowc = (struct fw_flowc_wr *)__skb_put(skb, flowclen);
  412. flowc->op_to_nparams = cpu_to_be32(FW_WR_OP_V(FW_FLOWC_WR) |
  413. FW_FLOWC_WR_NPARAMS_V(8));
  414. flowc->flowid_len16 = cpu_to_be32(FW_WR_LEN16_V(DIV_ROUND_UP(flowclen,
  415. 16)) | FW_WR_FLOWID_V(ep->hwtid));
  416. flowc->mnemval[0].mnemonic = FW_FLOWC_MNEM_PFNVFN;
  417. flowc->mnemval[0].val = cpu_to_be32(FW_PFVF_CMD_PFN_V
  418. (ep->com.dev->rdev.lldi.pf));
  419. flowc->mnemval[1].mnemonic = FW_FLOWC_MNEM_CH;
  420. flowc->mnemval[1].val = cpu_to_be32(ep->tx_chan);
  421. flowc->mnemval[2].mnemonic = FW_FLOWC_MNEM_PORT;
  422. flowc->mnemval[2].val = cpu_to_be32(ep->tx_chan);
  423. flowc->mnemval[3].mnemonic = FW_FLOWC_MNEM_IQID;
  424. flowc->mnemval[3].val = cpu_to_be32(ep->rss_qid);
  425. flowc->mnemval[4].mnemonic = FW_FLOWC_MNEM_SNDNXT;
  426. flowc->mnemval[4].val = cpu_to_be32(ep->snd_seq);
  427. flowc->mnemval[5].mnemonic = FW_FLOWC_MNEM_RCVNXT;
  428. flowc->mnemval[5].val = cpu_to_be32(ep->rcv_seq);
  429. flowc->mnemval[6].mnemonic = FW_FLOWC_MNEM_SNDBUF;
  430. flowc->mnemval[6].val = cpu_to_be32(ep->snd_win);
  431. flowc->mnemval[7].mnemonic = FW_FLOWC_MNEM_MSS;
  432. flowc->mnemval[7].val = cpu_to_be32(ep->emss);
  433. /* Pad WR to 16 byte boundary */
  434. flowc->mnemval[8].mnemonic = 0;
  435. flowc->mnemval[8].val = 0;
  436. for (i = 0; i < 9; i++) {
  437. flowc->mnemval[i].r4[0] = 0;
  438. flowc->mnemval[i].r4[1] = 0;
  439. flowc->mnemval[i].r4[2] = 0;
  440. }
  441. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  442. c4iw_ofld_send(&ep->com.dev->rdev, skb);
  443. }
  444. static int send_halfclose(struct c4iw_ep *ep, gfp_t gfp)
  445. {
  446. struct cpl_close_con_req *req;
  447. struct sk_buff *skb;
  448. int wrlen = roundup(sizeof *req, 16);
  449. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  450. skb = get_skb(NULL, wrlen, gfp);
  451. if (!skb) {
  452. printk(KERN_ERR MOD "%s - failed to alloc skb\n", __func__);
  453. return -ENOMEM;
  454. }
  455. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  456. t4_set_arp_err_handler(skb, NULL, arp_failure_discard);
  457. req = (struct cpl_close_con_req *) skb_put(skb, wrlen);
  458. memset(req, 0, wrlen);
  459. INIT_TP_WR(req, ep->hwtid);
  460. OPCODE_TID(req) = cpu_to_be32(MK_OPCODE_TID(CPL_CLOSE_CON_REQ,
  461. ep->hwtid));
  462. return c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  463. }
  464. static int send_abort(struct c4iw_ep *ep, struct sk_buff *skb, gfp_t gfp)
  465. {
  466. struct cpl_abort_req *req;
  467. int wrlen = roundup(sizeof *req, 16);
  468. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  469. skb = get_skb(skb, wrlen, gfp);
  470. if (!skb) {
  471. printk(KERN_ERR MOD "%s - failed to alloc skb.\n",
  472. __func__);
  473. return -ENOMEM;
  474. }
  475. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  476. t4_set_arp_err_handler(skb, &ep->com.dev->rdev, abort_arp_failure);
  477. req = (struct cpl_abort_req *) skb_put(skb, wrlen);
  478. memset(req, 0, wrlen);
  479. INIT_TP_WR(req, ep->hwtid);
  480. OPCODE_TID(req) = cpu_to_be32(MK_OPCODE_TID(CPL_ABORT_REQ, ep->hwtid));
  481. req->cmd = CPL_ABORT_SEND_RST;
  482. return c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  483. }
  484. /*
  485. * c4iw_form_pm_msg - Form a port mapper message with mapping info
  486. */
  487. static void c4iw_form_pm_msg(struct c4iw_ep *ep,
  488. struct iwpm_sa_data *pm_msg)
  489. {
  490. memcpy(&pm_msg->loc_addr, &ep->com.local_addr,
  491. sizeof(ep->com.local_addr));
  492. memcpy(&pm_msg->rem_addr, &ep->com.remote_addr,
  493. sizeof(ep->com.remote_addr));
  494. }
  495. /*
  496. * c4iw_form_reg_msg - Form a port mapper message with dev info
  497. */
  498. static void c4iw_form_reg_msg(struct c4iw_dev *dev,
  499. struct iwpm_dev_data *pm_msg)
  500. {
  501. memcpy(pm_msg->dev_name, dev->ibdev.name, IWPM_DEVNAME_SIZE);
  502. memcpy(pm_msg->if_name, dev->rdev.lldi.ports[0]->name,
  503. IWPM_IFNAME_SIZE);
  504. }
  505. static void c4iw_record_pm_msg(struct c4iw_ep *ep,
  506. struct iwpm_sa_data *pm_msg)
  507. {
  508. memcpy(&ep->com.mapped_local_addr, &pm_msg->mapped_loc_addr,
  509. sizeof(ep->com.mapped_local_addr));
  510. memcpy(&ep->com.mapped_remote_addr, &pm_msg->mapped_rem_addr,
  511. sizeof(ep->com.mapped_remote_addr));
  512. }
  513. static void best_mtu(const unsigned short *mtus, unsigned short mtu,
  514. unsigned int *idx, int use_ts, int ipv6)
  515. {
  516. unsigned short hdr_size = (ipv6 ?
  517. sizeof(struct ipv6hdr) :
  518. sizeof(struct iphdr)) +
  519. sizeof(struct tcphdr) +
  520. (use_ts ?
  521. round_up(TCPOLEN_TIMESTAMP, 4) : 0);
  522. unsigned short data_size = mtu - hdr_size;
  523. cxgb4_best_aligned_mtu(mtus, hdr_size, data_size, 8, idx);
  524. }
  525. static int send_connect(struct c4iw_ep *ep)
  526. {
  527. struct cpl_act_open_req *req;
  528. struct cpl_t5_act_open_req *t5_req;
  529. struct cpl_act_open_req6 *req6;
  530. struct cpl_t5_act_open_req6 *t5_req6;
  531. struct sk_buff *skb;
  532. u64 opt0;
  533. u32 opt2;
  534. unsigned int mtu_idx;
  535. int wscale;
  536. int wrlen;
  537. int sizev4 = is_t4(ep->com.dev->rdev.lldi.adapter_type) ?
  538. sizeof(struct cpl_act_open_req) :
  539. sizeof(struct cpl_t5_act_open_req);
  540. int sizev6 = is_t4(ep->com.dev->rdev.lldi.adapter_type) ?
  541. sizeof(struct cpl_act_open_req6) :
  542. sizeof(struct cpl_t5_act_open_req6);
  543. struct sockaddr_in *la = (struct sockaddr_in *)
  544. &ep->com.mapped_local_addr;
  545. struct sockaddr_in *ra = (struct sockaddr_in *)
  546. &ep->com.mapped_remote_addr;
  547. struct sockaddr_in6 *la6 = (struct sockaddr_in6 *)
  548. &ep->com.mapped_local_addr;
  549. struct sockaddr_in6 *ra6 = (struct sockaddr_in6 *)
  550. &ep->com.mapped_remote_addr;
  551. int win;
  552. wrlen = (ep->com.remote_addr.ss_family == AF_INET) ?
  553. roundup(sizev4, 16) :
  554. roundup(sizev6, 16);
  555. PDBG("%s ep %p atid %u\n", __func__, ep, ep->atid);
  556. skb = get_skb(NULL, wrlen, GFP_KERNEL);
  557. if (!skb) {
  558. printk(KERN_ERR MOD "%s - failed to alloc skb.\n",
  559. __func__);
  560. return -ENOMEM;
  561. }
  562. set_wr_txq(skb, CPL_PRIORITY_SETUP, ep->ctrlq_idx);
  563. best_mtu(ep->com.dev->rdev.lldi.mtus, ep->mtu, &mtu_idx,
  564. enable_tcp_timestamps,
  565. (AF_INET == ep->com.remote_addr.ss_family) ? 0 : 1);
  566. wscale = compute_wscale(rcv_win);
  567. /*
  568. * Specify the largest window that will fit in opt0. The
  569. * remainder will be specified in the rx_data_ack.
  570. */
  571. win = ep->rcv_win >> 10;
  572. if (win > RCV_BUFSIZ_M)
  573. win = RCV_BUFSIZ_M;
  574. opt0 = (nocong ? NO_CONG(1) : 0) |
  575. KEEP_ALIVE_F |
  576. DELACK(1) |
  577. WND_SCALE_V(wscale) |
  578. MSS_IDX_V(mtu_idx) |
  579. L2T_IDX_V(ep->l2t->idx) |
  580. TX_CHAN_V(ep->tx_chan) |
  581. SMAC_SEL_V(ep->smac_idx) |
  582. DSCP(ep->tos) |
  583. ULP_MODE_V(ULP_MODE_TCPDDP) |
  584. RCV_BUFSIZ_V(win);
  585. opt2 = RX_CHANNEL_V(0) |
  586. CCTRL_ECN(enable_ecn) |
  587. RSS_QUEUE_VALID_F | RSS_QUEUE_V(ep->rss_qid);
  588. if (enable_tcp_timestamps)
  589. opt2 |= TSTAMPS_EN(1);
  590. if (enable_tcp_sack)
  591. opt2 |= SACK_EN(1);
  592. if (wscale && enable_tcp_window_scaling)
  593. opt2 |= WND_SCALE_EN_F;
  594. if (is_t5(ep->com.dev->rdev.lldi.adapter_type)) {
  595. opt2 |= T5_OPT_2_VALID_F;
  596. opt2 |= V_CONG_CNTRL(CONG_ALG_TAHOE);
  597. opt2 |= CONG_CNTRL_VALID; /* OPT_2_ISS for T5 */
  598. }
  599. t4_set_arp_err_handler(skb, ep, act_open_req_arp_failure);
  600. if (is_t4(ep->com.dev->rdev.lldi.adapter_type)) {
  601. if (ep->com.remote_addr.ss_family == AF_INET) {
  602. req = (struct cpl_act_open_req *) skb_put(skb, wrlen);
  603. INIT_TP_WR(req, 0);
  604. OPCODE_TID(req) = cpu_to_be32(
  605. MK_OPCODE_TID(CPL_ACT_OPEN_REQ,
  606. ((ep->rss_qid << 14) | ep->atid)));
  607. req->local_port = la->sin_port;
  608. req->peer_port = ra->sin_port;
  609. req->local_ip = la->sin_addr.s_addr;
  610. req->peer_ip = ra->sin_addr.s_addr;
  611. req->opt0 = cpu_to_be64(opt0);
  612. req->params = cpu_to_be32(cxgb4_select_ntuple(
  613. ep->com.dev->rdev.lldi.ports[0],
  614. ep->l2t));
  615. req->opt2 = cpu_to_be32(opt2);
  616. } else {
  617. req6 = (struct cpl_act_open_req6 *)skb_put(skb, wrlen);
  618. INIT_TP_WR(req6, 0);
  619. OPCODE_TID(req6) = cpu_to_be32(
  620. MK_OPCODE_TID(CPL_ACT_OPEN_REQ6,
  621. ((ep->rss_qid<<14)|ep->atid)));
  622. req6->local_port = la6->sin6_port;
  623. req6->peer_port = ra6->sin6_port;
  624. req6->local_ip_hi = *((__be64 *)
  625. (la6->sin6_addr.s6_addr));
  626. req6->local_ip_lo = *((__be64 *)
  627. (la6->sin6_addr.s6_addr + 8));
  628. req6->peer_ip_hi = *((__be64 *)
  629. (ra6->sin6_addr.s6_addr));
  630. req6->peer_ip_lo = *((__be64 *)
  631. (ra6->sin6_addr.s6_addr + 8));
  632. req6->opt0 = cpu_to_be64(opt0);
  633. req6->params = cpu_to_be32(cxgb4_select_ntuple(
  634. ep->com.dev->rdev.lldi.ports[0],
  635. ep->l2t));
  636. req6->opt2 = cpu_to_be32(opt2);
  637. }
  638. } else {
  639. u32 isn = (prandom_u32() & ~7UL) - 1;
  640. if (peer2peer)
  641. isn += 4;
  642. if (ep->com.remote_addr.ss_family == AF_INET) {
  643. t5_req = (struct cpl_t5_act_open_req *)
  644. skb_put(skb, wrlen);
  645. INIT_TP_WR(t5_req, 0);
  646. OPCODE_TID(t5_req) = cpu_to_be32(
  647. MK_OPCODE_TID(CPL_ACT_OPEN_REQ,
  648. ((ep->rss_qid << 14) | ep->atid)));
  649. t5_req->local_port = la->sin_port;
  650. t5_req->peer_port = ra->sin_port;
  651. t5_req->local_ip = la->sin_addr.s_addr;
  652. t5_req->peer_ip = ra->sin_addr.s_addr;
  653. t5_req->opt0 = cpu_to_be64(opt0);
  654. t5_req->params = cpu_to_be64(FILTER_TUPLE_V(
  655. cxgb4_select_ntuple(
  656. ep->com.dev->rdev.lldi.ports[0],
  657. ep->l2t)));
  658. t5_req->rsvd = cpu_to_be32(isn);
  659. PDBG("%s snd_isn %u\n", __func__,
  660. be32_to_cpu(t5_req->rsvd));
  661. t5_req->opt2 = cpu_to_be32(opt2);
  662. } else {
  663. t5_req6 = (struct cpl_t5_act_open_req6 *)
  664. skb_put(skb, wrlen);
  665. INIT_TP_WR(t5_req6, 0);
  666. OPCODE_TID(t5_req6) = cpu_to_be32(
  667. MK_OPCODE_TID(CPL_ACT_OPEN_REQ6,
  668. ((ep->rss_qid<<14)|ep->atid)));
  669. t5_req6->local_port = la6->sin6_port;
  670. t5_req6->peer_port = ra6->sin6_port;
  671. t5_req6->local_ip_hi = *((__be64 *)
  672. (la6->sin6_addr.s6_addr));
  673. t5_req6->local_ip_lo = *((__be64 *)
  674. (la6->sin6_addr.s6_addr + 8));
  675. t5_req6->peer_ip_hi = *((__be64 *)
  676. (ra6->sin6_addr.s6_addr));
  677. t5_req6->peer_ip_lo = *((__be64 *)
  678. (ra6->sin6_addr.s6_addr + 8));
  679. t5_req6->opt0 = cpu_to_be64(opt0);
  680. t5_req6->params = cpu_to_be64(FILTER_TUPLE_V(
  681. cxgb4_select_ntuple(
  682. ep->com.dev->rdev.lldi.ports[0],
  683. ep->l2t)));
  684. t5_req6->rsvd = cpu_to_be32(isn);
  685. PDBG("%s snd_isn %u\n", __func__,
  686. be32_to_cpu(t5_req6->rsvd));
  687. t5_req6->opt2 = cpu_to_be32(opt2);
  688. }
  689. }
  690. set_bit(ACT_OPEN_REQ, &ep->com.history);
  691. return c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  692. }
  693. static void send_mpa_req(struct c4iw_ep *ep, struct sk_buff *skb,
  694. u8 mpa_rev_to_use)
  695. {
  696. int mpalen, wrlen;
  697. struct fw_ofld_tx_data_wr *req;
  698. struct mpa_message *mpa;
  699. struct mpa_v2_conn_params mpa_v2_params;
  700. PDBG("%s ep %p tid %u pd_len %d\n", __func__, ep, ep->hwtid, ep->plen);
  701. BUG_ON(skb_cloned(skb));
  702. mpalen = sizeof(*mpa) + ep->plen;
  703. if (mpa_rev_to_use == 2)
  704. mpalen += sizeof(struct mpa_v2_conn_params);
  705. wrlen = roundup(mpalen + sizeof *req, 16);
  706. skb = get_skb(skb, wrlen, GFP_KERNEL);
  707. if (!skb) {
  708. connect_reply_upcall(ep, -ENOMEM);
  709. return;
  710. }
  711. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  712. req = (struct fw_ofld_tx_data_wr *)skb_put(skb, wrlen);
  713. memset(req, 0, wrlen);
  714. req->op_to_immdlen = cpu_to_be32(
  715. FW_WR_OP_V(FW_OFLD_TX_DATA_WR) |
  716. FW_WR_COMPL_F |
  717. FW_WR_IMMDLEN_V(mpalen));
  718. req->flowid_len16 = cpu_to_be32(
  719. FW_WR_FLOWID_V(ep->hwtid) |
  720. FW_WR_LEN16_V(wrlen >> 4));
  721. req->plen = cpu_to_be32(mpalen);
  722. req->tunnel_to_proxy = cpu_to_be32(
  723. FW_OFLD_TX_DATA_WR_FLUSH_F |
  724. FW_OFLD_TX_DATA_WR_SHOVE_F);
  725. mpa = (struct mpa_message *)(req + 1);
  726. memcpy(mpa->key, MPA_KEY_REQ, sizeof(mpa->key));
  727. mpa->flags = (crc_enabled ? MPA_CRC : 0) |
  728. (markers_enabled ? MPA_MARKERS : 0) |
  729. (mpa_rev_to_use == 2 ? MPA_ENHANCED_RDMA_CONN : 0);
  730. mpa->private_data_size = htons(ep->plen);
  731. mpa->revision = mpa_rev_to_use;
  732. if (mpa_rev_to_use == 1) {
  733. ep->tried_with_mpa_v1 = 1;
  734. ep->retry_with_mpa_v1 = 0;
  735. }
  736. if (mpa_rev_to_use == 2) {
  737. mpa->private_data_size = htons(ntohs(mpa->private_data_size) +
  738. sizeof (struct mpa_v2_conn_params));
  739. PDBG("%s initiator ird %u ord %u\n", __func__, ep->ird,
  740. ep->ord);
  741. mpa_v2_params.ird = htons((u16)ep->ird);
  742. mpa_v2_params.ord = htons((u16)ep->ord);
  743. if (peer2peer) {
  744. mpa_v2_params.ird |= htons(MPA_V2_PEER2PEER_MODEL);
  745. if (p2p_type == FW_RI_INIT_P2PTYPE_RDMA_WRITE)
  746. mpa_v2_params.ord |=
  747. htons(MPA_V2_RDMA_WRITE_RTR);
  748. else if (p2p_type == FW_RI_INIT_P2PTYPE_READ_REQ)
  749. mpa_v2_params.ord |=
  750. htons(MPA_V2_RDMA_READ_RTR);
  751. }
  752. memcpy(mpa->private_data, &mpa_v2_params,
  753. sizeof(struct mpa_v2_conn_params));
  754. if (ep->plen)
  755. memcpy(mpa->private_data +
  756. sizeof(struct mpa_v2_conn_params),
  757. ep->mpa_pkt + sizeof(*mpa), ep->plen);
  758. } else
  759. if (ep->plen)
  760. memcpy(mpa->private_data,
  761. ep->mpa_pkt + sizeof(*mpa), ep->plen);
  762. /*
  763. * Reference the mpa skb. This ensures the data area
  764. * will remain in memory until the hw acks the tx.
  765. * Function fw4_ack() will deref it.
  766. */
  767. skb_get(skb);
  768. t4_set_arp_err_handler(skb, NULL, arp_failure_discard);
  769. BUG_ON(ep->mpa_skb);
  770. ep->mpa_skb = skb;
  771. c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  772. start_ep_timer(ep);
  773. __state_set(&ep->com, MPA_REQ_SENT);
  774. ep->mpa_attr.initiator = 1;
  775. ep->snd_seq += mpalen;
  776. return;
  777. }
  778. static int send_mpa_reject(struct c4iw_ep *ep, const void *pdata, u8 plen)
  779. {
  780. int mpalen, wrlen;
  781. struct fw_ofld_tx_data_wr *req;
  782. struct mpa_message *mpa;
  783. struct sk_buff *skb;
  784. struct mpa_v2_conn_params mpa_v2_params;
  785. PDBG("%s ep %p tid %u pd_len %d\n", __func__, ep, ep->hwtid, ep->plen);
  786. mpalen = sizeof(*mpa) + plen;
  787. if (ep->mpa_attr.version == 2 && ep->mpa_attr.enhanced_rdma_conn)
  788. mpalen += sizeof(struct mpa_v2_conn_params);
  789. wrlen = roundup(mpalen + sizeof *req, 16);
  790. skb = get_skb(NULL, wrlen, GFP_KERNEL);
  791. if (!skb) {
  792. printk(KERN_ERR MOD "%s - cannot alloc skb!\n", __func__);
  793. return -ENOMEM;
  794. }
  795. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  796. req = (struct fw_ofld_tx_data_wr *)skb_put(skb, wrlen);
  797. memset(req, 0, wrlen);
  798. req->op_to_immdlen = cpu_to_be32(
  799. FW_WR_OP_V(FW_OFLD_TX_DATA_WR) |
  800. FW_WR_COMPL_F |
  801. FW_WR_IMMDLEN_V(mpalen));
  802. req->flowid_len16 = cpu_to_be32(
  803. FW_WR_FLOWID_V(ep->hwtid) |
  804. FW_WR_LEN16_V(wrlen >> 4));
  805. req->plen = cpu_to_be32(mpalen);
  806. req->tunnel_to_proxy = cpu_to_be32(
  807. FW_OFLD_TX_DATA_WR_FLUSH_F |
  808. FW_OFLD_TX_DATA_WR_SHOVE_F);
  809. mpa = (struct mpa_message *)(req + 1);
  810. memset(mpa, 0, sizeof(*mpa));
  811. memcpy(mpa->key, MPA_KEY_REP, sizeof(mpa->key));
  812. mpa->flags = MPA_REJECT;
  813. mpa->revision = ep->mpa_attr.version;
  814. mpa->private_data_size = htons(plen);
  815. if (ep->mpa_attr.version == 2 && ep->mpa_attr.enhanced_rdma_conn) {
  816. mpa->flags |= MPA_ENHANCED_RDMA_CONN;
  817. mpa->private_data_size = htons(ntohs(mpa->private_data_size) +
  818. sizeof (struct mpa_v2_conn_params));
  819. mpa_v2_params.ird = htons(((u16)ep->ird) |
  820. (peer2peer ? MPA_V2_PEER2PEER_MODEL :
  821. 0));
  822. mpa_v2_params.ord = htons(((u16)ep->ord) | (peer2peer ?
  823. (p2p_type ==
  824. FW_RI_INIT_P2PTYPE_RDMA_WRITE ?
  825. MPA_V2_RDMA_WRITE_RTR : p2p_type ==
  826. FW_RI_INIT_P2PTYPE_READ_REQ ?
  827. MPA_V2_RDMA_READ_RTR : 0) : 0));
  828. memcpy(mpa->private_data, &mpa_v2_params,
  829. sizeof(struct mpa_v2_conn_params));
  830. if (ep->plen)
  831. memcpy(mpa->private_data +
  832. sizeof(struct mpa_v2_conn_params), pdata, plen);
  833. } else
  834. if (plen)
  835. memcpy(mpa->private_data, pdata, plen);
  836. /*
  837. * Reference the mpa skb again. This ensures the data area
  838. * will remain in memory until the hw acks the tx.
  839. * Function fw4_ack() will deref it.
  840. */
  841. skb_get(skb);
  842. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  843. t4_set_arp_err_handler(skb, NULL, arp_failure_discard);
  844. BUG_ON(ep->mpa_skb);
  845. ep->mpa_skb = skb;
  846. ep->snd_seq += mpalen;
  847. return c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  848. }
  849. static int send_mpa_reply(struct c4iw_ep *ep, const void *pdata, u8 plen)
  850. {
  851. int mpalen, wrlen;
  852. struct fw_ofld_tx_data_wr *req;
  853. struct mpa_message *mpa;
  854. struct sk_buff *skb;
  855. struct mpa_v2_conn_params mpa_v2_params;
  856. PDBG("%s ep %p tid %u pd_len %d\n", __func__, ep, ep->hwtid, ep->plen);
  857. mpalen = sizeof(*mpa) + plen;
  858. if (ep->mpa_attr.version == 2 && ep->mpa_attr.enhanced_rdma_conn)
  859. mpalen += sizeof(struct mpa_v2_conn_params);
  860. wrlen = roundup(mpalen + sizeof *req, 16);
  861. skb = get_skb(NULL, wrlen, GFP_KERNEL);
  862. if (!skb) {
  863. printk(KERN_ERR MOD "%s - cannot alloc skb!\n", __func__);
  864. return -ENOMEM;
  865. }
  866. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  867. req = (struct fw_ofld_tx_data_wr *) skb_put(skb, wrlen);
  868. memset(req, 0, wrlen);
  869. req->op_to_immdlen = cpu_to_be32(
  870. FW_WR_OP_V(FW_OFLD_TX_DATA_WR) |
  871. FW_WR_COMPL_F |
  872. FW_WR_IMMDLEN_V(mpalen));
  873. req->flowid_len16 = cpu_to_be32(
  874. FW_WR_FLOWID_V(ep->hwtid) |
  875. FW_WR_LEN16_V(wrlen >> 4));
  876. req->plen = cpu_to_be32(mpalen);
  877. req->tunnel_to_proxy = cpu_to_be32(
  878. FW_OFLD_TX_DATA_WR_FLUSH_F |
  879. FW_OFLD_TX_DATA_WR_SHOVE_F);
  880. mpa = (struct mpa_message *)(req + 1);
  881. memset(mpa, 0, sizeof(*mpa));
  882. memcpy(mpa->key, MPA_KEY_REP, sizeof(mpa->key));
  883. mpa->flags = (ep->mpa_attr.crc_enabled ? MPA_CRC : 0) |
  884. (markers_enabled ? MPA_MARKERS : 0);
  885. mpa->revision = ep->mpa_attr.version;
  886. mpa->private_data_size = htons(plen);
  887. if (ep->mpa_attr.version == 2 && ep->mpa_attr.enhanced_rdma_conn) {
  888. mpa->flags |= MPA_ENHANCED_RDMA_CONN;
  889. mpa->private_data_size = htons(ntohs(mpa->private_data_size) +
  890. sizeof (struct mpa_v2_conn_params));
  891. mpa_v2_params.ird = htons((u16)ep->ird);
  892. mpa_v2_params.ord = htons((u16)ep->ord);
  893. if (peer2peer && (ep->mpa_attr.p2p_type !=
  894. FW_RI_INIT_P2PTYPE_DISABLED)) {
  895. mpa_v2_params.ird |= htons(MPA_V2_PEER2PEER_MODEL);
  896. if (p2p_type == FW_RI_INIT_P2PTYPE_RDMA_WRITE)
  897. mpa_v2_params.ord |=
  898. htons(MPA_V2_RDMA_WRITE_RTR);
  899. else if (p2p_type == FW_RI_INIT_P2PTYPE_READ_REQ)
  900. mpa_v2_params.ord |=
  901. htons(MPA_V2_RDMA_READ_RTR);
  902. }
  903. memcpy(mpa->private_data, &mpa_v2_params,
  904. sizeof(struct mpa_v2_conn_params));
  905. if (ep->plen)
  906. memcpy(mpa->private_data +
  907. sizeof(struct mpa_v2_conn_params), pdata, plen);
  908. } else
  909. if (plen)
  910. memcpy(mpa->private_data, pdata, plen);
  911. /*
  912. * Reference the mpa skb. This ensures the data area
  913. * will remain in memory until the hw acks the tx.
  914. * Function fw4_ack() will deref it.
  915. */
  916. skb_get(skb);
  917. t4_set_arp_err_handler(skb, NULL, arp_failure_discard);
  918. ep->mpa_skb = skb;
  919. __state_set(&ep->com, MPA_REP_SENT);
  920. ep->snd_seq += mpalen;
  921. return c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  922. }
  923. static int act_establish(struct c4iw_dev *dev, struct sk_buff *skb)
  924. {
  925. struct c4iw_ep *ep;
  926. struct cpl_act_establish *req = cplhdr(skb);
  927. unsigned int tid = GET_TID(req);
  928. unsigned int atid = GET_TID_TID(ntohl(req->tos_atid));
  929. struct tid_info *t = dev->rdev.lldi.tids;
  930. ep = lookup_atid(t, atid);
  931. PDBG("%s ep %p tid %u snd_isn %u rcv_isn %u\n", __func__, ep, tid,
  932. be32_to_cpu(req->snd_isn), be32_to_cpu(req->rcv_isn));
  933. mutex_lock(&ep->com.mutex);
  934. dst_confirm(ep->dst);
  935. /* setup the hwtid for this connection */
  936. ep->hwtid = tid;
  937. cxgb4_insert_tid(t, ep, tid);
  938. insert_handle(dev, &dev->hwtid_idr, ep, ep->hwtid);
  939. ep->snd_seq = be32_to_cpu(req->snd_isn);
  940. ep->rcv_seq = be32_to_cpu(req->rcv_isn);
  941. set_emss(ep, ntohs(req->tcp_opt));
  942. /* dealloc the atid */
  943. remove_handle(ep->com.dev, &ep->com.dev->atid_idr, atid);
  944. cxgb4_free_atid(t, atid);
  945. set_bit(ACT_ESTAB, &ep->com.history);
  946. /* start MPA negotiation */
  947. send_flowc(ep, NULL);
  948. if (ep->retry_with_mpa_v1)
  949. send_mpa_req(ep, skb, 1);
  950. else
  951. send_mpa_req(ep, skb, mpa_rev);
  952. mutex_unlock(&ep->com.mutex);
  953. return 0;
  954. }
  955. static void close_complete_upcall(struct c4iw_ep *ep, int status)
  956. {
  957. struct iw_cm_event event;
  958. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  959. memset(&event, 0, sizeof(event));
  960. event.event = IW_CM_EVENT_CLOSE;
  961. event.status = status;
  962. if (ep->com.cm_id) {
  963. PDBG("close complete delivered ep %p cm_id %p tid %u\n",
  964. ep, ep->com.cm_id, ep->hwtid);
  965. ep->com.cm_id->event_handler(ep->com.cm_id, &event);
  966. ep->com.cm_id->rem_ref(ep->com.cm_id);
  967. ep->com.cm_id = NULL;
  968. set_bit(CLOSE_UPCALL, &ep->com.history);
  969. }
  970. }
  971. static int abort_connection(struct c4iw_ep *ep, struct sk_buff *skb, gfp_t gfp)
  972. {
  973. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  974. __state_set(&ep->com, ABORTING);
  975. set_bit(ABORT_CONN, &ep->com.history);
  976. return send_abort(ep, skb, gfp);
  977. }
  978. static void peer_close_upcall(struct c4iw_ep *ep)
  979. {
  980. struct iw_cm_event event;
  981. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  982. memset(&event, 0, sizeof(event));
  983. event.event = IW_CM_EVENT_DISCONNECT;
  984. if (ep->com.cm_id) {
  985. PDBG("peer close delivered ep %p cm_id %p tid %u\n",
  986. ep, ep->com.cm_id, ep->hwtid);
  987. ep->com.cm_id->event_handler(ep->com.cm_id, &event);
  988. set_bit(DISCONN_UPCALL, &ep->com.history);
  989. }
  990. }
  991. static void peer_abort_upcall(struct c4iw_ep *ep)
  992. {
  993. struct iw_cm_event event;
  994. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  995. memset(&event, 0, sizeof(event));
  996. event.event = IW_CM_EVENT_CLOSE;
  997. event.status = -ECONNRESET;
  998. if (ep->com.cm_id) {
  999. PDBG("abort delivered ep %p cm_id %p tid %u\n", ep,
  1000. ep->com.cm_id, ep->hwtid);
  1001. ep->com.cm_id->event_handler(ep->com.cm_id, &event);
  1002. ep->com.cm_id->rem_ref(ep->com.cm_id);
  1003. ep->com.cm_id = NULL;
  1004. set_bit(ABORT_UPCALL, &ep->com.history);
  1005. }
  1006. }
  1007. static void connect_reply_upcall(struct c4iw_ep *ep, int status)
  1008. {
  1009. struct iw_cm_event event;
  1010. PDBG("%s ep %p tid %u status %d\n", __func__, ep, ep->hwtid, status);
  1011. memset(&event, 0, sizeof(event));
  1012. event.event = IW_CM_EVENT_CONNECT_REPLY;
  1013. event.status = status;
  1014. memcpy(&event.local_addr, &ep->com.local_addr,
  1015. sizeof(ep->com.local_addr));
  1016. memcpy(&event.remote_addr, &ep->com.remote_addr,
  1017. sizeof(ep->com.remote_addr));
  1018. if ((status == 0) || (status == -ECONNREFUSED)) {
  1019. if (!ep->tried_with_mpa_v1) {
  1020. /* this means MPA_v2 is used */
  1021. event.private_data_len = ep->plen -
  1022. sizeof(struct mpa_v2_conn_params);
  1023. event.private_data = ep->mpa_pkt +
  1024. sizeof(struct mpa_message) +
  1025. sizeof(struct mpa_v2_conn_params);
  1026. } else {
  1027. /* this means MPA_v1 is used */
  1028. event.private_data_len = ep->plen;
  1029. event.private_data = ep->mpa_pkt +
  1030. sizeof(struct mpa_message);
  1031. }
  1032. }
  1033. PDBG("%s ep %p tid %u status %d\n", __func__, ep,
  1034. ep->hwtid, status);
  1035. set_bit(CONN_RPL_UPCALL, &ep->com.history);
  1036. ep->com.cm_id->event_handler(ep->com.cm_id, &event);
  1037. if (status < 0) {
  1038. ep->com.cm_id->rem_ref(ep->com.cm_id);
  1039. ep->com.cm_id = NULL;
  1040. }
  1041. }
  1042. static int connect_request_upcall(struct c4iw_ep *ep)
  1043. {
  1044. struct iw_cm_event event;
  1045. int ret;
  1046. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1047. memset(&event, 0, sizeof(event));
  1048. event.event = IW_CM_EVENT_CONNECT_REQUEST;
  1049. memcpy(&event.local_addr, &ep->com.local_addr,
  1050. sizeof(ep->com.local_addr));
  1051. memcpy(&event.remote_addr, &ep->com.remote_addr,
  1052. sizeof(ep->com.remote_addr));
  1053. event.provider_data = ep;
  1054. if (!ep->tried_with_mpa_v1) {
  1055. /* this means MPA_v2 is used */
  1056. event.ord = ep->ord;
  1057. event.ird = ep->ird;
  1058. event.private_data_len = ep->plen -
  1059. sizeof(struct mpa_v2_conn_params);
  1060. event.private_data = ep->mpa_pkt + sizeof(struct mpa_message) +
  1061. sizeof(struct mpa_v2_conn_params);
  1062. } else {
  1063. /* this means MPA_v1 is used. Send max supported */
  1064. event.ord = cur_max_read_depth(ep->com.dev);
  1065. event.ird = cur_max_read_depth(ep->com.dev);
  1066. event.private_data_len = ep->plen;
  1067. event.private_data = ep->mpa_pkt + sizeof(struct mpa_message);
  1068. }
  1069. c4iw_get_ep(&ep->com);
  1070. ret = ep->parent_ep->com.cm_id->event_handler(ep->parent_ep->com.cm_id,
  1071. &event);
  1072. if (ret)
  1073. c4iw_put_ep(&ep->com);
  1074. set_bit(CONNREQ_UPCALL, &ep->com.history);
  1075. c4iw_put_ep(&ep->parent_ep->com);
  1076. return ret;
  1077. }
  1078. static void established_upcall(struct c4iw_ep *ep)
  1079. {
  1080. struct iw_cm_event event;
  1081. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1082. memset(&event, 0, sizeof(event));
  1083. event.event = IW_CM_EVENT_ESTABLISHED;
  1084. event.ird = ep->ird;
  1085. event.ord = ep->ord;
  1086. if (ep->com.cm_id) {
  1087. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1088. ep->com.cm_id->event_handler(ep->com.cm_id, &event);
  1089. set_bit(ESTAB_UPCALL, &ep->com.history);
  1090. }
  1091. }
  1092. static int update_rx_credits(struct c4iw_ep *ep, u32 credits)
  1093. {
  1094. struct cpl_rx_data_ack *req;
  1095. struct sk_buff *skb;
  1096. int wrlen = roundup(sizeof *req, 16);
  1097. PDBG("%s ep %p tid %u credits %u\n", __func__, ep, ep->hwtid, credits);
  1098. skb = get_skb(NULL, wrlen, GFP_KERNEL);
  1099. if (!skb) {
  1100. printk(KERN_ERR MOD "update_rx_credits - cannot alloc skb!\n");
  1101. return 0;
  1102. }
  1103. /*
  1104. * If we couldn't specify the entire rcv window at connection setup
  1105. * due to the limit in the number of bits in the RCV_BUFSIZ field,
  1106. * then add the overage in to the credits returned.
  1107. */
  1108. if (ep->rcv_win > RCV_BUFSIZ_M * 1024)
  1109. credits += ep->rcv_win - RCV_BUFSIZ_M * 1024;
  1110. req = (struct cpl_rx_data_ack *) skb_put(skb, wrlen);
  1111. memset(req, 0, wrlen);
  1112. INIT_TP_WR(req, ep->hwtid);
  1113. OPCODE_TID(req) = cpu_to_be32(MK_OPCODE_TID(CPL_RX_DATA_ACK,
  1114. ep->hwtid));
  1115. req->credit_dack = cpu_to_be32(credits | RX_FORCE_ACK_F |
  1116. F_RX_DACK_CHANGE |
  1117. V_RX_DACK_MODE(dack_mode));
  1118. set_wr_txq(skb, CPL_PRIORITY_ACK, ep->ctrlq_idx);
  1119. c4iw_ofld_send(&ep->com.dev->rdev, skb);
  1120. return credits;
  1121. }
  1122. #define RELAXED_IRD_NEGOTIATION 1
  1123. static int process_mpa_reply(struct c4iw_ep *ep, struct sk_buff *skb)
  1124. {
  1125. struct mpa_message *mpa;
  1126. struct mpa_v2_conn_params *mpa_v2_params;
  1127. u16 plen;
  1128. u16 resp_ird, resp_ord;
  1129. u8 rtr_mismatch = 0, insuff_ird = 0;
  1130. struct c4iw_qp_attributes attrs;
  1131. enum c4iw_qp_attr_mask mask;
  1132. int err;
  1133. int disconnect = 0;
  1134. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1135. /*
  1136. * Stop mpa timer. If it expired, then
  1137. * we ignore the MPA reply. process_timeout()
  1138. * will abort the connection.
  1139. */
  1140. if (stop_ep_timer(ep))
  1141. return 0;
  1142. /*
  1143. * If we get more than the supported amount of private data
  1144. * then we must fail this connection.
  1145. */
  1146. if (ep->mpa_pkt_len + skb->len > sizeof(ep->mpa_pkt)) {
  1147. err = -EINVAL;
  1148. goto err;
  1149. }
  1150. /*
  1151. * copy the new data into our accumulation buffer.
  1152. */
  1153. skb_copy_from_linear_data(skb, &(ep->mpa_pkt[ep->mpa_pkt_len]),
  1154. skb->len);
  1155. ep->mpa_pkt_len += skb->len;
  1156. /*
  1157. * if we don't even have the mpa message, then bail.
  1158. */
  1159. if (ep->mpa_pkt_len < sizeof(*mpa))
  1160. return 0;
  1161. mpa = (struct mpa_message *) ep->mpa_pkt;
  1162. /* Validate MPA header. */
  1163. if (mpa->revision > mpa_rev) {
  1164. printk(KERN_ERR MOD "%s MPA version mismatch. Local = %d,"
  1165. " Received = %d\n", __func__, mpa_rev, mpa->revision);
  1166. err = -EPROTO;
  1167. goto err;
  1168. }
  1169. if (memcmp(mpa->key, MPA_KEY_REP, sizeof(mpa->key))) {
  1170. err = -EPROTO;
  1171. goto err;
  1172. }
  1173. plen = ntohs(mpa->private_data_size);
  1174. /*
  1175. * Fail if there's too much private data.
  1176. */
  1177. if (plen > MPA_MAX_PRIVATE_DATA) {
  1178. err = -EPROTO;
  1179. goto err;
  1180. }
  1181. /*
  1182. * If plen does not account for pkt size
  1183. */
  1184. if (ep->mpa_pkt_len > (sizeof(*mpa) + plen)) {
  1185. err = -EPROTO;
  1186. goto err;
  1187. }
  1188. ep->plen = (u8) plen;
  1189. /*
  1190. * If we don't have all the pdata yet, then bail.
  1191. * We'll continue process when more data arrives.
  1192. */
  1193. if (ep->mpa_pkt_len < (sizeof(*mpa) + plen))
  1194. return 0;
  1195. if (mpa->flags & MPA_REJECT) {
  1196. err = -ECONNREFUSED;
  1197. goto err;
  1198. }
  1199. /*
  1200. * If we get here we have accumulated the entire mpa
  1201. * start reply message including private data. And
  1202. * the MPA header is valid.
  1203. */
  1204. __state_set(&ep->com, FPDU_MODE);
  1205. ep->mpa_attr.crc_enabled = (mpa->flags & MPA_CRC) | crc_enabled ? 1 : 0;
  1206. ep->mpa_attr.recv_marker_enabled = markers_enabled;
  1207. ep->mpa_attr.xmit_marker_enabled = mpa->flags & MPA_MARKERS ? 1 : 0;
  1208. ep->mpa_attr.version = mpa->revision;
  1209. ep->mpa_attr.p2p_type = FW_RI_INIT_P2PTYPE_DISABLED;
  1210. if (mpa->revision == 2) {
  1211. ep->mpa_attr.enhanced_rdma_conn =
  1212. mpa->flags & MPA_ENHANCED_RDMA_CONN ? 1 : 0;
  1213. if (ep->mpa_attr.enhanced_rdma_conn) {
  1214. mpa_v2_params = (struct mpa_v2_conn_params *)
  1215. (ep->mpa_pkt + sizeof(*mpa));
  1216. resp_ird = ntohs(mpa_v2_params->ird) &
  1217. MPA_V2_IRD_ORD_MASK;
  1218. resp_ord = ntohs(mpa_v2_params->ord) &
  1219. MPA_V2_IRD_ORD_MASK;
  1220. PDBG("%s responder ird %u ord %u ep ird %u ord %u\n",
  1221. __func__, resp_ird, resp_ord, ep->ird, ep->ord);
  1222. /*
  1223. * This is a double-check. Ideally, below checks are
  1224. * not required since ird/ord stuff has been taken
  1225. * care of in c4iw_accept_cr
  1226. */
  1227. if (ep->ird < resp_ord) {
  1228. if (RELAXED_IRD_NEGOTIATION && resp_ord <=
  1229. ep->com.dev->rdev.lldi.max_ordird_qp)
  1230. ep->ird = resp_ord;
  1231. else
  1232. insuff_ird = 1;
  1233. } else if (ep->ird > resp_ord) {
  1234. ep->ird = resp_ord;
  1235. }
  1236. if (ep->ord > resp_ird) {
  1237. if (RELAXED_IRD_NEGOTIATION)
  1238. ep->ord = resp_ird;
  1239. else
  1240. insuff_ird = 1;
  1241. }
  1242. if (insuff_ird) {
  1243. err = -ENOMEM;
  1244. ep->ird = resp_ord;
  1245. ep->ord = resp_ird;
  1246. }
  1247. if (ntohs(mpa_v2_params->ird) &
  1248. MPA_V2_PEER2PEER_MODEL) {
  1249. if (ntohs(mpa_v2_params->ord) &
  1250. MPA_V2_RDMA_WRITE_RTR)
  1251. ep->mpa_attr.p2p_type =
  1252. FW_RI_INIT_P2PTYPE_RDMA_WRITE;
  1253. else if (ntohs(mpa_v2_params->ord) &
  1254. MPA_V2_RDMA_READ_RTR)
  1255. ep->mpa_attr.p2p_type =
  1256. FW_RI_INIT_P2PTYPE_READ_REQ;
  1257. }
  1258. }
  1259. } else if (mpa->revision == 1)
  1260. if (peer2peer)
  1261. ep->mpa_attr.p2p_type = p2p_type;
  1262. PDBG("%s - crc_enabled=%d, recv_marker_enabled=%d, "
  1263. "xmit_marker_enabled=%d, version=%d p2p_type=%d local-p2p_type = "
  1264. "%d\n", __func__, ep->mpa_attr.crc_enabled,
  1265. ep->mpa_attr.recv_marker_enabled,
  1266. ep->mpa_attr.xmit_marker_enabled, ep->mpa_attr.version,
  1267. ep->mpa_attr.p2p_type, p2p_type);
  1268. /*
  1269. * If responder's RTR does not match with that of initiator, assign
  1270. * FW_RI_INIT_P2PTYPE_DISABLED in mpa attributes so that RTR is not
  1271. * generated when moving QP to RTS state.
  1272. * A TERM message will be sent after QP has moved to RTS state
  1273. */
  1274. if ((ep->mpa_attr.version == 2) && peer2peer &&
  1275. (ep->mpa_attr.p2p_type != p2p_type)) {
  1276. ep->mpa_attr.p2p_type = FW_RI_INIT_P2PTYPE_DISABLED;
  1277. rtr_mismatch = 1;
  1278. }
  1279. attrs.mpa_attr = ep->mpa_attr;
  1280. attrs.max_ird = ep->ird;
  1281. attrs.max_ord = ep->ord;
  1282. attrs.llp_stream_handle = ep;
  1283. attrs.next_state = C4IW_QP_STATE_RTS;
  1284. mask = C4IW_QP_ATTR_NEXT_STATE |
  1285. C4IW_QP_ATTR_LLP_STREAM_HANDLE | C4IW_QP_ATTR_MPA_ATTR |
  1286. C4IW_QP_ATTR_MAX_IRD | C4IW_QP_ATTR_MAX_ORD;
  1287. /* bind QP and TID with INIT_WR */
  1288. err = c4iw_modify_qp(ep->com.qp->rhp,
  1289. ep->com.qp, mask, &attrs, 1);
  1290. if (err)
  1291. goto err;
  1292. /*
  1293. * If responder's RTR requirement did not match with what initiator
  1294. * supports, generate TERM message
  1295. */
  1296. if (rtr_mismatch) {
  1297. printk(KERN_ERR "%s: RTR mismatch, sending TERM\n", __func__);
  1298. attrs.layer_etype = LAYER_MPA | DDP_LLP;
  1299. attrs.ecode = MPA_NOMATCH_RTR;
  1300. attrs.next_state = C4IW_QP_STATE_TERMINATE;
  1301. attrs.send_term = 1;
  1302. err = c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  1303. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  1304. err = -ENOMEM;
  1305. disconnect = 1;
  1306. goto out;
  1307. }
  1308. /*
  1309. * Generate TERM if initiator IRD is not sufficient for responder
  1310. * provided ORD. Currently, we do the same behaviour even when
  1311. * responder provided IRD is also not sufficient as regards to
  1312. * initiator ORD.
  1313. */
  1314. if (insuff_ird) {
  1315. printk(KERN_ERR "%s: Insufficient IRD, sending TERM\n",
  1316. __func__);
  1317. attrs.layer_etype = LAYER_MPA | DDP_LLP;
  1318. attrs.ecode = MPA_INSUFF_IRD;
  1319. attrs.next_state = C4IW_QP_STATE_TERMINATE;
  1320. attrs.send_term = 1;
  1321. err = c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  1322. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  1323. err = -ENOMEM;
  1324. disconnect = 1;
  1325. goto out;
  1326. }
  1327. goto out;
  1328. err:
  1329. __state_set(&ep->com, ABORTING);
  1330. send_abort(ep, skb, GFP_KERNEL);
  1331. out:
  1332. connect_reply_upcall(ep, err);
  1333. return disconnect;
  1334. }
  1335. static void process_mpa_request(struct c4iw_ep *ep, struct sk_buff *skb)
  1336. {
  1337. struct mpa_message *mpa;
  1338. struct mpa_v2_conn_params *mpa_v2_params;
  1339. u16 plen;
  1340. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1341. /*
  1342. * If we get more than the supported amount of private data
  1343. * then we must fail this connection.
  1344. */
  1345. if (ep->mpa_pkt_len + skb->len > sizeof(ep->mpa_pkt)) {
  1346. (void)stop_ep_timer(ep);
  1347. abort_connection(ep, skb, GFP_KERNEL);
  1348. return;
  1349. }
  1350. PDBG("%s enter (%s line %u)\n", __func__, __FILE__, __LINE__);
  1351. /*
  1352. * Copy the new data into our accumulation buffer.
  1353. */
  1354. skb_copy_from_linear_data(skb, &(ep->mpa_pkt[ep->mpa_pkt_len]),
  1355. skb->len);
  1356. ep->mpa_pkt_len += skb->len;
  1357. /*
  1358. * If we don't even have the mpa message, then bail.
  1359. * We'll continue process when more data arrives.
  1360. */
  1361. if (ep->mpa_pkt_len < sizeof(*mpa))
  1362. return;
  1363. PDBG("%s enter (%s line %u)\n", __func__, __FILE__, __LINE__);
  1364. mpa = (struct mpa_message *) ep->mpa_pkt;
  1365. /*
  1366. * Validate MPA Header.
  1367. */
  1368. if (mpa->revision > mpa_rev) {
  1369. printk(KERN_ERR MOD "%s MPA version mismatch. Local = %d,"
  1370. " Received = %d\n", __func__, mpa_rev, mpa->revision);
  1371. (void)stop_ep_timer(ep);
  1372. abort_connection(ep, skb, GFP_KERNEL);
  1373. return;
  1374. }
  1375. if (memcmp(mpa->key, MPA_KEY_REQ, sizeof(mpa->key))) {
  1376. (void)stop_ep_timer(ep);
  1377. abort_connection(ep, skb, GFP_KERNEL);
  1378. return;
  1379. }
  1380. plen = ntohs(mpa->private_data_size);
  1381. /*
  1382. * Fail if there's too much private data.
  1383. */
  1384. if (plen > MPA_MAX_PRIVATE_DATA) {
  1385. (void)stop_ep_timer(ep);
  1386. abort_connection(ep, skb, GFP_KERNEL);
  1387. return;
  1388. }
  1389. /*
  1390. * If plen does not account for pkt size
  1391. */
  1392. if (ep->mpa_pkt_len > (sizeof(*mpa) + plen)) {
  1393. (void)stop_ep_timer(ep);
  1394. abort_connection(ep, skb, GFP_KERNEL);
  1395. return;
  1396. }
  1397. ep->plen = (u8) plen;
  1398. /*
  1399. * If we don't have all the pdata yet, then bail.
  1400. */
  1401. if (ep->mpa_pkt_len < (sizeof(*mpa) + plen))
  1402. return;
  1403. /*
  1404. * If we get here we have accumulated the entire mpa
  1405. * start reply message including private data.
  1406. */
  1407. ep->mpa_attr.initiator = 0;
  1408. ep->mpa_attr.crc_enabled = (mpa->flags & MPA_CRC) | crc_enabled ? 1 : 0;
  1409. ep->mpa_attr.recv_marker_enabled = markers_enabled;
  1410. ep->mpa_attr.xmit_marker_enabled = mpa->flags & MPA_MARKERS ? 1 : 0;
  1411. ep->mpa_attr.version = mpa->revision;
  1412. if (mpa->revision == 1)
  1413. ep->tried_with_mpa_v1 = 1;
  1414. ep->mpa_attr.p2p_type = FW_RI_INIT_P2PTYPE_DISABLED;
  1415. if (mpa->revision == 2) {
  1416. ep->mpa_attr.enhanced_rdma_conn =
  1417. mpa->flags & MPA_ENHANCED_RDMA_CONN ? 1 : 0;
  1418. if (ep->mpa_attr.enhanced_rdma_conn) {
  1419. mpa_v2_params = (struct mpa_v2_conn_params *)
  1420. (ep->mpa_pkt + sizeof(*mpa));
  1421. ep->ird = ntohs(mpa_v2_params->ird) &
  1422. MPA_V2_IRD_ORD_MASK;
  1423. ep->ord = ntohs(mpa_v2_params->ord) &
  1424. MPA_V2_IRD_ORD_MASK;
  1425. PDBG("%s initiator ird %u ord %u\n", __func__, ep->ird,
  1426. ep->ord);
  1427. if (ntohs(mpa_v2_params->ird) & MPA_V2_PEER2PEER_MODEL)
  1428. if (peer2peer) {
  1429. if (ntohs(mpa_v2_params->ord) &
  1430. MPA_V2_RDMA_WRITE_RTR)
  1431. ep->mpa_attr.p2p_type =
  1432. FW_RI_INIT_P2PTYPE_RDMA_WRITE;
  1433. else if (ntohs(mpa_v2_params->ord) &
  1434. MPA_V2_RDMA_READ_RTR)
  1435. ep->mpa_attr.p2p_type =
  1436. FW_RI_INIT_P2PTYPE_READ_REQ;
  1437. }
  1438. }
  1439. } else if (mpa->revision == 1)
  1440. if (peer2peer)
  1441. ep->mpa_attr.p2p_type = p2p_type;
  1442. PDBG("%s - crc_enabled=%d, recv_marker_enabled=%d, "
  1443. "xmit_marker_enabled=%d, version=%d p2p_type=%d\n", __func__,
  1444. ep->mpa_attr.crc_enabled, ep->mpa_attr.recv_marker_enabled,
  1445. ep->mpa_attr.xmit_marker_enabled, ep->mpa_attr.version,
  1446. ep->mpa_attr.p2p_type);
  1447. /*
  1448. * If the endpoint timer already expired, then we ignore
  1449. * the start request. process_timeout() will abort
  1450. * the connection.
  1451. */
  1452. if (!stop_ep_timer(ep)) {
  1453. __state_set(&ep->com, MPA_REQ_RCVD);
  1454. /* drive upcall */
  1455. mutex_lock_nested(&ep->parent_ep->com.mutex,
  1456. SINGLE_DEPTH_NESTING);
  1457. if (ep->parent_ep->com.state != DEAD) {
  1458. if (connect_request_upcall(ep))
  1459. abort_connection(ep, skb, GFP_KERNEL);
  1460. } else {
  1461. abort_connection(ep, skb, GFP_KERNEL);
  1462. }
  1463. mutex_unlock(&ep->parent_ep->com.mutex);
  1464. }
  1465. return;
  1466. }
  1467. static int rx_data(struct c4iw_dev *dev, struct sk_buff *skb)
  1468. {
  1469. struct c4iw_ep *ep;
  1470. struct cpl_rx_data *hdr = cplhdr(skb);
  1471. unsigned int dlen = ntohs(hdr->len);
  1472. unsigned int tid = GET_TID(hdr);
  1473. struct tid_info *t = dev->rdev.lldi.tids;
  1474. __u8 status = hdr->status;
  1475. int disconnect = 0;
  1476. ep = lookup_tid(t, tid);
  1477. if (!ep)
  1478. return 0;
  1479. PDBG("%s ep %p tid %u dlen %u\n", __func__, ep, ep->hwtid, dlen);
  1480. skb_pull(skb, sizeof(*hdr));
  1481. skb_trim(skb, dlen);
  1482. mutex_lock(&ep->com.mutex);
  1483. /* update RX credits */
  1484. update_rx_credits(ep, dlen);
  1485. switch (ep->com.state) {
  1486. case MPA_REQ_SENT:
  1487. ep->rcv_seq += dlen;
  1488. disconnect = process_mpa_reply(ep, skb);
  1489. break;
  1490. case MPA_REQ_WAIT:
  1491. ep->rcv_seq += dlen;
  1492. process_mpa_request(ep, skb);
  1493. break;
  1494. case FPDU_MODE: {
  1495. struct c4iw_qp_attributes attrs;
  1496. BUG_ON(!ep->com.qp);
  1497. if (status)
  1498. pr_err("%s Unexpected streaming data." \
  1499. " qpid %u ep %p state %d tid %u status %d\n",
  1500. __func__, ep->com.qp->wq.sq.qid, ep,
  1501. ep->com.state, ep->hwtid, status);
  1502. attrs.next_state = C4IW_QP_STATE_TERMINATE;
  1503. c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  1504. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  1505. disconnect = 1;
  1506. break;
  1507. }
  1508. default:
  1509. break;
  1510. }
  1511. mutex_unlock(&ep->com.mutex);
  1512. if (disconnect)
  1513. c4iw_ep_disconnect(ep, 0, GFP_KERNEL);
  1514. return 0;
  1515. }
  1516. static int abort_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  1517. {
  1518. struct c4iw_ep *ep;
  1519. struct cpl_abort_rpl_rss *rpl = cplhdr(skb);
  1520. int release = 0;
  1521. unsigned int tid = GET_TID(rpl);
  1522. struct tid_info *t = dev->rdev.lldi.tids;
  1523. ep = lookup_tid(t, tid);
  1524. if (!ep) {
  1525. printk(KERN_WARNING MOD "Abort rpl to freed endpoint\n");
  1526. return 0;
  1527. }
  1528. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1529. mutex_lock(&ep->com.mutex);
  1530. switch (ep->com.state) {
  1531. case ABORTING:
  1532. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  1533. __state_set(&ep->com, DEAD);
  1534. release = 1;
  1535. break;
  1536. default:
  1537. printk(KERN_ERR "%s ep %p state %d\n",
  1538. __func__, ep, ep->com.state);
  1539. break;
  1540. }
  1541. mutex_unlock(&ep->com.mutex);
  1542. if (release)
  1543. release_ep_resources(ep);
  1544. return 0;
  1545. }
  1546. static void send_fw_act_open_req(struct c4iw_ep *ep, unsigned int atid)
  1547. {
  1548. struct sk_buff *skb;
  1549. struct fw_ofld_connection_wr *req;
  1550. unsigned int mtu_idx;
  1551. int wscale;
  1552. struct sockaddr_in *sin;
  1553. int win;
  1554. skb = get_skb(NULL, sizeof(*req), GFP_KERNEL);
  1555. req = (struct fw_ofld_connection_wr *)__skb_put(skb, sizeof(*req));
  1556. memset(req, 0, sizeof(*req));
  1557. req->op_compl = htonl(V_WR_OP(FW_OFLD_CONNECTION_WR));
  1558. req->len16_pkd = htonl(FW_WR_LEN16_V(DIV_ROUND_UP(sizeof(*req), 16)));
  1559. req->le.filter = cpu_to_be32(cxgb4_select_ntuple(
  1560. ep->com.dev->rdev.lldi.ports[0],
  1561. ep->l2t));
  1562. sin = (struct sockaddr_in *)&ep->com.mapped_local_addr;
  1563. req->le.lport = sin->sin_port;
  1564. req->le.u.ipv4.lip = sin->sin_addr.s_addr;
  1565. sin = (struct sockaddr_in *)&ep->com.mapped_remote_addr;
  1566. req->le.pport = sin->sin_port;
  1567. req->le.u.ipv4.pip = sin->sin_addr.s_addr;
  1568. req->tcb.t_state_to_astid =
  1569. htonl(FW_OFLD_CONNECTION_WR_T_STATE_V(TCP_SYN_SENT) |
  1570. FW_OFLD_CONNECTION_WR_ASTID_V(atid));
  1571. req->tcb.cplrxdataack_cplpassacceptrpl =
  1572. htons(FW_OFLD_CONNECTION_WR_CPLRXDATAACK_F);
  1573. req->tcb.tx_max = (__force __be32) jiffies;
  1574. req->tcb.rcv_adv = htons(1);
  1575. best_mtu(ep->com.dev->rdev.lldi.mtus, ep->mtu, &mtu_idx,
  1576. enable_tcp_timestamps,
  1577. (AF_INET == ep->com.remote_addr.ss_family) ? 0 : 1);
  1578. wscale = compute_wscale(rcv_win);
  1579. /*
  1580. * Specify the largest window that will fit in opt0. The
  1581. * remainder will be specified in the rx_data_ack.
  1582. */
  1583. win = ep->rcv_win >> 10;
  1584. if (win > RCV_BUFSIZ_M)
  1585. win = RCV_BUFSIZ_M;
  1586. req->tcb.opt0 = (__force __be64) (TCAM_BYPASS(1) |
  1587. (nocong ? NO_CONG(1) : 0) |
  1588. KEEP_ALIVE_F |
  1589. DELACK(1) |
  1590. WND_SCALE_V(wscale) |
  1591. MSS_IDX_V(mtu_idx) |
  1592. L2T_IDX_V(ep->l2t->idx) |
  1593. TX_CHAN_V(ep->tx_chan) |
  1594. SMAC_SEL_V(ep->smac_idx) |
  1595. DSCP(ep->tos) |
  1596. ULP_MODE_V(ULP_MODE_TCPDDP) |
  1597. RCV_BUFSIZ_V(win));
  1598. req->tcb.opt2 = (__force __be32) (PACE(1) |
  1599. TX_QUEUE(ep->com.dev->rdev.lldi.tx_modq[ep->tx_chan]) |
  1600. RX_CHANNEL_V(0) |
  1601. CCTRL_ECN(enable_ecn) |
  1602. RSS_QUEUE_VALID_F | RSS_QUEUE_V(ep->rss_qid));
  1603. if (enable_tcp_timestamps)
  1604. req->tcb.opt2 |= (__force __be32)TSTAMPS_EN(1);
  1605. if (enable_tcp_sack)
  1606. req->tcb.opt2 |= (__force __be32)SACK_EN(1);
  1607. if (wscale && enable_tcp_window_scaling)
  1608. req->tcb.opt2 |= (__force __be32)WND_SCALE_EN_F;
  1609. req->tcb.opt0 = cpu_to_be64((__force u64)req->tcb.opt0);
  1610. req->tcb.opt2 = cpu_to_be32((__force u32)req->tcb.opt2);
  1611. set_wr_txq(skb, CPL_PRIORITY_CONTROL, ep->ctrlq_idx);
  1612. set_bit(ACT_OFLD_CONN, &ep->com.history);
  1613. c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  1614. }
  1615. /*
  1616. * Return whether a failed active open has allocated a TID
  1617. */
  1618. static inline int act_open_has_tid(int status)
  1619. {
  1620. return status != CPL_ERR_TCAM_FULL && status != CPL_ERR_CONN_EXIST &&
  1621. status != CPL_ERR_ARP_MISS;
  1622. }
  1623. /* Returns whether a CPL status conveys negative advice.
  1624. */
  1625. static int is_neg_adv(unsigned int status)
  1626. {
  1627. return status == CPL_ERR_RTX_NEG_ADVICE ||
  1628. status == CPL_ERR_PERSIST_NEG_ADVICE ||
  1629. status == CPL_ERR_KEEPALV_NEG_ADVICE;
  1630. }
  1631. static char *neg_adv_str(unsigned int status)
  1632. {
  1633. switch (status) {
  1634. case CPL_ERR_RTX_NEG_ADVICE:
  1635. return "Retransmit timeout";
  1636. case CPL_ERR_PERSIST_NEG_ADVICE:
  1637. return "Persist timeout";
  1638. case CPL_ERR_KEEPALV_NEG_ADVICE:
  1639. return "Keepalive timeout";
  1640. default:
  1641. return "Unknown";
  1642. }
  1643. }
  1644. static void set_tcp_window(struct c4iw_ep *ep, struct port_info *pi)
  1645. {
  1646. ep->snd_win = snd_win;
  1647. ep->rcv_win = rcv_win;
  1648. PDBG("%s snd_win %d rcv_win %d\n", __func__, ep->snd_win, ep->rcv_win);
  1649. }
  1650. #define ACT_OPEN_RETRY_COUNT 2
  1651. static int import_ep(struct c4iw_ep *ep, int iptype, __u8 *peer_ip,
  1652. struct dst_entry *dst, struct c4iw_dev *cdev,
  1653. bool clear_mpa_v1)
  1654. {
  1655. struct neighbour *n;
  1656. int err, step;
  1657. struct net_device *pdev;
  1658. n = dst_neigh_lookup(dst, peer_ip);
  1659. if (!n)
  1660. return -ENODEV;
  1661. rcu_read_lock();
  1662. err = -ENOMEM;
  1663. if (n->dev->flags & IFF_LOOPBACK) {
  1664. if (iptype == 4)
  1665. pdev = ip_dev_find(&init_net, *(__be32 *)peer_ip);
  1666. else if (IS_ENABLED(CONFIG_IPV6))
  1667. for_each_netdev(&init_net, pdev) {
  1668. if (ipv6_chk_addr(&init_net,
  1669. (struct in6_addr *)peer_ip,
  1670. pdev, 1))
  1671. break;
  1672. }
  1673. else
  1674. pdev = NULL;
  1675. if (!pdev) {
  1676. err = -ENODEV;
  1677. goto out;
  1678. }
  1679. ep->l2t = cxgb4_l2t_get(cdev->rdev.lldi.l2t,
  1680. n, pdev, 0);
  1681. if (!ep->l2t)
  1682. goto out;
  1683. ep->mtu = pdev->mtu;
  1684. ep->tx_chan = cxgb4_port_chan(pdev);
  1685. ep->smac_idx = (cxgb4_port_viid(pdev) & 0x7F) << 1;
  1686. step = cdev->rdev.lldi.ntxq /
  1687. cdev->rdev.lldi.nchan;
  1688. ep->txq_idx = cxgb4_port_idx(pdev) * step;
  1689. step = cdev->rdev.lldi.nrxq /
  1690. cdev->rdev.lldi.nchan;
  1691. ep->ctrlq_idx = cxgb4_port_idx(pdev);
  1692. ep->rss_qid = cdev->rdev.lldi.rxq_ids[
  1693. cxgb4_port_idx(pdev) * step];
  1694. set_tcp_window(ep, (struct port_info *)netdev_priv(pdev));
  1695. dev_put(pdev);
  1696. } else {
  1697. pdev = get_real_dev(n->dev);
  1698. ep->l2t = cxgb4_l2t_get(cdev->rdev.lldi.l2t,
  1699. n, pdev, 0);
  1700. if (!ep->l2t)
  1701. goto out;
  1702. ep->mtu = dst_mtu(dst);
  1703. ep->tx_chan = cxgb4_port_chan(pdev);
  1704. ep->smac_idx = (cxgb4_port_viid(pdev) & 0x7F) << 1;
  1705. step = cdev->rdev.lldi.ntxq /
  1706. cdev->rdev.lldi.nchan;
  1707. ep->txq_idx = cxgb4_port_idx(pdev) * step;
  1708. ep->ctrlq_idx = cxgb4_port_idx(pdev);
  1709. step = cdev->rdev.lldi.nrxq /
  1710. cdev->rdev.lldi.nchan;
  1711. ep->rss_qid = cdev->rdev.lldi.rxq_ids[
  1712. cxgb4_port_idx(pdev) * step];
  1713. set_tcp_window(ep, (struct port_info *)netdev_priv(pdev));
  1714. if (clear_mpa_v1) {
  1715. ep->retry_with_mpa_v1 = 0;
  1716. ep->tried_with_mpa_v1 = 0;
  1717. }
  1718. }
  1719. err = 0;
  1720. out:
  1721. rcu_read_unlock();
  1722. neigh_release(n);
  1723. return err;
  1724. }
  1725. static int c4iw_reconnect(struct c4iw_ep *ep)
  1726. {
  1727. int err = 0;
  1728. struct sockaddr_in *laddr = (struct sockaddr_in *)
  1729. &ep->com.cm_id->local_addr;
  1730. struct sockaddr_in *raddr = (struct sockaddr_in *)
  1731. &ep->com.cm_id->remote_addr;
  1732. struct sockaddr_in6 *laddr6 = (struct sockaddr_in6 *)
  1733. &ep->com.cm_id->local_addr;
  1734. struct sockaddr_in6 *raddr6 = (struct sockaddr_in6 *)
  1735. &ep->com.cm_id->remote_addr;
  1736. int iptype;
  1737. __u8 *ra;
  1738. PDBG("%s qp %p cm_id %p\n", __func__, ep->com.qp, ep->com.cm_id);
  1739. init_timer(&ep->timer);
  1740. /*
  1741. * Allocate an active TID to initiate a TCP connection.
  1742. */
  1743. ep->atid = cxgb4_alloc_atid(ep->com.dev->rdev.lldi.tids, ep);
  1744. if (ep->atid == -1) {
  1745. pr_err("%s - cannot alloc atid.\n", __func__);
  1746. err = -ENOMEM;
  1747. goto fail2;
  1748. }
  1749. insert_handle(ep->com.dev, &ep->com.dev->atid_idr, ep, ep->atid);
  1750. /* find a route */
  1751. if (ep->com.cm_id->local_addr.ss_family == AF_INET) {
  1752. ep->dst = find_route(ep->com.dev, laddr->sin_addr.s_addr,
  1753. raddr->sin_addr.s_addr, laddr->sin_port,
  1754. raddr->sin_port, 0);
  1755. iptype = 4;
  1756. ra = (__u8 *)&raddr->sin_addr;
  1757. } else {
  1758. ep->dst = find_route6(ep->com.dev, laddr6->sin6_addr.s6_addr,
  1759. raddr6->sin6_addr.s6_addr,
  1760. laddr6->sin6_port, raddr6->sin6_port, 0,
  1761. raddr6->sin6_scope_id);
  1762. iptype = 6;
  1763. ra = (__u8 *)&raddr6->sin6_addr;
  1764. }
  1765. if (!ep->dst) {
  1766. pr_err("%s - cannot find route.\n", __func__);
  1767. err = -EHOSTUNREACH;
  1768. goto fail3;
  1769. }
  1770. err = import_ep(ep, iptype, ra, ep->dst, ep->com.dev, false);
  1771. if (err) {
  1772. pr_err("%s - cannot alloc l2e.\n", __func__);
  1773. goto fail4;
  1774. }
  1775. PDBG("%s txq_idx %u tx_chan %u smac_idx %u rss_qid %u l2t_idx %u\n",
  1776. __func__, ep->txq_idx, ep->tx_chan, ep->smac_idx, ep->rss_qid,
  1777. ep->l2t->idx);
  1778. state_set(&ep->com, CONNECTING);
  1779. ep->tos = 0;
  1780. /* send connect request to rnic */
  1781. err = send_connect(ep);
  1782. if (!err)
  1783. goto out;
  1784. cxgb4_l2t_release(ep->l2t);
  1785. fail4:
  1786. dst_release(ep->dst);
  1787. fail3:
  1788. remove_handle(ep->com.dev, &ep->com.dev->atid_idr, ep->atid);
  1789. cxgb4_free_atid(ep->com.dev->rdev.lldi.tids, ep->atid);
  1790. fail2:
  1791. /*
  1792. * remember to send notification to upper layer.
  1793. * We are in here so the upper layer is not aware that this is
  1794. * re-connect attempt and so, upper layer is still waiting for
  1795. * response of 1st connect request.
  1796. */
  1797. connect_reply_upcall(ep, -ECONNRESET);
  1798. c4iw_put_ep(&ep->com);
  1799. out:
  1800. return err;
  1801. }
  1802. static int act_open_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  1803. {
  1804. struct c4iw_ep *ep;
  1805. struct cpl_act_open_rpl *rpl = cplhdr(skb);
  1806. unsigned int atid = GET_TID_TID(GET_AOPEN_ATID(
  1807. ntohl(rpl->atid_status)));
  1808. struct tid_info *t = dev->rdev.lldi.tids;
  1809. int status = GET_AOPEN_STATUS(ntohl(rpl->atid_status));
  1810. struct sockaddr_in *la;
  1811. struct sockaddr_in *ra;
  1812. struct sockaddr_in6 *la6;
  1813. struct sockaddr_in6 *ra6;
  1814. ep = lookup_atid(t, atid);
  1815. la = (struct sockaddr_in *)&ep->com.mapped_local_addr;
  1816. ra = (struct sockaddr_in *)&ep->com.mapped_remote_addr;
  1817. la6 = (struct sockaddr_in6 *)&ep->com.mapped_local_addr;
  1818. ra6 = (struct sockaddr_in6 *)&ep->com.mapped_remote_addr;
  1819. PDBG("%s ep %p atid %u status %u errno %d\n", __func__, ep, atid,
  1820. status, status2errno(status));
  1821. if (is_neg_adv(status)) {
  1822. dev_warn(&dev->rdev.lldi.pdev->dev,
  1823. "Connection problems for atid %u status %u (%s)\n",
  1824. atid, status, neg_adv_str(status));
  1825. return 0;
  1826. }
  1827. set_bit(ACT_OPEN_RPL, &ep->com.history);
  1828. /*
  1829. * Log interesting failures.
  1830. */
  1831. switch (status) {
  1832. case CPL_ERR_CONN_RESET:
  1833. case CPL_ERR_CONN_TIMEDOUT:
  1834. break;
  1835. case CPL_ERR_TCAM_FULL:
  1836. mutex_lock(&dev->rdev.stats.lock);
  1837. dev->rdev.stats.tcam_full++;
  1838. mutex_unlock(&dev->rdev.stats.lock);
  1839. if (ep->com.local_addr.ss_family == AF_INET &&
  1840. dev->rdev.lldi.enable_fw_ofld_conn) {
  1841. send_fw_act_open_req(ep,
  1842. GET_TID_TID(GET_AOPEN_ATID(
  1843. ntohl(rpl->atid_status))));
  1844. return 0;
  1845. }
  1846. break;
  1847. case CPL_ERR_CONN_EXIST:
  1848. if (ep->retry_count++ < ACT_OPEN_RETRY_COUNT) {
  1849. set_bit(ACT_RETRY_INUSE, &ep->com.history);
  1850. remove_handle(ep->com.dev, &ep->com.dev->atid_idr,
  1851. atid);
  1852. cxgb4_free_atid(t, atid);
  1853. dst_release(ep->dst);
  1854. cxgb4_l2t_release(ep->l2t);
  1855. c4iw_reconnect(ep);
  1856. return 0;
  1857. }
  1858. break;
  1859. default:
  1860. if (ep->com.local_addr.ss_family == AF_INET) {
  1861. pr_info("Active open failure - atid %u status %u errno %d %pI4:%u->%pI4:%u\n",
  1862. atid, status, status2errno(status),
  1863. &la->sin_addr.s_addr, ntohs(la->sin_port),
  1864. &ra->sin_addr.s_addr, ntohs(ra->sin_port));
  1865. } else {
  1866. pr_info("Active open failure - atid %u status %u errno %d %pI6:%u->%pI6:%u\n",
  1867. atid, status, status2errno(status),
  1868. la6->sin6_addr.s6_addr, ntohs(la6->sin6_port),
  1869. ra6->sin6_addr.s6_addr, ntohs(ra6->sin6_port));
  1870. }
  1871. break;
  1872. }
  1873. connect_reply_upcall(ep, status2errno(status));
  1874. state_set(&ep->com, DEAD);
  1875. if (status && act_open_has_tid(status))
  1876. cxgb4_remove_tid(ep->com.dev->rdev.lldi.tids, 0, GET_TID(rpl));
  1877. remove_handle(ep->com.dev, &ep->com.dev->atid_idr, atid);
  1878. cxgb4_free_atid(t, atid);
  1879. dst_release(ep->dst);
  1880. cxgb4_l2t_release(ep->l2t);
  1881. c4iw_put_ep(&ep->com);
  1882. return 0;
  1883. }
  1884. static int pass_open_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  1885. {
  1886. struct cpl_pass_open_rpl *rpl = cplhdr(skb);
  1887. struct tid_info *t = dev->rdev.lldi.tids;
  1888. unsigned int stid = GET_TID(rpl);
  1889. struct c4iw_listen_ep *ep = lookup_stid(t, stid);
  1890. if (!ep) {
  1891. PDBG("%s stid %d lookup failure!\n", __func__, stid);
  1892. goto out;
  1893. }
  1894. PDBG("%s ep %p status %d error %d\n", __func__, ep,
  1895. rpl->status, status2errno(rpl->status));
  1896. c4iw_wake_up(&ep->com.wr_wait, status2errno(rpl->status));
  1897. out:
  1898. return 0;
  1899. }
  1900. static int close_listsrv_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  1901. {
  1902. struct cpl_close_listsvr_rpl *rpl = cplhdr(skb);
  1903. struct tid_info *t = dev->rdev.lldi.tids;
  1904. unsigned int stid = GET_TID(rpl);
  1905. struct c4iw_listen_ep *ep = lookup_stid(t, stid);
  1906. PDBG("%s ep %p\n", __func__, ep);
  1907. c4iw_wake_up(&ep->com.wr_wait, status2errno(rpl->status));
  1908. return 0;
  1909. }
  1910. static void accept_cr(struct c4iw_ep *ep, struct sk_buff *skb,
  1911. struct cpl_pass_accept_req *req)
  1912. {
  1913. struct cpl_pass_accept_rpl *rpl;
  1914. unsigned int mtu_idx;
  1915. u64 opt0;
  1916. u32 opt2;
  1917. int wscale;
  1918. struct cpl_t5_pass_accept_rpl *rpl5 = NULL;
  1919. int win;
  1920. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  1921. BUG_ON(skb_cloned(skb));
  1922. skb_get(skb);
  1923. rpl = cplhdr(skb);
  1924. if (is_t5(ep->com.dev->rdev.lldi.adapter_type)) {
  1925. skb_trim(skb, roundup(sizeof(*rpl5), 16));
  1926. rpl5 = (void *)rpl;
  1927. INIT_TP_WR(rpl5, ep->hwtid);
  1928. } else {
  1929. skb_trim(skb, sizeof(*rpl));
  1930. INIT_TP_WR(rpl, ep->hwtid);
  1931. }
  1932. OPCODE_TID(rpl) = cpu_to_be32(MK_OPCODE_TID(CPL_PASS_ACCEPT_RPL,
  1933. ep->hwtid));
  1934. best_mtu(ep->com.dev->rdev.lldi.mtus, ep->mtu, &mtu_idx,
  1935. enable_tcp_timestamps && req->tcpopt.tstamp,
  1936. (AF_INET == ep->com.remote_addr.ss_family) ? 0 : 1);
  1937. wscale = compute_wscale(rcv_win);
  1938. /*
  1939. * Specify the largest window that will fit in opt0. The
  1940. * remainder will be specified in the rx_data_ack.
  1941. */
  1942. win = ep->rcv_win >> 10;
  1943. if (win > RCV_BUFSIZ_M)
  1944. win = RCV_BUFSIZ_M;
  1945. opt0 = (nocong ? NO_CONG(1) : 0) |
  1946. KEEP_ALIVE_F |
  1947. DELACK(1) |
  1948. WND_SCALE_V(wscale) |
  1949. MSS_IDX_V(mtu_idx) |
  1950. L2T_IDX_V(ep->l2t->idx) |
  1951. TX_CHAN_V(ep->tx_chan) |
  1952. SMAC_SEL_V(ep->smac_idx) |
  1953. DSCP(ep->tos >> 2) |
  1954. ULP_MODE_V(ULP_MODE_TCPDDP) |
  1955. RCV_BUFSIZ_V(win);
  1956. opt2 = RX_CHANNEL_V(0) |
  1957. RSS_QUEUE_VALID_F | RSS_QUEUE_V(ep->rss_qid);
  1958. if (enable_tcp_timestamps && req->tcpopt.tstamp)
  1959. opt2 |= TSTAMPS_EN(1);
  1960. if (enable_tcp_sack && req->tcpopt.sack)
  1961. opt2 |= SACK_EN(1);
  1962. if (wscale && enable_tcp_window_scaling)
  1963. opt2 |= WND_SCALE_EN_F;
  1964. if (enable_ecn) {
  1965. const struct tcphdr *tcph;
  1966. u32 hlen = ntohl(req->hdr_len);
  1967. tcph = (const void *)(req + 1) + G_ETH_HDR_LEN(hlen) +
  1968. G_IP_HDR_LEN(hlen);
  1969. if (tcph->ece && tcph->cwr)
  1970. opt2 |= CCTRL_ECN(1);
  1971. }
  1972. if (is_t5(ep->com.dev->rdev.lldi.adapter_type)) {
  1973. u32 isn = (prandom_u32() & ~7UL) - 1;
  1974. opt2 |= T5_OPT_2_VALID_F;
  1975. opt2 |= V_CONG_CNTRL(CONG_ALG_TAHOE);
  1976. opt2 |= CONG_CNTRL_VALID; /* OPT_2_ISS for T5 */
  1977. rpl5 = (void *)rpl;
  1978. memset(&rpl5->iss, 0, roundup(sizeof(*rpl5)-sizeof(*rpl), 16));
  1979. if (peer2peer)
  1980. isn += 4;
  1981. rpl5->iss = cpu_to_be32(isn);
  1982. PDBG("%s iss %u\n", __func__, be32_to_cpu(rpl5->iss));
  1983. }
  1984. rpl->opt0 = cpu_to_be64(opt0);
  1985. rpl->opt2 = cpu_to_be32(opt2);
  1986. set_wr_txq(skb, CPL_PRIORITY_SETUP, ep->ctrlq_idx);
  1987. t4_set_arp_err_handler(skb, NULL, arp_failure_discard);
  1988. c4iw_l2t_send(&ep->com.dev->rdev, skb, ep->l2t);
  1989. return;
  1990. }
  1991. static void reject_cr(struct c4iw_dev *dev, u32 hwtid, struct sk_buff *skb)
  1992. {
  1993. PDBG("%s c4iw_dev %p tid %u\n", __func__, dev, hwtid);
  1994. BUG_ON(skb_cloned(skb));
  1995. skb_trim(skb, sizeof(struct cpl_tid_release));
  1996. release_tid(&dev->rdev, hwtid, skb);
  1997. return;
  1998. }
  1999. static void get_4tuple(struct cpl_pass_accept_req *req, int *iptype,
  2000. __u8 *local_ip, __u8 *peer_ip,
  2001. __be16 *local_port, __be16 *peer_port)
  2002. {
  2003. int eth_len = G_ETH_HDR_LEN(be32_to_cpu(req->hdr_len));
  2004. int ip_len = G_IP_HDR_LEN(be32_to_cpu(req->hdr_len));
  2005. struct iphdr *ip = (struct iphdr *)((u8 *)(req + 1) + eth_len);
  2006. struct ipv6hdr *ip6 = (struct ipv6hdr *)((u8 *)(req + 1) + eth_len);
  2007. struct tcphdr *tcp = (struct tcphdr *)
  2008. ((u8 *)(req + 1) + eth_len + ip_len);
  2009. if (ip->version == 4) {
  2010. PDBG("%s saddr 0x%x daddr 0x%x sport %u dport %u\n", __func__,
  2011. ntohl(ip->saddr), ntohl(ip->daddr), ntohs(tcp->source),
  2012. ntohs(tcp->dest));
  2013. *iptype = 4;
  2014. memcpy(peer_ip, &ip->saddr, 4);
  2015. memcpy(local_ip, &ip->daddr, 4);
  2016. } else {
  2017. PDBG("%s saddr %pI6 daddr %pI6 sport %u dport %u\n", __func__,
  2018. ip6->saddr.s6_addr, ip6->daddr.s6_addr, ntohs(tcp->source),
  2019. ntohs(tcp->dest));
  2020. *iptype = 6;
  2021. memcpy(peer_ip, ip6->saddr.s6_addr, 16);
  2022. memcpy(local_ip, ip6->daddr.s6_addr, 16);
  2023. }
  2024. *peer_port = tcp->source;
  2025. *local_port = tcp->dest;
  2026. return;
  2027. }
  2028. static int pass_accept_req(struct c4iw_dev *dev, struct sk_buff *skb)
  2029. {
  2030. struct c4iw_ep *child_ep = NULL, *parent_ep;
  2031. struct cpl_pass_accept_req *req = cplhdr(skb);
  2032. unsigned int stid = GET_POPEN_TID(ntohl(req->tos_stid));
  2033. struct tid_info *t = dev->rdev.lldi.tids;
  2034. unsigned int hwtid = GET_TID(req);
  2035. struct dst_entry *dst;
  2036. __u8 local_ip[16], peer_ip[16];
  2037. __be16 local_port, peer_port;
  2038. int err;
  2039. u16 peer_mss = ntohs(req->tcpopt.mss);
  2040. int iptype;
  2041. unsigned short hdrs;
  2042. parent_ep = lookup_stid(t, stid);
  2043. if (!parent_ep) {
  2044. PDBG("%s connect request on invalid stid %d\n", __func__, stid);
  2045. goto reject;
  2046. }
  2047. if (state_read(&parent_ep->com) != LISTEN) {
  2048. printk(KERN_ERR "%s - listening ep not in LISTEN\n",
  2049. __func__);
  2050. goto reject;
  2051. }
  2052. get_4tuple(req, &iptype, local_ip, peer_ip, &local_port, &peer_port);
  2053. /* Find output route */
  2054. if (iptype == 4) {
  2055. PDBG("%s parent ep %p hwtid %u laddr %pI4 raddr %pI4 lport %d rport %d peer_mss %d\n"
  2056. , __func__, parent_ep, hwtid,
  2057. local_ip, peer_ip, ntohs(local_port),
  2058. ntohs(peer_port), peer_mss);
  2059. dst = find_route(dev, *(__be32 *)local_ip, *(__be32 *)peer_ip,
  2060. local_port, peer_port,
  2061. GET_POPEN_TOS(ntohl(req->tos_stid)));
  2062. } else {
  2063. PDBG("%s parent ep %p hwtid %u laddr %pI6 raddr %pI6 lport %d rport %d peer_mss %d\n"
  2064. , __func__, parent_ep, hwtid,
  2065. local_ip, peer_ip, ntohs(local_port),
  2066. ntohs(peer_port), peer_mss);
  2067. dst = find_route6(dev, local_ip, peer_ip, local_port, peer_port,
  2068. PASS_OPEN_TOS(ntohl(req->tos_stid)),
  2069. ((struct sockaddr_in6 *)
  2070. &parent_ep->com.local_addr)->sin6_scope_id);
  2071. }
  2072. if (!dst) {
  2073. printk(KERN_ERR MOD "%s - failed to find dst entry!\n",
  2074. __func__);
  2075. goto reject;
  2076. }
  2077. child_ep = alloc_ep(sizeof(*child_ep), GFP_KERNEL);
  2078. if (!child_ep) {
  2079. printk(KERN_ERR MOD "%s - failed to allocate ep entry!\n",
  2080. __func__);
  2081. dst_release(dst);
  2082. goto reject;
  2083. }
  2084. err = import_ep(child_ep, iptype, peer_ip, dst, dev, false);
  2085. if (err) {
  2086. printk(KERN_ERR MOD "%s - failed to allocate l2t entry!\n",
  2087. __func__);
  2088. dst_release(dst);
  2089. kfree(child_ep);
  2090. goto reject;
  2091. }
  2092. hdrs = sizeof(struct iphdr) + sizeof(struct tcphdr) +
  2093. ((enable_tcp_timestamps && req->tcpopt.tstamp) ? 12 : 0);
  2094. if (peer_mss && child_ep->mtu > (peer_mss + hdrs))
  2095. child_ep->mtu = peer_mss + hdrs;
  2096. state_set(&child_ep->com, CONNECTING);
  2097. child_ep->com.dev = dev;
  2098. child_ep->com.cm_id = NULL;
  2099. if (iptype == 4) {
  2100. struct sockaddr_in *sin = (struct sockaddr_in *)
  2101. &child_ep->com.local_addr;
  2102. sin->sin_family = PF_INET;
  2103. sin->sin_port = local_port;
  2104. sin->sin_addr.s_addr = *(__be32 *)local_ip;
  2105. sin = (struct sockaddr_in *)&child_ep->com.remote_addr;
  2106. sin->sin_family = PF_INET;
  2107. sin->sin_port = peer_port;
  2108. sin->sin_addr.s_addr = *(__be32 *)peer_ip;
  2109. } else {
  2110. struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)
  2111. &child_ep->com.local_addr;
  2112. sin6->sin6_family = PF_INET6;
  2113. sin6->sin6_port = local_port;
  2114. memcpy(sin6->sin6_addr.s6_addr, local_ip, 16);
  2115. sin6 = (struct sockaddr_in6 *)&child_ep->com.remote_addr;
  2116. sin6->sin6_family = PF_INET6;
  2117. sin6->sin6_port = peer_port;
  2118. memcpy(sin6->sin6_addr.s6_addr, peer_ip, 16);
  2119. }
  2120. c4iw_get_ep(&parent_ep->com);
  2121. child_ep->parent_ep = parent_ep;
  2122. child_ep->tos = GET_POPEN_TOS(ntohl(req->tos_stid));
  2123. child_ep->dst = dst;
  2124. child_ep->hwtid = hwtid;
  2125. PDBG("%s tx_chan %u smac_idx %u rss_qid %u\n", __func__,
  2126. child_ep->tx_chan, child_ep->smac_idx, child_ep->rss_qid);
  2127. init_timer(&child_ep->timer);
  2128. cxgb4_insert_tid(t, child_ep, hwtid);
  2129. insert_handle(dev, &dev->hwtid_idr, child_ep, child_ep->hwtid);
  2130. accept_cr(child_ep, skb, req);
  2131. set_bit(PASS_ACCEPT_REQ, &child_ep->com.history);
  2132. goto out;
  2133. reject:
  2134. reject_cr(dev, hwtid, skb);
  2135. out:
  2136. return 0;
  2137. }
  2138. static int pass_establish(struct c4iw_dev *dev, struct sk_buff *skb)
  2139. {
  2140. struct c4iw_ep *ep;
  2141. struct cpl_pass_establish *req = cplhdr(skb);
  2142. struct tid_info *t = dev->rdev.lldi.tids;
  2143. unsigned int tid = GET_TID(req);
  2144. ep = lookup_tid(t, tid);
  2145. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  2146. ep->snd_seq = be32_to_cpu(req->snd_isn);
  2147. ep->rcv_seq = be32_to_cpu(req->rcv_isn);
  2148. PDBG("%s ep %p hwtid %u tcp_opt 0x%02x\n", __func__, ep, tid,
  2149. ntohs(req->tcp_opt));
  2150. set_emss(ep, ntohs(req->tcp_opt));
  2151. dst_confirm(ep->dst);
  2152. state_set(&ep->com, MPA_REQ_WAIT);
  2153. start_ep_timer(ep);
  2154. send_flowc(ep, skb);
  2155. set_bit(PASS_ESTAB, &ep->com.history);
  2156. return 0;
  2157. }
  2158. static int peer_close(struct c4iw_dev *dev, struct sk_buff *skb)
  2159. {
  2160. struct cpl_peer_close *hdr = cplhdr(skb);
  2161. struct c4iw_ep *ep;
  2162. struct c4iw_qp_attributes attrs;
  2163. int disconnect = 1;
  2164. int release = 0;
  2165. struct tid_info *t = dev->rdev.lldi.tids;
  2166. unsigned int tid = GET_TID(hdr);
  2167. int ret;
  2168. ep = lookup_tid(t, tid);
  2169. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  2170. dst_confirm(ep->dst);
  2171. set_bit(PEER_CLOSE, &ep->com.history);
  2172. mutex_lock(&ep->com.mutex);
  2173. switch (ep->com.state) {
  2174. case MPA_REQ_WAIT:
  2175. __state_set(&ep->com, CLOSING);
  2176. break;
  2177. case MPA_REQ_SENT:
  2178. __state_set(&ep->com, CLOSING);
  2179. connect_reply_upcall(ep, -ECONNRESET);
  2180. break;
  2181. case MPA_REQ_RCVD:
  2182. /*
  2183. * We're gonna mark this puppy DEAD, but keep
  2184. * the reference on it until the ULP accepts or
  2185. * rejects the CR. Also wake up anyone waiting
  2186. * in rdma connection migration (see c4iw_accept_cr()).
  2187. */
  2188. __state_set(&ep->com, CLOSING);
  2189. PDBG("waking up ep %p tid %u\n", ep, ep->hwtid);
  2190. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  2191. break;
  2192. case MPA_REP_SENT:
  2193. __state_set(&ep->com, CLOSING);
  2194. PDBG("waking up ep %p tid %u\n", ep, ep->hwtid);
  2195. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  2196. break;
  2197. case FPDU_MODE:
  2198. start_ep_timer(ep);
  2199. __state_set(&ep->com, CLOSING);
  2200. attrs.next_state = C4IW_QP_STATE_CLOSING;
  2201. ret = c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  2202. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  2203. if (ret != -ECONNRESET) {
  2204. peer_close_upcall(ep);
  2205. disconnect = 1;
  2206. }
  2207. break;
  2208. case ABORTING:
  2209. disconnect = 0;
  2210. break;
  2211. case CLOSING:
  2212. __state_set(&ep->com, MORIBUND);
  2213. disconnect = 0;
  2214. break;
  2215. case MORIBUND:
  2216. (void)stop_ep_timer(ep);
  2217. if (ep->com.cm_id && ep->com.qp) {
  2218. attrs.next_state = C4IW_QP_STATE_IDLE;
  2219. c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  2220. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  2221. }
  2222. close_complete_upcall(ep, 0);
  2223. __state_set(&ep->com, DEAD);
  2224. release = 1;
  2225. disconnect = 0;
  2226. break;
  2227. case DEAD:
  2228. disconnect = 0;
  2229. break;
  2230. default:
  2231. BUG_ON(1);
  2232. }
  2233. mutex_unlock(&ep->com.mutex);
  2234. if (disconnect)
  2235. c4iw_ep_disconnect(ep, 0, GFP_KERNEL);
  2236. if (release)
  2237. release_ep_resources(ep);
  2238. return 0;
  2239. }
  2240. static int peer_abort(struct c4iw_dev *dev, struct sk_buff *skb)
  2241. {
  2242. struct cpl_abort_req_rss *req = cplhdr(skb);
  2243. struct c4iw_ep *ep;
  2244. struct cpl_abort_rpl *rpl;
  2245. struct sk_buff *rpl_skb;
  2246. struct c4iw_qp_attributes attrs;
  2247. int ret;
  2248. int release = 0;
  2249. struct tid_info *t = dev->rdev.lldi.tids;
  2250. unsigned int tid = GET_TID(req);
  2251. ep = lookup_tid(t, tid);
  2252. if (is_neg_adv(req->status)) {
  2253. dev_warn(&dev->rdev.lldi.pdev->dev,
  2254. "Negative advice on abort - tid %u status %d (%s)\n",
  2255. ep->hwtid, req->status, neg_adv_str(req->status));
  2256. return 0;
  2257. }
  2258. PDBG("%s ep %p tid %u state %u\n", __func__, ep, ep->hwtid,
  2259. ep->com.state);
  2260. set_bit(PEER_ABORT, &ep->com.history);
  2261. /*
  2262. * Wake up any threads in rdma_init() or rdma_fini().
  2263. * However, this is not needed if com state is just
  2264. * MPA_REQ_SENT
  2265. */
  2266. if (ep->com.state != MPA_REQ_SENT)
  2267. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  2268. mutex_lock(&ep->com.mutex);
  2269. switch (ep->com.state) {
  2270. case CONNECTING:
  2271. break;
  2272. case MPA_REQ_WAIT:
  2273. (void)stop_ep_timer(ep);
  2274. break;
  2275. case MPA_REQ_SENT:
  2276. (void)stop_ep_timer(ep);
  2277. if (mpa_rev == 1 || (mpa_rev == 2 && ep->tried_with_mpa_v1))
  2278. connect_reply_upcall(ep, -ECONNRESET);
  2279. else {
  2280. /*
  2281. * we just don't send notification upwards because we
  2282. * want to retry with mpa_v1 without upper layers even
  2283. * knowing it.
  2284. *
  2285. * do some housekeeping so as to re-initiate the
  2286. * connection
  2287. */
  2288. PDBG("%s: mpa_rev=%d. Retrying with mpav1\n", __func__,
  2289. mpa_rev);
  2290. ep->retry_with_mpa_v1 = 1;
  2291. }
  2292. break;
  2293. case MPA_REP_SENT:
  2294. break;
  2295. case MPA_REQ_RCVD:
  2296. break;
  2297. case MORIBUND:
  2298. case CLOSING:
  2299. stop_ep_timer(ep);
  2300. /*FALLTHROUGH*/
  2301. case FPDU_MODE:
  2302. if (ep->com.cm_id && ep->com.qp) {
  2303. attrs.next_state = C4IW_QP_STATE_ERROR;
  2304. ret = c4iw_modify_qp(ep->com.qp->rhp,
  2305. ep->com.qp, C4IW_QP_ATTR_NEXT_STATE,
  2306. &attrs, 1);
  2307. if (ret)
  2308. printk(KERN_ERR MOD
  2309. "%s - qp <- error failed!\n",
  2310. __func__);
  2311. }
  2312. peer_abort_upcall(ep);
  2313. break;
  2314. case ABORTING:
  2315. break;
  2316. case DEAD:
  2317. PDBG("%s PEER_ABORT IN DEAD STATE!!!!\n", __func__);
  2318. mutex_unlock(&ep->com.mutex);
  2319. return 0;
  2320. default:
  2321. BUG_ON(1);
  2322. break;
  2323. }
  2324. dst_confirm(ep->dst);
  2325. if (ep->com.state != ABORTING) {
  2326. __state_set(&ep->com, DEAD);
  2327. /* we don't release if we want to retry with mpa_v1 */
  2328. if (!ep->retry_with_mpa_v1)
  2329. release = 1;
  2330. }
  2331. mutex_unlock(&ep->com.mutex);
  2332. rpl_skb = get_skb(skb, sizeof(*rpl), GFP_KERNEL);
  2333. if (!rpl_skb) {
  2334. printk(KERN_ERR MOD "%s - cannot allocate skb!\n",
  2335. __func__);
  2336. release = 1;
  2337. goto out;
  2338. }
  2339. set_wr_txq(skb, CPL_PRIORITY_DATA, ep->txq_idx);
  2340. rpl = (struct cpl_abort_rpl *) skb_put(rpl_skb, sizeof(*rpl));
  2341. INIT_TP_WR(rpl, ep->hwtid);
  2342. OPCODE_TID(rpl) = cpu_to_be32(MK_OPCODE_TID(CPL_ABORT_RPL, ep->hwtid));
  2343. rpl->cmd = CPL_ABORT_NO_RST;
  2344. c4iw_ofld_send(&ep->com.dev->rdev, rpl_skb);
  2345. out:
  2346. if (release)
  2347. release_ep_resources(ep);
  2348. else if (ep->retry_with_mpa_v1) {
  2349. remove_handle(ep->com.dev, &ep->com.dev->hwtid_idr, ep->hwtid);
  2350. cxgb4_remove_tid(ep->com.dev->rdev.lldi.tids, 0, ep->hwtid);
  2351. dst_release(ep->dst);
  2352. cxgb4_l2t_release(ep->l2t);
  2353. c4iw_reconnect(ep);
  2354. }
  2355. return 0;
  2356. }
  2357. static int close_con_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  2358. {
  2359. struct c4iw_ep *ep;
  2360. struct c4iw_qp_attributes attrs;
  2361. struct cpl_close_con_rpl *rpl = cplhdr(skb);
  2362. int release = 0;
  2363. struct tid_info *t = dev->rdev.lldi.tids;
  2364. unsigned int tid = GET_TID(rpl);
  2365. ep = lookup_tid(t, tid);
  2366. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  2367. BUG_ON(!ep);
  2368. /* The cm_id may be null if we failed to connect */
  2369. mutex_lock(&ep->com.mutex);
  2370. switch (ep->com.state) {
  2371. case CLOSING:
  2372. __state_set(&ep->com, MORIBUND);
  2373. break;
  2374. case MORIBUND:
  2375. (void)stop_ep_timer(ep);
  2376. if ((ep->com.cm_id) && (ep->com.qp)) {
  2377. attrs.next_state = C4IW_QP_STATE_IDLE;
  2378. c4iw_modify_qp(ep->com.qp->rhp,
  2379. ep->com.qp,
  2380. C4IW_QP_ATTR_NEXT_STATE,
  2381. &attrs, 1);
  2382. }
  2383. close_complete_upcall(ep, 0);
  2384. __state_set(&ep->com, DEAD);
  2385. release = 1;
  2386. break;
  2387. case ABORTING:
  2388. case DEAD:
  2389. break;
  2390. default:
  2391. BUG_ON(1);
  2392. break;
  2393. }
  2394. mutex_unlock(&ep->com.mutex);
  2395. if (release)
  2396. release_ep_resources(ep);
  2397. return 0;
  2398. }
  2399. static int terminate(struct c4iw_dev *dev, struct sk_buff *skb)
  2400. {
  2401. struct cpl_rdma_terminate *rpl = cplhdr(skb);
  2402. struct tid_info *t = dev->rdev.lldi.tids;
  2403. unsigned int tid = GET_TID(rpl);
  2404. struct c4iw_ep *ep;
  2405. struct c4iw_qp_attributes attrs;
  2406. ep = lookup_tid(t, tid);
  2407. BUG_ON(!ep);
  2408. if (ep && ep->com.qp) {
  2409. printk(KERN_WARNING MOD "TERM received tid %u qpid %u\n", tid,
  2410. ep->com.qp->wq.sq.qid);
  2411. attrs.next_state = C4IW_QP_STATE_TERMINATE;
  2412. c4iw_modify_qp(ep->com.qp->rhp, ep->com.qp,
  2413. C4IW_QP_ATTR_NEXT_STATE, &attrs, 1);
  2414. } else
  2415. printk(KERN_WARNING MOD "TERM received tid %u no ep/qp\n", tid);
  2416. return 0;
  2417. }
  2418. /*
  2419. * Upcall from the adapter indicating data has been transmitted.
  2420. * For us its just the single MPA request or reply. We can now free
  2421. * the skb holding the mpa message.
  2422. */
  2423. static int fw4_ack(struct c4iw_dev *dev, struct sk_buff *skb)
  2424. {
  2425. struct c4iw_ep *ep;
  2426. struct cpl_fw4_ack *hdr = cplhdr(skb);
  2427. u8 credits = hdr->credits;
  2428. unsigned int tid = GET_TID(hdr);
  2429. struct tid_info *t = dev->rdev.lldi.tids;
  2430. ep = lookup_tid(t, tid);
  2431. PDBG("%s ep %p tid %u credits %u\n", __func__, ep, ep->hwtid, credits);
  2432. if (credits == 0) {
  2433. PDBG("%s 0 credit ack ep %p tid %u state %u\n",
  2434. __func__, ep, ep->hwtid, state_read(&ep->com));
  2435. return 0;
  2436. }
  2437. dst_confirm(ep->dst);
  2438. if (ep->mpa_skb) {
  2439. PDBG("%s last streaming msg ack ep %p tid %u state %u "
  2440. "initiator %u freeing skb\n", __func__, ep, ep->hwtid,
  2441. state_read(&ep->com), ep->mpa_attr.initiator ? 1 : 0);
  2442. kfree_skb(ep->mpa_skb);
  2443. ep->mpa_skb = NULL;
  2444. }
  2445. return 0;
  2446. }
  2447. int c4iw_reject_cr(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
  2448. {
  2449. int err = 0;
  2450. int disconnect = 0;
  2451. struct c4iw_ep *ep = to_ep(cm_id);
  2452. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  2453. mutex_lock(&ep->com.mutex);
  2454. if (ep->com.state == DEAD) {
  2455. mutex_unlock(&ep->com.mutex);
  2456. c4iw_put_ep(&ep->com);
  2457. return -ECONNRESET;
  2458. }
  2459. set_bit(ULP_REJECT, &ep->com.history);
  2460. BUG_ON(ep->com.state != MPA_REQ_RCVD);
  2461. if (mpa_rev == 0)
  2462. abort_connection(ep, NULL, GFP_KERNEL);
  2463. else {
  2464. err = send_mpa_reject(ep, pdata, pdata_len);
  2465. disconnect = 1;
  2466. }
  2467. mutex_unlock(&ep->com.mutex);
  2468. if (disconnect)
  2469. err = c4iw_ep_disconnect(ep, 0, GFP_KERNEL);
  2470. c4iw_put_ep(&ep->com);
  2471. return 0;
  2472. }
  2473. int c4iw_accept_cr(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
  2474. {
  2475. int err;
  2476. struct c4iw_qp_attributes attrs;
  2477. enum c4iw_qp_attr_mask mask;
  2478. struct c4iw_ep *ep = to_ep(cm_id);
  2479. struct c4iw_dev *h = to_c4iw_dev(cm_id->device);
  2480. struct c4iw_qp *qp = get_qhp(h, conn_param->qpn);
  2481. PDBG("%s ep %p tid %u\n", __func__, ep, ep->hwtid);
  2482. mutex_lock(&ep->com.mutex);
  2483. if (ep->com.state == DEAD) {
  2484. err = -ECONNRESET;
  2485. goto err;
  2486. }
  2487. BUG_ON(ep->com.state != MPA_REQ_RCVD);
  2488. BUG_ON(!qp);
  2489. set_bit(ULP_ACCEPT, &ep->com.history);
  2490. if ((conn_param->ord > cur_max_read_depth(ep->com.dev)) ||
  2491. (conn_param->ird > cur_max_read_depth(ep->com.dev))) {
  2492. abort_connection(ep, NULL, GFP_KERNEL);
  2493. err = -EINVAL;
  2494. goto err;
  2495. }
  2496. if (ep->mpa_attr.version == 2 && ep->mpa_attr.enhanced_rdma_conn) {
  2497. if (conn_param->ord > ep->ird) {
  2498. if (RELAXED_IRD_NEGOTIATION) {
  2499. ep->ord = ep->ird;
  2500. } else {
  2501. ep->ird = conn_param->ird;
  2502. ep->ord = conn_param->ord;
  2503. send_mpa_reject(ep, conn_param->private_data,
  2504. conn_param->private_data_len);
  2505. abort_connection(ep, NULL, GFP_KERNEL);
  2506. err = -ENOMEM;
  2507. goto err;
  2508. }
  2509. }
  2510. if (conn_param->ird < ep->ord) {
  2511. if (RELAXED_IRD_NEGOTIATION &&
  2512. ep->ord <= h->rdev.lldi.max_ordird_qp) {
  2513. conn_param->ird = ep->ord;
  2514. } else {
  2515. abort_connection(ep, NULL, GFP_KERNEL);
  2516. err = -ENOMEM;
  2517. goto err;
  2518. }
  2519. }
  2520. }
  2521. ep->ird = conn_param->ird;
  2522. ep->ord = conn_param->ord;
  2523. if (ep->mpa_attr.version == 1) {
  2524. if (peer2peer && ep->ird == 0)
  2525. ep->ird = 1;
  2526. } else {
  2527. if (peer2peer &&
  2528. (ep->mpa_attr.p2p_type != FW_RI_INIT_P2PTYPE_DISABLED) &&
  2529. (p2p_type == FW_RI_INIT_P2PTYPE_READ_REQ) && ep->ord == 0)
  2530. ep->ird = 1;
  2531. }
  2532. PDBG("%s %d ird %d ord %d\n", __func__, __LINE__, ep->ird, ep->ord);
  2533. cm_id->add_ref(cm_id);
  2534. ep->com.cm_id = cm_id;
  2535. ep->com.qp = qp;
  2536. ref_qp(ep);
  2537. /* bind QP to EP and move to RTS */
  2538. attrs.mpa_attr = ep->mpa_attr;
  2539. attrs.max_ird = ep->ird;
  2540. attrs.max_ord = ep->ord;
  2541. attrs.llp_stream_handle = ep;
  2542. attrs.next_state = C4IW_QP_STATE_RTS;
  2543. /* bind QP and TID with INIT_WR */
  2544. mask = C4IW_QP_ATTR_NEXT_STATE |
  2545. C4IW_QP_ATTR_LLP_STREAM_HANDLE |
  2546. C4IW_QP_ATTR_MPA_ATTR |
  2547. C4IW_QP_ATTR_MAX_IRD |
  2548. C4IW_QP_ATTR_MAX_ORD;
  2549. err = c4iw_modify_qp(ep->com.qp->rhp,
  2550. ep->com.qp, mask, &attrs, 1);
  2551. if (err)
  2552. goto err1;
  2553. err = send_mpa_reply(ep, conn_param->private_data,
  2554. conn_param->private_data_len);
  2555. if (err)
  2556. goto err1;
  2557. __state_set(&ep->com, FPDU_MODE);
  2558. established_upcall(ep);
  2559. mutex_unlock(&ep->com.mutex);
  2560. c4iw_put_ep(&ep->com);
  2561. return 0;
  2562. err1:
  2563. ep->com.cm_id = NULL;
  2564. abort_connection(ep, NULL, GFP_KERNEL);
  2565. cm_id->rem_ref(cm_id);
  2566. err:
  2567. mutex_unlock(&ep->com.mutex);
  2568. c4iw_put_ep(&ep->com);
  2569. return err;
  2570. }
  2571. static int pick_local_ipaddrs(struct c4iw_dev *dev, struct iw_cm_id *cm_id)
  2572. {
  2573. struct in_device *ind;
  2574. int found = 0;
  2575. struct sockaddr_in *laddr = (struct sockaddr_in *)&cm_id->local_addr;
  2576. struct sockaddr_in *raddr = (struct sockaddr_in *)&cm_id->remote_addr;
  2577. ind = in_dev_get(dev->rdev.lldi.ports[0]);
  2578. if (!ind)
  2579. return -EADDRNOTAVAIL;
  2580. for_primary_ifa(ind) {
  2581. laddr->sin_addr.s_addr = ifa->ifa_address;
  2582. raddr->sin_addr.s_addr = ifa->ifa_address;
  2583. found = 1;
  2584. break;
  2585. }
  2586. endfor_ifa(ind);
  2587. in_dev_put(ind);
  2588. return found ? 0 : -EADDRNOTAVAIL;
  2589. }
  2590. static int get_lladdr(struct net_device *dev, struct in6_addr *addr,
  2591. unsigned char banned_flags)
  2592. {
  2593. struct inet6_dev *idev;
  2594. int err = -EADDRNOTAVAIL;
  2595. rcu_read_lock();
  2596. idev = __in6_dev_get(dev);
  2597. if (idev != NULL) {
  2598. struct inet6_ifaddr *ifp;
  2599. read_lock_bh(&idev->lock);
  2600. list_for_each_entry(ifp, &idev->addr_list, if_list) {
  2601. if (ifp->scope == IFA_LINK &&
  2602. !(ifp->flags & banned_flags)) {
  2603. memcpy(addr, &ifp->addr, 16);
  2604. err = 0;
  2605. break;
  2606. }
  2607. }
  2608. read_unlock_bh(&idev->lock);
  2609. }
  2610. rcu_read_unlock();
  2611. return err;
  2612. }
  2613. static int pick_local_ip6addrs(struct c4iw_dev *dev, struct iw_cm_id *cm_id)
  2614. {
  2615. struct in6_addr uninitialized_var(addr);
  2616. struct sockaddr_in6 *la6 = (struct sockaddr_in6 *)&cm_id->local_addr;
  2617. struct sockaddr_in6 *ra6 = (struct sockaddr_in6 *)&cm_id->remote_addr;
  2618. if (get_lladdr(dev->rdev.lldi.ports[0], &addr, IFA_F_TENTATIVE)) {
  2619. memcpy(la6->sin6_addr.s6_addr, &addr, 16);
  2620. memcpy(ra6->sin6_addr.s6_addr, &addr, 16);
  2621. return 0;
  2622. }
  2623. return -EADDRNOTAVAIL;
  2624. }
  2625. int c4iw_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
  2626. {
  2627. struct c4iw_dev *dev = to_c4iw_dev(cm_id->device);
  2628. struct c4iw_ep *ep;
  2629. int err = 0;
  2630. struct sockaddr_in *laddr;
  2631. struct sockaddr_in *raddr;
  2632. struct sockaddr_in6 *laddr6;
  2633. struct sockaddr_in6 *raddr6;
  2634. struct iwpm_dev_data pm_reg_msg;
  2635. struct iwpm_sa_data pm_msg;
  2636. __u8 *ra;
  2637. int iptype;
  2638. int iwpm_err = 0;
  2639. if ((conn_param->ord > cur_max_read_depth(dev)) ||
  2640. (conn_param->ird > cur_max_read_depth(dev))) {
  2641. err = -EINVAL;
  2642. goto out;
  2643. }
  2644. ep = alloc_ep(sizeof(*ep), GFP_KERNEL);
  2645. if (!ep) {
  2646. printk(KERN_ERR MOD "%s - cannot alloc ep.\n", __func__);
  2647. err = -ENOMEM;
  2648. goto out;
  2649. }
  2650. init_timer(&ep->timer);
  2651. ep->plen = conn_param->private_data_len;
  2652. if (ep->plen)
  2653. memcpy(ep->mpa_pkt + sizeof(struct mpa_message),
  2654. conn_param->private_data, ep->plen);
  2655. ep->ird = conn_param->ird;
  2656. ep->ord = conn_param->ord;
  2657. if (peer2peer && ep->ord == 0)
  2658. ep->ord = 1;
  2659. cm_id->add_ref(cm_id);
  2660. ep->com.dev = dev;
  2661. ep->com.cm_id = cm_id;
  2662. ep->com.qp = get_qhp(dev, conn_param->qpn);
  2663. if (!ep->com.qp) {
  2664. PDBG("%s qpn 0x%x not found!\n", __func__, conn_param->qpn);
  2665. err = -EINVAL;
  2666. goto fail1;
  2667. }
  2668. ref_qp(ep);
  2669. PDBG("%s qpn 0x%x qp %p cm_id %p\n", __func__, conn_param->qpn,
  2670. ep->com.qp, cm_id);
  2671. /*
  2672. * Allocate an active TID to initiate a TCP connection.
  2673. */
  2674. ep->atid = cxgb4_alloc_atid(dev->rdev.lldi.tids, ep);
  2675. if (ep->atid == -1) {
  2676. printk(KERN_ERR MOD "%s - cannot alloc atid.\n", __func__);
  2677. err = -ENOMEM;
  2678. goto fail1;
  2679. }
  2680. insert_handle(dev, &dev->atid_idr, ep, ep->atid);
  2681. memcpy(&ep->com.local_addr, &cm_id->local_addr,
  2682. sizeof(ep->com.local_addr));
  2683. memcpy(&ep->com.remote_addr, &cm_id->remote_addr,
  2684. sizeof(ep->com.remote_addr));
  2685. /* No port mapper available, go with the specified peer information */
  2686. memcpy(&ep->com.mapped_local_addr, &cm_id->local_addr,
  2687. sizeof(ep->com.mapped_local_addr));
  2688. memcpy(&ep->com.mapped_remote_addr, &cm_id->remote_addr,
  2689. sizeof(ep->com.mapped_remote_addr));
  2690. c4iw_form_reg_msg(dev, &pm_reg_msg);
  2691. iwpm_err = iwpm_register_pid(&pm_reg_msg, RDMA_NL_C4IW);
  2692. if (iwpm_err) {
  2693. PDBG("%s: Port Mapper reg pid fail (err = %d).\n",
  2694. __func__, iwpm_err);
  2695. }
  2696. if (iwpm_valid_pid() && !iwpm_err) {
  2697. c4iw_form_pm_msg(ep, &pm_msg);
  2698. iwpm_err = iwpm_add_and_query_mapping(&pm_msg, RDMA_NL_C4IW);
  2699. if (iwpm_err)
  2700. PDBG("%s: Port Mapper query fail (err = %d).\n",
  2701. __func__, iwpm_err);
  2702. else
  2703. c4iw_record_pm_msg(ep, &pm_msg);
  2704. }
  2705. if (iwpm_create_mapinfo(&ep->com.local_addr,
  2706. &ep->com.mapped_local_addr, RDMA_NL_C4IW)) {
  2707. iwpm_remove_mapping(&ep->com.local_addr, RDMA_NL_C4IW);
  2708. err = -ENOMEM;
  2709. goto fail1;
  2710. }
  2711. print_addr(&ep->com, __func__, "add_query/create_mapinfo");
  2712. set_bit(RELEASE_MAPINFO, &ep->com.flags);
  2713. laddr = (struct sockaddr_in *)&ep->com.mapped_local_addr;
  2714. raddr = (struct sockaddr_in *)&ep->com.mapped_remote_addr;
  2715. laddr6 = (struct sockaddr_in6 *)&ep->com.mapped_local_addr;
  2716. raddr6 = (struct sockaddr_in6 *) &ep->com.mapped_remote_addr;
  2717. if (cm_id->remote_addr.ss_family == AF_INET) {
  2718. iptype = 4;
  2719. ra = (__u8 *)&raddr->sin_addr;
  2720. /*
  2721. * Handle loopback requests to INADDR_ANY.
  2722. */
  2723. if ((__force int)raddr->sin_addr.s_addr == INADDR_ANY) {
  2724. err = pick_local_ipaddrs(dev, cm_id);
  2725. if (err)
  2726. goto fail1;
  2727. }
  2728. /* find a route */
  2729. PDBG("%s saddr %pI4 sport 0x%x raddr %pI4 rport 0x%x\n",
  2730. __func__, &laddr->sin_addr, ntohs(laddr->sin_port),
  2731. ra, ntohs(raddr->sin_port));
  2732. ep->dst = find_route(dev, laddr->sin_addr.s_addr,
  2733. raddr->sin_addr.s_addr, laddr->sin_port,
  2734. raddr->sin_port, 0);
  2735. } else {
  2736. iptype = 6;
  2737. ra = (__u8 *)&raddr6->sin6_addr;
  2738. /*
  2739. * Handle loopback requests to INADDR_ANY.
  2740. */
  2741. if (ipv6_addr_type(&raddr6->sin6_addr) == IPV6_ADDR_ANY) {
  2742. err = pick_local_ip6addrs(dev, cm_id);
  2743. if (err)
  2744. goto fail1;
  2745. }
  2746. /* find a route */
  2747. PDBG("%s saddr %pI6 sport 0x%x raddr %pI6 rport 0x%x\n",
  2748. __func__, laddr6->sin6_addr.s6_addr,
  2749. ntohs(laddr6->sin6_port),
  2750. raddr6->sin6_addr.s6_addr, ntohs(raddr6->sin6_port));
  2751. ep->dst = find_route6(dev, laddr6->sin6_addr.s6_addr,
  2752. raddr6->sin6_addr.s6_addr,
  2753. laddr6->sin6_port, raddr6->sin6_port, 0,
  2754. raddr6->sin6_scope_id);
  2755. }
  2756. if (!ep->dst) {
  2757. printk(KERN_ERR MOD "%s - cannot find route.\n", __func__);
  2758. err = -EHOSTUNREACH;
  2759. goto fail2;
  2760. }
  2761. err = import_ep(ep, iptype, ra, ep->dst, ep->com.dev, true);
  2762. if (err) {
  2763. printk(KERN_ERR MOD "%s - cannot alloc l2e.\n", __func__);
  2764. goto fail3;
  2765. }
  2766. PDBG("%s txq_idx %u tx_chan %u smac_idx %u rss_qid %u l2t_idx %u\n",
  2767. __func__, ep->txq_idx, ep->tx_chan, ep->smac_idx, ep->rss_qid,
  2768. ep->l2t->idx);
  2769. state_set(&ep->com, CONNECTING);
  2770. ep->tos = 0;
  2771. /* send connect request to rnic */
  2772. err = send_connect(ep);
  2773. if (!err)
  2774. goto out;
  2775. cxgb4_l2t_release(ep->l2t);
  2776. fail3:
  2777. dst_release(ep->dst);
  2778. fail2:
  2779. remove_handle(ep->com.dev, &ep->com.dev->atid_idr, ep->atid);
  2780. cxgb4_free_atid(ep->com.dev->rdev.lldi.tids, ep->atid);
  2781. fail1:
  2782. cm_id->rem_ref(cm_id);
  2783. c4iw_put_ep(&ep->com);
  2784. out:
  2785. return err;
  2786. }
  2787. static int create_server6(struct c4iw_dev *dev, struct c4iw_listen_ep *ep)
  2788. {
  2789. int err;
  2790. struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)
  2791. &ep->com.mapped_local_addr;
  2792. c4iw_init_wr_wait(&ep->com.wr_wait);
  2793. err = cxgb4_create_server6(ep->com.dev->rdev.lldi.ports[0],
  2794. ep->stid, &sin6->sin6_addr,
  2795. sin6->sin6_port,
  2796. ep->com.dev->rdev.lldi.rxq_ids[0]);
  2797. if (!err)
  2798. err = c4iw_wait_for_reply(&ep->com.dev->rdev,
  2799. &ep->com.wr_wait,
  2800. 0, 0, __func__);
  2801. else if (err > 0)
  2802. err = net_xmit_errno(err);
  2803. if (err)
  2804. pr_err("cxgb4_create_server6/filter failed err %d stid %d laddr %pI6 lport %d\n",
  2805. err, ep->stid,
  2806. sin6->sin6_addr.s6_addr, ntohs(sin6->sin6_port));
  2807. return err;
  2808. }
  2809. static int create_server4(struct c4iw_dev *dev, struct c4iw_listen_ep *ep)
  2810. {
  2811. int err;
  2812. struct sockaddr_in *sin = (struct sockaddr_in *)
  2813. &ep->com.mapped_local_addr;
  2814. if (dev->rdev.lldi.enable_fw_ofld_conn) {
  2815. do {
  2816. err = cxgb4_create_server_filter(
  2817. ep->com.dev->rdev.lldi.ports[0], ep->stid,
  2818. sin->sin_addr.s_addr, sin->sin_port, 0,
  2819. ep->com.dev->rdev.lldi.rxq_ids[0], 0, 0);
  2820. if (err == -EBUSY) {
  2821. set_current_state(TASK_UNINTERRUPTIBLE);
  2822. schedule_timeout(usecs_to_jiffies(100));
  2823. }
  2824. } while (err == -EBUSY);
  2825. } else {
  2826. c4iw_init_wr_wait(&ep->com.wr_wait);
  2827. err = cxgb4_create_server(ep->com.dev->rdev.lldi.ports[0],
  2828. ep->stid, sin->sin_addr.s_addr, sin->sin_port,
  2829. 0, ep->com.dev->rdev.lldi.rxq_ids[0]);
  2830. if (!err)
  2831. err = c4iw_wait_for_reply(&ep->com.dev->rdev,
  2832. &ep->com.wr_wait,
  2833. 0, 0, __func__);
  2834. else if (err > 0)
  2835. err = net_xmit_errno(err);
  2836. }
  2837. if (err)
  2838. pr_err("cxgb4_create_server/filter failed err %d stid %d laddr %pI4 lport %d\n"
  2839. , err, ep->stid,
  2840. &sin->sin_addr, ntohs(sin->sin_port));
  2841. return err;
  2842. }
  2843. int c4iw_create_listen(struct iw_cm_id *cm_id, int backlog)
  2844. {
  2845. int err = 0;
  2846. struct c4iw_dev *dev = to_c4iw_dev(cm_id->device);
  2847. struct c4iw_listen_ep *ep;
  2848. struct iwpm_dev_data pm_reg_msg;
  2849. struct iwpm_sa_data pm_msg;
  2850. int iwpm_err = 0;
  2851. might_sleep();
  2852. ep = alloc_ep(sizeof(*ep), GFP_KERNEL);
  2853. if (!ep) {
  2854. printk(KERN_ERR MOD "%s - cannot alloc ep.\n", __func__);
  2855. err = -ENOMEM;
  2856. goto fail1;
  2857. }
  2858. PDBG("%s ep %p\n", __func__, ep);
  2859. cm_id->add_ref(cm_id);
  2860. ep->com.cm_id = cm_id;
  2861. ep->com.dev = dev;
  2862. ep->backlog = backlog;
  2863. memcpy(&ep->com.local_addr, &cm_id->local_addr,
  2864. sizeof(ep->com.local_addr));
  2865. /*
  2866. * Allocate a server TID.
  2867. */
  2868. if (dev->rdev.lldi.enable_fw_ofld_conn &&
  2869. ep->com.local_addr.ss_family == AF_INET)
  2870. ep->stid = cxgb4_alloc_sftid(dev->rdev.lldi.tids,
  2871. cm_id->local_addr.ss_family, ep);
  2872. else
  2873. ep->stid = cxgb4_alloc_stid(dev->rdev.lldi.tids,
  2874. cm_id->local_addr.ss_family, ep);
  2875. if (ep->stid == -1) {
  2876. printk(KERN_ERR MOD "%s - cannot alloc stid.\n", __func__);
  2877. err = -ENOMEM;
  2878. goto fail2;
  2879. }
  2880. insert_handle(dev, &dev->stid_idr, ep, ep->stid);
  2881. /* No port mapper available, go with the specified info */
  2882. memcpy(&ep->com.mapped_local_addr, &cm_id->local_addr,
  2883. sizeof(ep->com.mapped_local_addr));
  2884. c4iw_form_reg_msg(dev, &pm_reg_msg);
  2885. iwpm_err = iwpm_register_pid(&pm_reg_msg, RDMA_NL_C4IW);
  2886. if (iwpm_err) {
  2887. PDBG("%s: Port Mapper reg pid fail (err = %d).\n",
  2888. __func__, iwpm_err);
  2889. }
  2890. if (iwpm_valid_pid() && !iwpm_err) {
  2891. memcpy(&pm_msg.loc_addr, &ep->com.local_addr,
  2892. sizeof(ep->com.local_addr));
  2893. iwpm_err = iwpm_add_mapping(&pm_msg, RDMA_NL_C4IW);
  2894. if (iwpm_err)
  2895. PDBG("%s: Port Mapper query fail (err = %d).\n",
  2896. __func__, iwpm_err);
  2897. else
  2898. memcpy(&ep->com.mapped_local_addr,
  2899. &pm_msg.mapped_loc_addr,
  2900. sizeof(ep->com.mapped_local_addr));
  2901. }
  2902. if (iwpm_create_mapinfo(&ep->com.local_addr,
  2903. &ep->com.mapped_local_addr, RDMA_NL_C4IW)) {
  2904. err = -ENOMEM;
  2905. goto fail3;
  2906. }
  2907. print_addr(&ep->com, __func__, "add_mapping/create_mapinfo");
  2908. set_bit(RELEASE_MAPINFO, &ep->com.flags);
  2909. state_set(&ep->com, LISTEN);
  2910. if (ep->com.local_addr.ss_family == AF_INET)
  2911. err = create_server4(dev, ep);
  2912. else
  2913. err = create_server6(dev, ep);
  2914. if (!err) {
  2915. cm_id->provider_data = ep;
  2916. goto out;
  2917. }
  2918. fail3:
  2919. cxgb4_free_stid(ep->com.dev->rdev.lldi.tids, ep->stid,
  2920. ep->com.local_addr.ss_family);
  2921. fail2:
  2922. cm_id->rem_ref(cm_id);
  2923. c4iw_put_ep(&ep->com);
  2924. fail1:
  2925. out:
  2926. return err;
  2927. }
  2928. int c4iw_destroy_listen(struct iw_cm_id *cm_id)
  2929. {
  2930. int err;
  2931. struct c4iw_listen_ep *ep = to_listen_ep(cm_id);
  2932. PDBG("%s ep %p\n", __func__, ep);
  2933. might_sleep();
  2934. state_set(&ep->com, DEAD);
  2935. if (ep->com.dev->rdev.lldi.enable_fw_ofld_conn &&
  2936. ep->com.local_addr.ss_family == AF_INET) {
  2937. err = cxgb4_remove_server_filter(
  2938. ep->com.dev->rdev.lldi.ports[0], ep->stid,
  2939. ep->com.dev->rdev.lldi.rxq_ids[0], 0);
  2940. } else {
  2941. c4iw_init_wr_wait(&ep->com.wr_wait);
  2942. err = cxgb4_remove_server(
  2943. ep->com.dev->rdev.lldi.ports[0], ep->stid,
  2944. ep->com.dev->rdev.lldi.rxq_ids[0], 0);
  2945. if (err)
  2946. goto done;
  2947. err = c4iw_wait_for_reply(&ep->com.dev->rdev, &ep->com.wr_wait,
  2948. 0, 0, __func__);
  2949. }
  2950. remove_handle(ep->com.dev, &ep->com.dev->stid_idr, ep->stid);
  2951. cxgb4_free_stid(ep->com.dev->rdev.lldi.tids, ep->stid,
  2952. ep->com.local_addr.ss_family);
  2953. done:
  2954. cm_id->rem_ref(cm_id);
  2955. c4iw_put_ep(&ep->com);
  2956. return err;
  2957. }
  2958. int c4iw_ep_disconnect(struct c4iw_ep *ep, int abrupt, gfp_t gfp)
  2959. {
  2960. int ret = 0;
  2961. int close = 0;
  2962. int fatal = 0;
  2963. struct c4iw_rdev *rdev;
  2964. mutex_lock(&ep->com.mutex);
  2965. PDBG("%s ep %p state %s, abrupt %d\n", __func__, ep,
  2966. states[ep->com.state], abrupt);
  2967. rdev = &ep->com.dev->rdev;
  2968. if (c4iw_fatal_error(rdev)) {
  2969. fatal = 1;
  2970. close_complete_upcall(ep, -EIO);
  2971. ep->com.state = DEAD;
  2972. }
  2973. switch (ep->com.state) {
  2974. case MPA_REQ_WAIT:
  2975. case MPA_REQ_SENT:
  2976. case MPA_REQ_RCVD:
  2977. case MPA_REP_SENT:
  2978. case FPDU_MODE:
  2979. close = 1;
  2980. if (abrupt)
  2981. ep->com.state = ABORTING;
  2982. else {
  2983. ep->com.state = CLOSING;
  2984. start_ep_timer(ep);
  2985. }
  2986. set_bit(CLOSE_SENT, &ep->com.flags);
  2987. break;
  2988. case CLOSING:
  2989. if (!test_and_set_bit(CLOSE_SENT, &ep->com.flags)) {
  2990. close = 1;
  2991. if (abrupt) {
  2992. (void)stop_ep_timer(ep);
  2993. ep->com.state = ABORTING;
  2994. } else
  2995. ep->com.state = MORIBUND;
  2996. }
  2997. break;
  2998. case MORIBUND:
  2999. case ABORTING:
  3000. case DEAD:
  3001. PDBG("%s ignoring disconnect ep %p state %u\n",
  3002. __func__, ep, ep->com.state);
  3003. break;
  3004. default:
  3005. BUG();
  3006. break;
  3007. }
  3008. if (close) {
  3009. if (abrupt) {
  3010. set_bit(EP_DISC_ABORT, &ep->com.history);
  3011. close_complete_upcall(ep, -ECONNRESET);
  3012. ret = send_abort(ep, NULL, gfp);
  3013. } else {
  3014. set_bit(EP_DISC_CLOSE, &ep->com.history);
  3015. ret = send_halfclose(ep, gfp);
  3016. }
  3017. if (ret)
  3018. fatal = 1;
  3019. }
  3020. mutex_unlock(&ep->com.mutex);
  3021. if (fatal)
  3022. release_ep_resources(ep);
  3023. return ret;
  3024. }
  3025. static void active_ofld_conn_reply(struct c4iw_dev *dev, struct sk_buff *skb,
  3026. struct cpl_fw6_msg_ofld_connection_wr_rpl *req)
  3027. {
  3028. struct c4iw_ep *ep;
  3029. int atid = be32_to_cpu(req->tid);
  3030. ep = (struct c4iw_ep *)lookup_atid(dev->rdev.lldi.tids,
  3031. (__force u32) req->tid);
  3032. if (!ep)
  3033. return;
  3034. switch (req->retval) {
  3035. case FW_ENOMEM:
  3036. set_bit(ACT_RETRY_NOMEM, &ep->com.history);
  3037. if (ep->retry_count++ < ACT_OPEN_RETRY_COUNT) {
  3038. send_fw_act_open_req(ep, atid);
  3039. return;
  3040. }
  3041. case FW_EADDRINUSE:
  3042. set_bit(ACT_RETRY_INUSE, &ep->com.history);
  3043. if (ep->retry_count++ < ACT_OPEN_RETRY_COUNT) {
  3044. send_fw_act_open_req(ep, atid);
  3045. return;
  3046. }
  3047. break;
  3048. default:
  3049. pr_info("%s unexpected ofld conn wr retval %d\n",
  3050. __func__, req->retval);
  3051. break;
  3052. }
  3053. pr_err("active ofld_connect_wr failure %d atid %d\n",
  3054. req->retval, atid);
  3055. mutex_lock(&dev->rdev.stats.lock);
  3056. dev->rdev.stats.act_ofld_conn_fails++;
  3057. mutex_unlock(&dev->rdev.stats.lock);
  3058. connect_reply_upcall(ep, status2errno(req->retval));
  3059. state_set(&ep->com, DEAD);
  3060. remove_handle(dev, &dev->atid_idr, atid);
  3061. cxgb4_free_atid(dev->rdev.lldi.tids, atid);
  3062. dst_release(ep->dst);
  3063. cxgb4_l2t_release(ep->l2t);
  3064. c4iw_put_ep(&ep->com);
  3065. }
  3066. static void passive_ofld_conn_reply(struct c4iw_dev *dev, struct sk_buff *skb,
  3067. struct cpl_fw6_msg_ofld_connection_wr_rpl *req)
  3068. {
  3069. struct sk_buff *rpl_skb;
  3070. struct cpl_pass_accept_req *cpl;
  3071. int ret;
  3072. rpl_skb = (struct sk_buff *)(unsigned long)req->cookie;
  3073. BUG_ON(!rpl_skb);
  3074. if (req->retval) {
  3075. PDBG("%s passive open failure %d\n", __func__, req->retval);
  3076. mutex_lock(&dev->rdev.stats.lock);
  3077. dev->rdev.stats.pas_ofld_conn_fails++;
  3078. mutex_unlock(&dev->rdev.stats.lock);
  3079. kfree_skb(rpl_skb);
  3080. } else {
  3081. cpl = (struct cpl_pass_accept_req *)cplhdr(rpl_skb);
  3082. OPCODE_TID(cpl) = htonl(MK_OPCODE_TID(CPL_PASS_ACCEPT_REQ,
  3083. (__force u32) htonl(
  3084. (__force u32) req->tid)));
  3085. ret = pass_accept_req(dev, rpl_skb);
  3086. if (!ret)
  3087. kfree_skb(rpl_skb);
  3088. }
  3089. return;
  3090. }
  3091. static int deferred_fw6_msg(struct c4iw_dev *dev, struct sk_buff *skb)
  3092. {
  3093. struct cpl_fw6_msg *rpl = cplhdr(skb);
  3094. struct cpl_fw6_msg_ofld_connection_wr_rpl *req;
  3095. switch (rpl->type) {
  3096. case FW6_TYPE_CQE:
  3097. c4iw_ev_dispatch(dev, (struct t4_cqe *)&rpl->data[0]);
  3098. break;
  3099. case FW6_TYPE_OFLD_CONNECTION_WR_RPL:
  3100. req = (struct cpl_fw6_msg_ofld_connection_wr_rpl *)rpl->data;
  3101. switch (req->t_state) {
  3102. case TCP_SYN_SENT:
  3103. active_ofld_conn_reply(dev, skb, req);
  3104. break;
  3105. case TCP_SYN_RECV:
  3106. passive_ofld_conn_reply(dev, skb, req);
  3107. break;
  3108. default:
  3109. pr_err("%s unexpected ofld conn wr state %d\n",
  3110. __func__, req->t_state);
  3111. break;
  3112. }
  3113. break;
  3114. }
  3115. return 0;
  3116. }
  3117. static void build_cpl_pass_accept_req(struct sk_buff *skb, int stid , u8 tos)
  3118. {
  3119. u32 l2info;
  3120. u16 vlantag, len, hdr_len, eth_hdr_len;
  3121. u8 intf;
  3122. struct cpl_rx_pkt *cpl = cplhdr(skb);
  3123. struct cpl_pass_accept_req *req;
  3124. struct tcp_options_received tmp_opt;
  3125. struct c4iw_dev *dev;
  3126. dev = *((struct c4iw_dev **) (skb->cb + sizeof(void *)));
  3127. /* Store values from cpl_rx_pkt in temporary location. */
  3128. vlantag = (__force u16) cpl->vlan;
  3129. len = (__force u16) cpl->len;
  3130. l2info = (__force u32) cpl->l2info;
  3131. hdr_len = (__force u16) cpl->hdr_len;
  3132. intf = cpl->iff;
  3133. __skb_pull(skb, sizeof(*req) + sizeof(struct rss_header));
  3134. /*
  3135. * We need to parse the TCP options from SYN packet.
  3136. * to generate cpl_pass_accept_req.
  3137. */
  3138. memset(&tmp_opt, 0, sizeof(tmp_opt));
  3139. tcp_clear_options(&tmp_opt);
  3140. tcp_parse_options(skb, &tmp_opt, 0, NULL);
  3141. req = (struct cpl_pass_accept_req *)__skb_push(skb, sizeof(*req));
  3142. memset(req, 0, sizeof(*req));
  3143. req->l2info = cpu_to_be16(V_SYN_INTF(intf) |
  3144. V_SYN_MAC_IDX(G_RX_MACIDX(
  3145. (__force int) htonl(l2info))) |
  3146. F_SYN_XACT_MATCH);
  3147. eth_hdr_len = is_t4(dev->rdev.lldi.adapter_type) ?
  3148. G_RX_ETHHDR_LEN((__force int) htonl(l2info)) :
  3149. G_RX_T5_ETHHDR_LEN((__force int) htonl(l2info));
  3150. req->hdr_len = cpu_to_be32(V_SYN_RX_CHAN(G_RX_CHAN(
  3151. (__force int) htonl(l2info))) |
  3152. V_TCP_HDR_LEN(G_RX_TCPHDR_LEN(
  3153. (__force int) htons(hdr_len))) |
  3154. V_IP_HDR_LEN(G_RX_IPHDR_LEN(
  3155. (__force int) htons(hdr_len))) |
  3156. V_ETH_HDR_LEN(G_RX_ETHHDR_LEN(eth_hdr_len)));
  3157. req->vlan = (__force __be16) vlantag;
  3158. req->len = (__force __be16) len;
  3159. req->tos_stid = cpu_to_be32(PASS_OPEN_TID(stid) |
  3160. PASS_OPEN_TOS(tos));
  3161. req->tcpopt.mss = htons(tmp_opt.mss_clamp);
  3162. if (tmp_opt.wscale_ok)
  3163. req->tcpopt.wsf = tmp_opt.snd_wscale;
  3164. req->tcpopt.tstamp = tmp_opt.saw_tstamp;
  3165. if (tmp_opt.sack_ok)
  3166. req->tcpopt.sack = 1;
  3167. OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_PASS_ACCEPT_REQ, 0));
  3168. return;
  3169. }
  3170. static void send_fw_pass_open_req(struct c4iw_dev *dev, struct sk_buff *skb,
  3171. __be32 laddr, __be16 lport,
  3172. __be32 raddr, __be16 rport,
  3173. u32 rcv_isn, u32 filter, u16 window,
  3174. u32 rss_qid, u8 port_id)
  3175. {
  3176. struct sk_buff *req_skb;
  3177. struct fw_ofld_connection_wr *req;
  3178. struct cpl_pass_accept_req *cpl = cplhdr(skb);
  3179. int ret;
  3180. req_skb = alloc_skb(sizeof(struct fw_ofld_connection_wr), GFP_KERNEL);
  3181. req = (struct fw_ofld_connection_wr *)__skb_put(req_skb, sizeof(*req));
  3182. memset(req, 0, sizeof(*req));
  3183. req->op_compl = htonl(V_WR_OP(FW_OFLD_CONNECTION_WR) | FW_WR_COMPL_F);
  3184. req->len16_pkd = htonl(FW_WR_LEN16_V(DIV_ROUND_UP(sizeof(*req), 16)));
  3185. req->le.version_cpl = htonl(FW_OFLD_CONNECTION_WR_CPL_F);
  3186. req->le.filter = (__force __be32) filter;
  3187. req->le.lport = lport;
  3188. req->le.pport = rport;
  3189. req->le.u.ipv4.lip = laddr;
  3190. req->le.u.ipv4.pip = raddr;
  3191. req->tcb.rcv_nxt = htonl(rcv_isn + 1);
  3192. req->tcb.rcv_adv = htons(window);
  3193. req->tcb.t_state_to_astid =
  3194. htonl(FW_OFLD_CONNECTION_WR_T_STATE_V(TCP_SYN_RECV) |
  3195. FW_OFLD_CONNECTION_WR_RCV_SCALE_V(cpl->tcpopt.wsf) |
  3196. FW_OFLD_CONNECTION_WR_ASTID_V(
  3197. GET_PASS_OPEN_TID(ntohl(cpl->tos_stid))));
  3198. /*
  3199. * We store the qid in opt2 which will be used by the firmware
  3200. * to send us the wr response.
  3201. */
  3202. req->tcb.opt2 = htonl(RSS_QUEUE_V(rss_qid));
  3203. /*
  3204. * We initialize the MSS index in TCB to 0xF.
  3205. * So that when driver sends cpl_pass_accept_rpl
  3206. * TCB picks up the correct value. If this was 0
  3207. * TP will ignore any value > 0 for MSS index.
  3208. */
  3209. req->tcb.opt0 = cpu_to_be64(MSS_IDX_V(0xF));
  3210. req->cookie = (unsigned long)skb;
  3211. set_wr_txq(req_skb, CPL_PRIORITY_CONTROL, port_id);
  3212. ret = cxgb4_ofld_send(dev->rdev.lldi.ports[0], req_skb);
  3213. if (ret < 0) {
  3214. pr_err("%s - cxgb4_ofld_send error %d - dropping\n", __func__,
  3215. ret);
  3216. kfree_skb(skb);
  3217. kfree_skb(req_skb);
  3218. }
  3219. }
  3220. /*
  3221. * Handler for CPL_RX_PKT message. Need to handle cpl_rx_pkt
  3222. * messages when a filter is being used instead of server to
  3223. * redirect a syn packet. When packets hit filter they are redirected
  3224. * to the offload queue and driver tries to establish the connection
  3225. * using firmware work request.
  3226. */
  3227. static int rx_pkt(struct c4iw_dev *dev, struct sk_buff *skb)
  3228. {
  3229. int stid;
  3230. unsigned int filter;
  3231. struct ethhdr *eh = NULL;
  3232. struct vlan_ethhdr *vlan_eh = NULL;
  3233. struct iphdr *iph;
  3234. struct tcphdr *tcph;
  3235. struct rss_header *rss = (void *)skb->data;
  3236. struct cpl_rx_pkt *cpl = (void *)skb->data;
  3237. struct cpl_pass_accept_req *req = (void *)(rss + 1);
  3238. struct l2t_entry *e;
  3239. struct dst_entry *dst;
  3240. struct c4iw_ep *lep;
  3241. u16 window;
  3242. struct port_info *pi;
  3243. struct net_device *pdev;
  3244. u16 rss_qid, eth_hdr_len;
  3245. int step;
  3246. u32 tx_chan;
  3247. struct neighbour *neigh;
  3248. /* Drop all non-SYN packets */
  3249. if (!(cpl->l2info & cpu_to_be32(F_RXF_SYN)))
  3250. goto reject;
  3251. /*
  3252. * Drop all packets which did not hit the filter.
  3253. * Unlikely to happen.
  3254. */
  3255. if (!(rss->filter_hit && rss->filter_tid))
  3256. goto reject;
  3257. /*
  3258. * Calculate the server tid from filter hit index from cpl_rx_pkt.
  3259. */
  3260. stid = (__force int) cpu_to_be32((__force u32) rss->hash_val);
  3261. lep = (struct c4iw_ep *)lookup_stid(dev->rdev.lldi.tids, stid);
  3262. if (!lep) {
  3263. PDBG("%s connect request on invalid stid %d\n", __func__, stid);
  3264. goto reject;
  3265. }
  3266. eth_hdr_len = is_t4(dev->rdev.lldi.adapter_type) ?
  3267. G_RX_ETHHDR_LEN(htonl(cpl->l2info)) :
  3268. G_RX_T5_ETHHDR_LEN(htonl(cpl->l2info));
  3269. if (eth_hdr_len == ETH_HLEN) {
  3270. eh = (struct ethhdr *)(req + 1);
  3271. iph = (struct iphdr *)(eh + 1);
  3272. } else {
  3273. vlan_eh = (struct vlan_ethhdr *)(req + 1);
  3274. iph = (struct iphdr *)(vlan_eh + 1);
  3275. skb->vlan_tci = ntohs(cpl->vlan);
  3276. }
  3277. if (iph->version != 0x4)
  3278. goto reject;
  3279. tcph = (struct tcphdr *)(iph + 1);
  3280. skb_set_network_header(skb, (void *)iph - (void *)rss);
  3281. skb_set_transport_header(skb, (void *)tcph - (void *)rss);
  3282. skb_get(skb);
  3283. PDBG("%s lip 0x%x lport %u pip 0x%x pport %u tos %d\n", __func__,
  3284. ntohl(iph->daddr), ntohs(tcph->dest), ntohl(iph->saddr),
  3285. ntohs(tcph->source), iph->tos);
  3286. dst = find_route(dev, iph->daddr, iph->saddr, tcph->dest, tcph->source,
  3287. iph->tos);
  3288. if (!dst) {
  3289. pr_err("%s - failed to find dst entry!\n",
  3290. __func__);
  3291. goto reject;
  3292. }
  3293. neigh = dst_neigh_lookup_skb(dst, skb);
  3294. if (!neigh) {
  3295. pr_err("%s - failed to allocate neigh!\n",
  3296. __func__);
  3297. goto free_dst;
  3298. }
  3299. if (neigh->dev->flags & IFF_LOOPBACK) {
  3300. pdev = ip_dev_find(&init_net, iph->daddr);
  3301. e = cxgb4_l2t_get(dev->rdev.lldi.l2t, neigh,
  3302. pdev, 0);
  3303. pi = (struct port_info *)netdev_priv(pdev);
  3304. tx_chan = cxgb4_port_chan(pdev);
  3305. dev_put(pdev);
  3306. } else {
  3307. pdev = get_real_dev(neigh->dev);
  3308. e = cxgb4_l2t_get(dev->rdev.lldi.l2t, neigh,
  3309. pdev, 0);
  3310. pi = (struct port_info *)netdev_priv(pdev);
  3311. tx_chan = cxgb4_port_chan(pdev);
  3312. }
  3313. neigh_release(neigh);
  3314. if (!e) {
  3315. pr_err("%s - failed to allocate l2t entry!\n",
  3316. __func__);
  3317. goto free_dst;
  3318. }
  3319. step = dev->rdev.lldi.nrxq / dev->rdev.lldi.nchan;
  3320. rss_qid = dev->rdev.lldi.rxq_ids[pi->port_id * step];
  3321. window = (__force u16) htons((__force u16)tcph->window);
  3322. /* Calcuate filter portion for LE region. */
  3323. filter = (__force unsigned int) cpu_to_be32(cxgb4_select_ntuple(
  3324. dev->rdev.lldi.ports[0],
  3325. e));
  3326. /*
  3327. * Synthesize the cpl_pass_accept_req. We have everything except the
  3328. * TID. Once firmware sends a reply with TID we update the TID field
  3329. * in cpl and pass it through the regular cpl_pass_accept_req path.
  3330. */
  3331. build_cpl_pass_accept_req(skb, stid, iph->tos);
  3332. send_fw_pass_open_req(dev, skb, iph->daddr, tcph->dest, iph->saddr,
  3333. tcph->source, ntohl(tcph->seq), filter, window,
  3334. rss_qid, pi->port_id);
  3335. cxgb4_l2t_release(e);
  3336. free_dst:
  3337. dst_release(dst);
  3338. reject:
  3339. return 0;
  3340. }
  3341. /*
  3342. * These are the real handlers that are called from a
  3343. * work queue.
  3344. */
  3345. static c4iw_handler_func work_handlers[NUM_CPL_CMDS] = {
  3346. [CPL_ACT_ESTABLISH] = act_establish,
  3347. [CPL_ACT_OPEN_RPL] = act_open_rpl,
  3348. [CPL_RX_DATA] = rx_data,
  3349. [CPL_ABORT_RPL_RSS] = abort_rpl,
  3350. [CPL_ABORT_RPL] = abort_rpl,
  3351. [CPL_PASS_OPEN_RPL] = pass_open_rpl,
  3352. [CPL_CLOSE_LISTSRV_RPL] = close_listsrv_rpl,
  3353. [CPL_PASS_ACCEPT_REQ] = pass_accept_req,
  3354. [CPL_PASS_ESTABLISH] = pass_establish,
  3355. [CPL_PEER_CLOSE] = peer_close,
  3356. [CPL_ABORT_REQ_RSS] = peer_abort,
  3357. [CPL_CLOSE_CON_RPL] = close_con_rpl,
  3358. [CPL_RDMA_TERMINATE] = terminate,
  3359. [CPL_FW4_ACK] = fw4_ack,
  3360. [CPL_FW6_MSG] = deferred_fw6_msg,
  3361. [CPL_RX_PKT] = rx_pkt
  3362. };
  3363. static void process_timeout(struct c4iw_ep *ep)
  3364. {
  3365. struct c4iw_qp_attributes attrs;
  3366. int abort = 1;
  3367. mutex_lock(&ep->com.mutex);
  3368. PDBG("%s ep %p tid %u state %d\n", __func__, ep, ep->hwtid,
  3369. ep->com.state);
  3370. set_bit(TIMEDOUT, &ep->com.history);
  3371. switch (ep->com.state) {
  3372. case MPA_REQ_SENT:
  3373. __state_set(&ep->com, ABORTING);
  3374. connect_reply_upcall(ep, -ETIMEDOUT);
  3375. break;
  3376. case MPA_REQ_WAIT:
  3377. __state_set(&ep->com, ABORTING);
  3378. break;
  3379. case CLOSING:
  3380. case MORIBUND:
  3381. if (ep->com.cm_id && ep->com.qp) {
  3382. attrs.next_state = C4IW_QP_STATE_ERROR;
  3383. c4iw_modify_qp(ep->com.qp->rhp,
  3384. ep->com.qp, C4IW_QP_ATTR_NEXT_STATE,
  3385. &attrs, 1);
  3386. }
  3387. __state_set(&ep->com, ABORTING);
  3388. close_complete_upcall(ep, -ETIMEDOUT);
  3389. break;
  3390. case ABORTING:
  3391. case DEAD:
  3392. /*
  3393. * These states are expected if the ep timed out at the same
  3394. * time as another thread was calling stop_ep_timer().
  3395. * So we silently do nothing for these states.
  3396. */
  3397. abort = 0;
  3398. break;
  3399. default:
  3400. WARN(1, "%s unexpected state ep %p tid %u state %u\n",
  3401. __func__, ep, ep->hwtid, ep->com.state);
  3402. abort = 0;
  3403. }
  3404. if (abort)
  3405. abort_connection(ep, NULL, GFP_KERNEL);
  3406. mutex_unlock(&ep->com.mutex);
  3407. c4iw_put_ep(&ep->com);
  3408. }
  3409. static void process_timedout_eps(void)
  3410. {
  3411. struct c4iw_ep *ep;
  3412. spin_lock_irq(&timeout_lock);
  3413. while (!list_empty(&timeout_list)) {
  3414. struct list_head *tmp;
  3415. tmp = timeout_list.next;
  3416. list_del(tmp);
  3417. tmp->next = NULL;
  3418. tmp->prev = NULL;
  3419. spin_unlock_irq(&timeout_lock);
  3420. ep = list_entry(tmp, struct c4iw_ep, entry);
  3421. process_timeout(ep);
  3422. spin_lock_irq(&timeout_lock);
  3423. }
  3424. spin_unlock_irq(&timeout_lock);
  3425. }
  3426. static void process_work(struct work_struct *work)
  3427. {
  3428. struct sk_buff *skb = NULL;
  3429. struct c4iw_dev *dev;
  3430. struct cpl_act_establish *rpl;
  3431. unsigned int opcode;
  3432. int ret;
  3433. process_timedout_eps();
  3434. while ((skb = skb_dequeue(&rxq))) {
  3435. rpl = cplhdr(skb);
  3436. dev = *((struct c4iw_dev **) (skb->cb + sizeof(void *)));
  3437. opcode = rpl->ot.opcode;
  3438. BUG_ON(!work_handlers[opcode]);
  3439. ret = work_handlers[opcode](dev, skb);
  3440. if (!ret)
  3441. kfree_skb(skb);
  3442. process_timedout_eps();
  3443. }
  3444. }
  3445. static DECLARE_WORK(skb_work, process_work);
  3446. static void ep_timeout(unsigned long arg)
  3447. {
  3448. struct c4iw_ep *ep = (struct c4iw_ep *)arg;
  3449. int kickit = 0;
  3450. spin_lock(&timeout_lock);
  3451. if (!test_and_set_bit(TIMEOUT, &ep->com.flags)) {
  3452. /*
  3453. * Only insert if it is not already on the list.
  3454. */
  3455. if (!ep->entry.next) {
  3456. list_add_tail(&ep->entry, &timeout_list);
  3457. kickit = 1;
  3458. }
  3459. }
  3460. spin_unlock(&timeout_lock);
  3461. if (kickit)
  3462. queue_work(workq, &skb_work);
  3463. }
  3464. /*
  3465. * All the CM events are handled on a work queue to have a safe context.
  3466. */
  3467. static int sched(struct c4iw_dev *dev, struct sk_buff *skb)
  3468. {
  3469. /*
  3470. * Save dev in the skb->cb area.
  3471. */
  3472. *((struct c4iw_dev **) (skb->cb + sizeof(void *))) = dev;
  3473. /*
  3474. * Queue the skb and schedule the worker thread.
  3475. */
  3476. skb_queue_tail(&rxq, skb);
  3477. queue_work(workq, &skb_work);
  3478. return 0;
  3479. }
  3480. static int set_tcb_rpl(struct c4iw_dev *dev, struct sk_buff *skb)
  3481. {
  3482. struct cpl_set_tcb_rpl *rpl = cplhdr(skb);
  3483. if (rpl->status != CPL_ERR_NONE) {
  3484. printk(KERN_ERR MOD "Unexpected SET_TCB_RPL status %u "
  3485. "for tid %u\n", rpl->status, GET_TID(rpl));
  3486. }
  3487. kfree_skb(skb);
  3488. return 0;
  3489. }
  3490. static int fw6_msg(struct c4iw_dev *dev, struct sk_buff *skb)
  3491. {
  3492. struct cpl_fw6_msg *rpl = cplhdr(skb);
  3493. struct c4iw_wr_wait *wr_waitp;
  3494. int ret;
  3495. PDBG("%s type %u\n", __func__, rpl->type);
  3496. switch (rpl->type) {
  3497. case FW6_TYPE_WR_RPL:
  3498. ret = (int)((be64_to_cpu(rpl->data[0]) >> 8) & 0xff);
  3499. wr_waitp = (struct c4iw_wr_wait *)(__force unsigned long) rpl->data[1];
  3500. PDBG("%s wr_waitp %p ret %u\n", __func__, wr_waitp, ret);
  3501. if (wr_waitp)
  3502. c4iw_wake_up(wr_waitp, ret ? -ret : 0);
  3503. kfree_skb(skb);
  3504. break;
  3505. case FW6_TYPE_CQE:
  3506. case FW6_TYPE_OFLD_CONNECTION_WR_RPL:
  3507. sched(dev, skb);
  3508. break;
  3509. default:
  3510. printk(KERN_ERR MOD "%s unexpected fw6 msg type %u\n", __func__,
  3511. rpl->type);
  3512. kfree_skb(skb);
  3513. break;
  3514. }
  3515. return 0;
  3516. }
  3517. static int peer_abort_intr(struct c4iw_dev *dev, struct sk_buff *skb)
  3518. {
  3519. struct cpl_abort_req_rss *req = cplhdr(skb);
  3520. struct c4iw_ep *ep;
  3521. struct tid_info *t = dev->rdev.lldi.tids;
  3522. unsigned int tid = GET_TID(req);
  3523. ep = lookup_tid(t, tid);
  3524. if (!ep) {
  3525. printk(KERN_WARNING MOD
  3526. "Abort on non-existent endpoint, tid %d\n", tid);
  3527. kfree_skb(skb);
  3528. return 0;
  3529. }
  3530. if (is_neg_adv(req->status)) {
  3531. dev_warn(&dev->rdev.lldi.pdev->dev,
  3532. "Negative advice on abort - tid %u status %d (%s)\n",
  3533. ep->hwtid, req->status, neg_adv_str(req->status));
  3534. kfree_skb(skb);
  3535. return 0;
  3536. }
  3537. PDBG("%s ep %p tid %u state %u\n", __func__, ep, ep->hwtid,
  3538. ep->com.state);
  3539. /*
  3540. * Wake up any threads in rdma_init() or rdma_fini().
  3541. * However, if we are on MPAv2 and want to retry with MPAv1
  3542. * then, don't wake up yet.
  3543. */
  3544. if (mpa_rev == 2 && !ep->tried_with_mpa_v1) {
  3545. if (ep->com.state != MPA_REQ_SENT)
  3546. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  3547. } else
  3548. c4iw_wake_up(&ep->com.wr_wait, -ECONNRESET);
  3549. sched(dev, skb);
  3550. return 0;
  3551. }
  3552. /*
  3553. * Most upcalls from the T4 Core go to sched() to
  3554. * schedule the processing on a work queue.
  3555. */
  3556. c4iw_handler_func c4iw_handlers[NUM_CPL_CMDS] = {
  3557. [CPL_ACT_ESTABLISH] = sched,
  3558. [CPL_ACT_OPEN_RPL] = sched,
  3559. [CPL_RX_DATA] = sched,
  3560. [CPL_ABORT_RPL_RSS] = sched,
  3561. [CPL_ABORT_RPL] = sched,
  3562. [CPL_PASS_OPEN_RPL] = sched,
  3563. [CPL_CLOSE_LISTSRV_RPL] = sched,
  3564. [CPL_PASS_ACCEPT_REQ] = sched,
  3565. [CPL_PASS_ESTABLISH] = sched,
  3566. [CPL_PEER_CLOSE] = sched,
  3567. [CPL_CLOSE_CON_RPL] = sched,
  3568. [CPL_ABORT_REQ_RSS] = peer_abort_intr,
  3569. [CPL_RDMA_TERMINATE] = sched,
  3570. [CPL_FW4_ACK] = sched,
  3571. [CPL_SET_TCB_RPL] = set_tcb_rpl,
  3572. [CPL_FW6_MSG] = fw6_msg,
  3573. [CPL_RX_PKT] = sched
  3574. };
  3575. int __init c4iw_cm_init(void)
  3576. {
  3577. spin_lock_init(&timeout_lock);
  3578. skb_queue_head_init(&rxq);
  3579. workq = create_singlethread_workqueue("iw_cxgb4");
  3580. if (!workq)
  3581. return -ENOMEM;
  3582. return 0;
  3583. }
  3584. void c4iw_cm_term(void)
  3585. {
  3586. WARN_ON(!list_empty(&timeout_list));
  3587. flush_workqueue(workq);
  3588. destroy_workqueue(workq);
  3589. }