xprt.c 40 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541
  1. /*
  2. * linux/net/sunrpc/xprt.c
  3. *
  4. * This is a generic RPC call interface supporting congestion avoidance,
  5. * and asynchronous calls.
  6. *
  7. * The interface works like this:
  8. *
  9. * - When a process places a call, it allocates a request slot if
  10. * one is available. Otherwise, it sleeps on the backlog queue
  11. * (xprt_reserve).
  12. * - Next, the caller puts together the RPC message, stuffs it into
  13. * the request struct, and calls xprt_transmit().
  14. * - xprt_transmit sends the message and installs the caller on the
  15. * transport's wait list. At the same time, if a reply is expected,
  16. * it installs a timer that is run after the packet's timeout has
  17. * expired.
  18. * - When a packet arrives, the data_ready handler walks the list of
  19. * pending requests for that transport. If a matching XID is found, the
  20. * caller is woken up, and the timer removed.
  21. * - When no reply arrives within the timeout interval, the timer is
  22. * fired by the kernel and runs xprt_timer(). It either adjusts the
  23. * timeout values (minor timeout) or wakes up the caller with a status
  24. * of -ETIMEDOUT.
  25. * - When the caller receives a notification from RPC that a reply arrived,
  26. * it should release the RPC slot, and process the reply.
  27. * If the call timed out, it may choose to retry the operation by
  28. * adjusting the initial timeout value, and simply calling rpc_call
  29. * again.
  30. *
  31. * Support for async RPC is done through a set of RPC-specific scheduling
  32. * primitives that `transparently' work for processes as well as async
  33. * tasks that rely on callbacks.
  34. *
  35. * Copyright (C) 1995-1997, Olaf Kirch <okir@monad.swb.de>
  36. *
  37. * Transport switch API copyright (C) 2005, Chuck Lever <cel@netapp.com>
  38. */
  39. #include <linux/module.h>
  40. #include <linux/types.h>
  41. #include <linux/interrupt.h>
  42. #include <linux/workqueue.h>
  43. #include <linux/net.h>
  44. #include <linux/ktime.h>
  45. #include <linux/sunrpc/clnt.h>
  46. #include <linux/sunrpc/metrics.h>
  47. #include <linux/sunrpc/bc_xprt.h>
  48. #include <linux/rcupdate.h>
  49. #include <trace/events/sunrpc.h>
  50. #include "sunrpc.h"
  51. /*
  52. * Local variables
  53. */
  54. #if IS_ENABLED(CONFIG_SUNRPC_DEBUG)
  55. # define RPCDBG_FACILITY RPCDBG_XPRT
  56. #endif
  57. /*
  58. * Local functions
  59. */
  60. static void xprt_init(struct rpc_xprt *xprt, struct net *net);
  61. static __be32 xprt_alloc_xid(struct rpc_xprt *xprt);
  62. static void xprt_connect_status(struct rpc_task *task);
  63. static int __xprt_get_cong(struct rpc_xprt *, struct rpc_task *);
  64. static void __xprt_put_cong(struct rpc_xprt *, struct rpc_rqst *);
  65. static void xprt_destroy(struct rpc_xprt *xprt);
  66. static DEFINE_SPINLOCK(xprt_list_lock);
  67. static LIST_HEAD(xprt_list);
  68. /**
  69. * xprt_register_transport - register a transport implementation
  70. * @transport: transport to register
  71. *
  72. * If a transport implementation is loaded as a kernel module, it can
  73. * call this interface to make itself known to the RPC client.
  74. *
  75. * Returns:
  76. * 0: transport successfully registered
  77. * -EEXIST: transport already registered
  78. * -EINVAL: transport module being unloaded
  79. */
  80. int xprt_register_transport(struct xprt_class *transport)
  81. {
  82. struct xprt_class *t;
  83. int result;
  84. result = -EEXIST;
  85. spin_lock(&xprt_list_lock);
  86. list_for_each_entry(t, &xprt_list, list) {
  87. /* don't register the same transport class twice */
  88. if (t->ident == transport->ident)
  89. goto out;
  90. }
  91. list_add_tail(&transport->list, &xprt_list);
  92. printk(KERN_INFO "RPC: Registered %s transport module.\n",
  93. transport->name);
  94. result = 0;
  95. out:
  96. spin_unlock(&xprt_list_lock);
  97. return result;
  98. }
  99. EXPORT_SYMBOL_GPL(xprt_register_transport);
  100. /**
  101. * xprt_unregister_transport - unregister a transport implementation
  102. * @transport: transport to unregister
  103. *
  104. * Returns:
  105. * 0: transport successfully unregistered
  106. * -ENOENT: transport never registered
  107. */
  108. int xprt_unregister_transport(struct xprt_class *transport)
  109. {
  110. struct xprt_class *t;
  111. int result;
  112. result = 0;
  113. spin_lock(&xprt_list_lock);
  114. list_for_each_entry(t, &xprt_list, list) {
  115. if (t == transport) {
  116. printk(KERN_INFO
  117. "RPC: Unregistered %s transport module.\n",
  118. transport->name);
  119. list_del_init(&transport->list);
  120. goto out;
  121. }
  122. }
  123. result = -ENOENT;
  124. out:
  125. spin_unlock(&xprt_list_lock);
  126. return result;
  127. }
  128. EXPORT_SYMBOL_GPL(xprt_unregister_transport);
  129. /**
  130. * xprt_load_transport - load a transport implementation
  131. * @transport_name: transport to load
  132. *
  133. * Returns:
  134. * 0: transport successfully loaded
  135. * -ENOENT: transport module not available
  136. */
  137. int xprt_load_transport(const char *transport_name)
  138. {
  139. struct xprt_class *t;
  140. int result;
  141. result = 0;
  142. spin_lock(&xprt_list_lock);
  143. list_for_each_entry(t, &xprt_list, list) {
  144. if (strcmp(t->name, transport_name) == 0) {
  145. spin_unlock(&xprt_list_lock);
  146. goto out;
  147. }
  148. }
  149. spin_unlock(&xprt_list_lock);
  150. result = request_module("xprt%s", transport_name);
  151. out:
  152. return result;
  153. }
  154. EXPORT_SYMBOL_GPL(xprt_load_transport);
  155. /**
  156. * xprt_reserve_xprt - serialize write access to transports
  157. * @task: task that is requesting access to the transport
  158. * @xprt: pointer to the target transport
  159. *
  160. * This prevents mixing the payload of separate requests, and prevents
  161. * transport connects from colliding with writes. No congestion control
  162. * is provided.
  163. */
  164. int xprt_reserve_xprt(struct rpc_xprt *xprt, struct rpc_task *task)
  165. {
  166. struct rpc_rqst *req = task->tk_rqstp;
  167. int priority;
  168. if (test_and_set_bit(XPRT_LOCKED, &xprt->state)) {
  169. if (task == xprt->snd_task)
  170. return 1;
  171. goto out_sleep;
  172. }
  173. xprt->snd_task = task;
  174. if (req != NULL)
  175. req->rq_ntrans++;
  176. return 1;
  177. out_sleep:
  178. dprintk("RPC: %5u failed to lock transport %p\n",
  179. task->tk_pid, xprt);
  180. task->tk_timeout = 0;
  181. task->tk_status = -EAGAIN;
  182. if (req == NULL)
  183. priority = RPC_PRIORITY_LOW;
  184. else if (!req->rq_ntrans)
  185. priority = RPC_PRIORITY_NORMAL;
  186. else
  187. priority = RPC_PRIORITY_HIGH;
  188. rpc_sleep_on_priority(&xprt->sending, task, NULL, priority);
  189. return 0;
  190. }
  191. EXPORT_SYMBOL_GPL(xprt_reserve_xprt);
  192. static void xprt_clear_locked(struct rpc_xprt *xprt)
  193. {
  194. xprt->snd_task = NULL;
  195. if (!test_bit(XPRT_CLOSE_WAIT, &xprt->state)) {
  196. smp_mb__before_atomic();
  197. clear_bit(XPRT_LOCKED, &xprt->state);
  198. smp_mb__after_atomic();
  199. } else
  200. queue_work(xprtiod_workqueue, &xprt->task_cleanup);
  201. }
  202. /*
  203. * xprt_reserve_xprt_cong - serialize write access to transports
  204. * @task: task that is requesting access to the transport
  205. *
  206. * Same as xprt_reserve_xprt, but Van Jacobson congestion control is
  207. * integrated into the decision of whether a request is allowed to be
  208. * woken up and given access to the transport.
  209. */
  210. int xprt_reserve_xprt_cong(struct rpc_xprt *xprt, struct rpc_task *task)
  211. {
  212. struct rpc_rqst *req = task->tk_rqstp;
  213. int priority;
  214. if (test_and_set_bit(XPRT_LOCKED, &xprt->state)) {
  215. if (task == xprt->snd_task)
  216. return 1;
  217. goto out_sleep;
  218. }
  219. if (req == NULL) {
  220. xprt->snd_task = task;
  221. return 1;
  222. }
  223. if (__xprt_get_cong(xprt, task)) {
  224. xprt->snd_task = task;
  225. req->rq_ntrans++;
  226. return 1;
  227. }
  228. xprt_clear_locked(xprt);
  229. out_sleep:
  230. if (req)
  231. __xprt_put_cong(xprt, req);
  232. dprintk("RPC: %5u failed to lock transport %p\n", task->tk_pid, xprt);
  233. task->tk_timeout = 0;
  234. task->tk_status = -EAGAIN;
  235. if (req == NULL)
  236. priority = RPC_PRIORITY_LOW;
  237. else if (!req->rq_ntrans)
  238. priority = RPC_PRIORITY_NORMAL;
  239. else
  240. priority = RPC_PRIORITY_HIGH;
  241. rpc_sleep_on_priority(&xprt->sending, task, NULL, priority);
  242. return 0;
  243. }
  244. EXPORT_SYMBOL_GPL(xprt_reserve_xprt_cong);
  245. static inline int xprt_lock_write(struct rpc_xprt *xprt, struct rpc_task *task)
  246. {
  247. int retval;
  248. spin_lock_bh(&xprt->transport_lock);
  249. retval = xprt->ops->reserve_xprt(xprt, task);
  250. spin_unlock_bh(&xprt->transport_lock);
  251. return retval;
  252. }
  253. static bool __xprt_lock_write_func(struct rpc_task *task, void *data)
  254. {
  255. struct rpc_xprt *xprt = data;
  256. struct rpc_rqst *req;
  257. req = task->tk_rqstp;
  258. xprt->snd_task = task;
  259. if (req)
  260. req->rq_ntrans++;
  261. return true;
  262. }
  263. static void __xprt_lock_write_next(struct rpc_xprt *xprt)
  264. {
  265. if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
  266. return;
  267. if (rpc_wake_up_first_on_wq(xprtiod_workqueue, &xprt->sending,
  268. __xprt_lock_write_func, xprt))
  269. return;
  270. xprt_clear_locked(xprt);
  271. }
  272. static bool __xprt_lock_write_cong_func(struct rpc_task *task, void *data)
  273. {
  274. struct rpc_xprt *xprt = data;
  275. struct rpc_rqst *req;
  276. req = task->tk_rqstp;
  277. if (req == NULL) {
  278. xprt->snd_task = task;
  279. return true;
  280. }
  281. if (__xprt_get_cong(xprt, task)) {
  282. xprt->snd_task = task;
  283. req->rq_ntrans++;
  284. return true;
  285. }
  286. return false;
  287. }
  288. static void __xprt_lock_write_next_cong(struct rpc_xprt *xprt)
  289. {
  290. if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
  291. return;
  292. if (RPCXPRT_CONGESTED(xprt))
  293. goto out_unlock;
  294. if (rpc_wake_up_first_on_wq(xprtiod_workqueue, &xprt->sending,
  295. __xprt_lock_write_cong_func, xprt))
  296. return;
  297. out_unlock:
  298. xprt_clear_locked(xprt);
  299. }
  300. static void xprt_task_clear_bytes_sent(struct rpc_task *task)
  301. {
  302. if (task != NULL) {
  303. struct rpc_rqst *req = task->tk_rqstp;
  304. if (req != NULL)
  305. req->rq_bytes_sent = 0;
  306. }
  307. }
  308. /**
  309. * xprt_release_xprt - allow other requests to use a transport
  310. * @xprt: transport with other tasks potentially waiting
  311. * @task: task that is releasing access to the transport
  312. *
  313. * Note that "task" can be NULL. No congestion control is provided.
  314. */
  315. void xprt_release_xprt(struct rpc_xprt *xprt, struct rpc_task *task)
  316. {
  317. if (xprt->snd_task == task) {
  318. xprt_task_clear_bytes_sent(task);
  319. xprt_clear_locked(xprt);
  320. __xprt_lock_write_next(xprt);
  321. }
  322. }
  323. EXPORT_SYMBOL_GPL(xprt_release_xprt);
  324. /**
  325. * xprt_release_xprt_cong - allow other requests to use a transport
  326. * @xprt: transport with other tasks potentially waiting
  327. * @task: task that is releasing access to the transport
  328. *
  329. * Note that "task" can be NULL. Another task is awoken to use the
  330. * transport if the transport's congestion window allows it.
  331. */
  332. void xprt_release_xprt_cong(struct rpc_xprt *xprt, struct rpc_task *task)
  333. {
  334. if (xprt->snd_task == task) {
  335. xprt_task_clear_bytes_sent(task);
  336. xprt_clear_locked(xprt);
  337. __xprt_lock_write_next_cong(xprt);
  338. }
  339. }
  340. EXPORT_SYMBOL_GPL(xprt_release_xprt_cong);
  341. static inline void xprt_release_write(struct rpc_xprt *xprt, struct rpc_task *task)
  342. {
  343. spin_lock_bh(&xprt->transport_lock);
  344. xprt->ops->release_xprt(xprt, task);
  345. spin_unlock_bh(&xprt->transport_lock);
  346. }
  347. /*
  348. * Van Jacobson congestion avoidance. Check if the congestion window
  349. * overflowed. Returns 0 if it did (the caller decides whether to sleep); otherwise charges the request against the window and returns 1.
  350. */
  351. static int
  352. __xprt_get_cong(struct rpc_xprt *xprt, struct rpc_task *task)
  353. {
  354. struct rpc_rqst *req = task->tk_rqstp;
  355. if (req->rq_cong)
  356. return 1;
  357. dprintk("RPC: %5u xprt_cwnd_limited cong = %lu cwnd = %lu\n",
  358. task->tk_pid, xprt->cong, xprt->cwnd);
  359. if (RPCXPRT_CONGESTED(xprt))
  360. return 0;
  361. req->rq_cong = 1;
  362. xprt->cong += RPC_CWNDSCALE;
  363. return 1;
  364. }
  365. /*
  366. * Adjust the congestion window, and wake up the next task
  367. * that has been sleeping due to congestion
  368. */
  369. static void
  370. __xprt_put_cong(struct rpc_xprt *xprt, struct rpc_rqst *req)
  371. {
  372. if (!req->rq_cong)
  373. return;
  374. req->rq_cong = 0;
  375. xprt->cong -= RPC_CWNDSCALE;
  376. __xprt_lock_write_next_cong(xprt);
  377. }
  378. /**
  379. * xprt_release_rqst_cong - housekeeping when request is complete
  380. * @task: RPC request that recently completed
  381. *
  382. * Useful for transports that require congestion control.
  383. */
  384. void xprt_release_rqst_cong(struct rpc_task *task)
  385. {
  386. struct rpc_rqst *req = task->tk_rqstp;
  387. __xprt_put_cong(req->rq_xprt, req);
  388. }
  389. EXPORT_SYMBOL_GPL(xprt_release_rqst_cong);
  390. /**
  391. * xprt_adjust_cwnd - adjust transport congestion window
  392. * @xprt: pointer to xprt
  393. * @task: recently completed RPC request used to adjust window
  394. * @result: result code of completed RPC request
  395. *
  396. * The transport code maintains an estimate on the maximum number of out-
  397. * standing RPC requests, using a smoothed version of the congestion
  398. * avoidance implemented in 44BSD. This is basically the Van Jacobson
  399. * congestion algorithm: If a retransmit occurs, the congestion window is
  400. * halved; otherwise, it is incremented by 1/cwnd when
  401. *
  402. * - a reply is received and
  403. * - a full number of requests are outstanding and
  404. * - the congestion window hasn't been updated recently.
  405. */
  406. void xprt_adjust_cwnd(struct rpc_xprt *xprt, struct rpc_task *task, int result)
  407. {
  408. struct rpc_rqst *req = task->tk_rqstp;
  409. unsigned long cwnd = xprt->cwnd;
  410. if (result >= 0 && cwnd <= xprt->cong) {
  411. /* The (cwnd >> 1) term makes sure
  412. * the result gets rounded properly. */
  413. cwnd += (RPC_CWNDSCALE * RPC_CWNDSCALE + (cwnd >> 1)) / cwnd;
  414. if (cwnd > RPC_MAXCWND(xprt))
  415. cwnd = RPC_MAXCWND(xprt);
  416. __xprt_lock_write_next_cong(xprt);
  417. } else if (result == -ETIMEDOUT) {
  418. cwnd >>= 1;
  419. if (cwnd < RPC_CWNDSCALE)
  420. cwnd = RPC_CWNDSCALE;
  421. }
  422. dprintk("RPC: cong %ld, cwnd was %ld, now %ld\n",
  423. xprt->cong, xprt->cwnd, cwnd);
  424. xprt->cwnd = cwnd;
  425. __xprt_put_cong(xprt, req);
  426. }
  427. EXPORT_SYMBOL_GPL(xprt_adjust_cwnd);
  428. /**
  429. * xprt_wake_pending_tasks - wake all tasks on a transport's pending queue
  430. * @xprt: transport with waiting tasks
  431. * @status: result code to plant in each task before waking it
  432. *
  433. */
  434. void xprt_wake_pending_tasks(struct rpc_xprt *xprt, int status)
  435. {
  436. if (status < 0)
  437. rpc_wake_up_status(&xprt->pending, status);
  438. else
  439. rpc_wake_up(&xprt->pending);
  440. }
  441. EXPORT_SYMBOL_GPL(xprt_wake_pending_tasks);
  442. /**
  443. * xprt_wait_for_buffer_space - wait for transport output buffer to clear
  444. * @task: task to be put to sleep
  445. * @action: function pointer to be executed after wait
  446. *
  447. * Note that we only set the timer for the case of RPC_IS_SOFT(), since
  448. * we don't in general want to force a socket disconnection due to
  449. * an incomplete RPC call transmission.
  450. */
  451. void xprt_wait_for_buffer_space(struct rpc_task *task, rpc_action action)
  452. {
  453. struct rpc_rqst *req = task->tk_rqstp;
  454. struct rpc_xprt *xprt = req->rq_xprt;
  455. task->tk_timeout = RPC_IS_SOFT(task) ? req->rq_timeout : 0;
  456. rpc_sleep_on(&xprt->pending, task, action);
  457. }
  458. EXPORT_SYMBOL_GPL(xprt_wait_for_buffer_space);
  459. /**
  460. * xprt_write_space - wake the task waiting for transport output buffer space
  461. * @xprt: transport with waiting tasks
  462. *
  463. * Can be called in a soft IRQ context, so xprt_write_space never sleeps.
  464. */
  465. void xprt_write_space(struct rpc_xprt *xprt)
  466. {
  467. spin_lock_bh(&xprt->transport_lock);
  468. if (xprt->snd_task) {
  469. dprintk("RPC: write space: waking waiting task on "
  470. "xprt %p\n", xprt);
  471. rpc_wake_up_queued_task_on_wq(xprtiod_workqueue,
  472. &xprt->pending, xprt->snd_task);
  473. }
  474. spin_unlock_bh(&xprt->transport_lock);
  475. }
  476. EXPORT_SYMBOL_GPL(xprt_write_space);
  477. /**
  478. * xprt_set_retrans_timeout_def - set a request's retransmit timeout
  479. * @task: task whose timeout is to be set
  480. *
  481. * Set a request's retransmit timeout based on the transport's
  482. * default timeout parameters. Used by transports that don't adjust
  483. * the retransmit timeout based on round-trip time estimation.
  484. */
  485. void xprt_set_retrans_timeout_def(struct rpc_task *task)
  486. {
  487. task->tk_timeout = task->tk_rqstp->rq_timeout;
  488. }
  489. EXPORT_SYMBOL_GPL(xprt_set_retrans_timeout_def);
  490. /**
  491. * xprt_set_retrans_timeout_rtt - set a request's retransmit timeout
  492. * @task: task whose timeout is to be set
  493. *
  494. * Set a request's retransmit timeout using the RTT estimator.
  495. */
  496. void xprt_set_retrans_timeout_rtt(struct rpc_task *task)
  497. {
  498. int timer = task->tk_msg.rpc_proc->p_timer;
  499. struct rpc_clnt *clnt = task->tk_client;
  500. struct rpc_rtt *rtt = clnt->cl_rtt;
  501. struct rpc_rqst *req = task->tk_rqstp;
  502. unsigned long max_timeout = clnt->cl_timeout->to_maxval;
  503. task->tk_timeout = rpc_calc_rto(rtt, timer);
  504. task->tk_timeout <<= rpc_ntimeo(rtt, timer) + req->rq_retries;
  505. if (task->tk_timeout > max_timeout || task->tk_timeout == 0)
  506. task->tk_timeout = max_timeout;
  507. }
  508. EXPORT_SYMBOL_GPL(xprt_set_retrans_timeout_rtt);
  509. static void xprt_reset_majortimeo(struct rpc_rqst *req)
  510. {
  511. const struct rpc_timeout *to = req->rq_task->tk_client->cl_timeout;
  512. req->rq_majortimeo = req->rq_timeout;
  513. if (to->to_exponential)
  514. req->rq_majortimeo <<= to->to_retries;
  515. else
  516. req->rq_majortimeo += to->to_increment * to->to_retries;
  517. if (req->rq_majortimeo > to->to_maxval || req->rq_majortimeo == 0)
  518. req->rq_majortimeo = to->to_maxval;
  519. req->rq_majortimeo += jiffies;
  520. }
  521. /**
  522. * xprt_adjust_timeout - adjust timeout values for next retransmit
  523. * @req: RPC request containing parameters to use for the adjustment
  524. *
  525. */
  526. int xprt_adjust_timeout(struct rpc_rqst *req)
  527. {
  528. struct rpc_xprt *xprt = req->rq_xprt;
  529. const struct rpc_timeout *to = req->rq_task->tk_client->cl_timeout;
  530. int status = 0;
  531. if (time_before(jiffies, req->rq_majortimeo)) {
  532. if (to->to_exponential)
  533. req->rq_timeout <<= 1;
  534. else
  535. req->rq_timeout += to->to_increment;
  536. if (to->to_maxval && req->rq_timeout >= to->to_maxval)
  537. req->rq_timeout = to->to_maxval;
  538. req->rq_retries++;
  539. } else {
  540. req->rq_timeout = to->to_initval;
  541. req->rq_retries = 0;
  542. xprt_reset_majortimeo(req);
  543. /* Reset the RTT counters == "slow start" */
  544. spin_lock_bh(&xprt->transport_lock);
  545. rpc_init_rtt(req->rq_task->tk_client->cl_rtt, to->to_initval);
  546. spin_unlock_bh(&xprt->transport_lock);
  547. status = -ETIMEDOUT;
  548. }
  549. if (req->rq_timeout == 0) {
  550. printk(KERN_WARNING "xprt_adjust_timeout: rq_timeout = 0!\n");
  551. req->rq_timeout = 5 * HZ;
  552. }
  553. return status;
  554. }
  555. static void xprt_autoclose(struct work_struct *work)
  556. {
  557. struct rpc_xprt *xprt =
  558. container_of(work, struct rpc_xprt, task_cleanup);
  559. clear_bit(XPRT_CLOSE_WAIT, &xprt->state);
  560. xprt->ops->close(xprt);
  561. xprt_release_write(xprt, NULL);
  562. wake_up_bit(&xprt->state, XPRT_LOCKED);
  563. }
  564. /**
  565. * xprt_disconnect_done - mark a transport as disconnected
  566. * @xprt: transport to flag for disconnect
  567. *
  568. */
  569. void xprt_disconnect_done(struct rpc_xprt *xprt)
  570. {
  571. dprintk("RPC: disconnected transport %p\n", xprt);
  572. spin_lock_bh(&xprt->transport_lock);
  573. xprt_clear_connected(xprt);
  574. xprt_wake_pending_tasks(xprt, -EAGAIN);
  575. spin_unlock_bh(&xprt->transport_lock);
  576. }
  577. EXPORT_SYMBOL_GPL(xprt_disconnect_done);
  578. /**
  579. * xprt_force_disconnect - force a transport to disconnect
  580. * @xprt: transport to disconnect
  581. *
  582. */
  583. void xprt_force_disconnect(struct rpc_xprt *xprt)
  584. {
  585. /* Don't race with the test_bit() in xprt_clear_locked() */
  586. spin_lock_bh(&xprt->transport_lock);
  587. set_bit(XPRT_CLOSE_WAIT, &xprt->state);
  588. /* Try to schedule an autoclose RPC call */
  589. if (test_and_set_bit(XPRT_LOCKED, &xprt->state) == 0)
  590. queue_work(xprtiod_workqueue, &xprt->task_cleanup);
  591. xprt_wake_pending_tasks(xprt, -EAGAIN);
  592. spin_unlock_bh(&xprt->transport_lock);
  593. }
  594. EXPORT_SYMBOL_GPL(xprt_force_disconnect);
  595. /**
  596. * xprt_conditional_disconnect - force a transport to disconnect
  597. * @xprt: transport to disconnect
  598. * @cookie: 'connection cookie'
  599. *
  600. * This attempts to break the connection if and only if 'cookie' matches
  601. * the current transport 'connection cookie'. It ensures that we don't
  602. * try to break the connection more than once when we need to retransmit
  603. * a batch of RPC requests.
  604. *
  605. */
  606. void xprt_conditional_disconnect(struct rpc_xprt *xprt, unsigned int cookie)
  607. {
  608. /* Don't race with the test_bit() in xprt_clear_locked() */
  609. spin_lock_bh(&xprt->transport_lock);
  610. if (cookie != xprt->connect_cookie)
  611. goto out;
  612. if (test_bit(XPRT_CLOSING, &xprt->state))
  613. goto out;
  614. set_bit(XPRT_CLOSE_WAIT, &xprt->state);
  615. /* Try to schedule an autoclose RPC call */
  616. if (test_and_set_bit(XPRT_LOCKED, &xprt->state) == 0)
  617. queue_work(xprtiod_workqueue, &xprt->task_cleanup);
  618. xprt_wake_pending_tasks(xprt, -EAGAIN);
  619. out:
  620. spin_unlock_bh(&xprt->transport_lock);
  621. }
  622. static bool
  623. xprt_has_timer(const struct rpc_xprt *xprt)
  624. {
  625. return xprt->idle_timeout != 0;
  626. }
  627. static void
  628. xprt_schedule_autodisconnect(struct rpc_xprt *xprt)
  629. __must_hold(&xprt->transport_lock)
  630. {
  631. if (list_empty(&xprt->recv) && xprt_has_timer(xprt))
  632. mod_timer(&xprt->timer, xprt->last_used + xprt->idle_timeout);
  633. }
  634. static void
  635. xprt_init_autodisconnect(struct timer_list *t)
  636. {
  637. struct rpc_xprt *xprt = from_timer(xprt, t, timer);
  638. spin_lock(&xprt->transport_lock);
  639. if (!list_empty(&xprt->recv))
  640. goto out_abort;
  641. /* Reset xprt->last_used to avoid connect/autodisconnect cycling */
  642. xprt->last_used = jiffies;
  643. if (test_and_set_bit(XPRT_LOCKED, &xprt->state))
  644. goto out_abort;
  645. spin_unlock(&xprt->transport_lock);
  646. queue_work(xprtiod_workqueue, &xprt->task_cleanup);
  647. return;
  648. out_abort:
  649. spin_unlock(&xprt->transport_lock);
  650. }
  651. bool xprt_lock_connect(struct rpc_xprt *xprt,
  652. struct rpc_task *task,
  653. void *cookie)
  654. {
  655. bool ret = false;
  656. spin_lock_bh(&xprt->transport_lock);
  657. if (!test_bit(XPRT_LOCKED, &xprt->state))
  658. goto out;
  659. if (xprt->snd_task != task)
  660. goto out;
  661. xprt_task_clear_bytes_sent(task);
  662. xprt->snd_task = cookie;
  663. ret = true;
  664. out:
  665. spin_unlock_bh(&xprt->transport_lock);
  666. return ret;
  667. }
  668. void xprt_unlock_connect(struct rpc_xprt *xprt, void *cookie)
  669. {
  670. spin_lock_bh(&xprt->transport_lock);
  671. if (xprt->snd_task != cookie)
  672. goto out;
  673. if (!test_bit(XPRT_LOCKED, &xprt->state))
  674. goto out;
  675. xprt->snd_task =NULL;
  676. xprt->ops->release_xprt(xprt, NULL);
  677. xprt_schedule_autodisconnect(xprt);
  678. out:
  679. spin_unlock_bh(&xprt->transport_lock);
  680. wake_up_bit(&xprt->state, XPRT_LOCKED);
  681. }
  682. /**
  683. * xprt_connect - schedule a transport connect operation
  684. * @task: RPC task that is requesting the connect
  685. *
  686. */
  687. void xprt_connect(struct rpc_task *task)
  688. {
  689. struct rpc_xprt *xprt = task->tk_rqstp->rq_xprt;
  690. dprintk("RPC: %5u xprt_connect xprt %p %s connected\n", task->tk_pid,
  691. xprt, (xprt_connected(xprt) ? "is" : "is not"));
  692. if (!xprt_bound(xprt)) {
  693. task->tk_status = -EAGAIN;
  694. return;
  695. }
  696. if (!xprt_lock_write(xprt, task))
  697. return;
  698. if (test_and_clear_bit(XPRT_CLOSE_WAIT, &xprt->state))
  699. xprt->ops->close(xprt);
  700. if (!xprt_connected(xprt)) {
  701. task->tk_rqstp->rq_bytes_sent = 0;
  702. task->tk_timeout = task->tk_rqstp->rq_timeout;
  703. task->tk_rqstp->rq_connect_cookie = xprt->connect_cookie;
  704. rpc_sleep_on(&xprt->pending, task, xprt_connect_status);
  705. if (test_bit(XPRT_CLOSING, &xprt->state))
  706. return;
  707. if (xprt_test_and_set_connecting(xprt))
  708. return;
  709. xprt->stat.connect_start = jiffies;
  710. xprt->ops->connect(xprt, task);
  711. }
  712. xprt_release_write(xprt, task);
  713. }
  /*
   * Callback handed to rpc_sleep_on() by xprt_connect().
   *
   * On success (tk_status == 0) the connect counters in xprt->stat are
   * updated. The listed connection errors and -ETIMEDOUT are left in
   * tk_status unchanged; any other error is replaced by -EIO.
   */
  static void xprt_connect_status(struct rpc_task *task)
  {
  	struct rpc_xprt *xprt = task->tk_rqstp->rq_xprt;

  	switch (task->tk_status) {
  	case 0:
  		xprt->stat.connect_count++;
  		xprt->stat.connect_time += (long)jiffies - xprt->stat.connect_start;
  		dprintk("RPC: %5u xprt_connect_status: connection established\n",
  				task->tk_pid);
  		return;
  	case -ECONNREFUSED:
  	case -ECONNRESET:
  	case -ECONNABORTED:
  	case -ENETUNREACH:
  	case -EHOSTUNREACH:
  	case -EPIPE:
  	case -EAGAIN:
  		dprintk("RPC: %5u xprt_connect_status: retrying\n", task->tk_pid);
  		break;
  	case -ETIMEDOUT:
  		dprintk("RPC: %5u xprt_connect_status: connect attempt timed "
  				"out\n", task->tk_pid);
  		break;
  	default:
  		dprintk("RPC: %5u xprt_connect_status: error %d connecting to "
  				"server %s\n", task->tk_pid, -task->tk_status,
  				xprt->servername);
  		/* Unrecognised failure: report a generic I/O error. */
  		task->tk_status = -EIO;
  	}
  }
  745. /**
  746. * xprt_lookup_rqst - find an RPC request corresponding to an XID
  747. * @xprt: transport on which the original request was transmitted
  748. * @xid: RPC XID of incoming reply
  749. *
  750. * Caller holds xprt->recv_lock.
  751. */
  752. struct rpc_rqst *xprt_lookup_rqst(struct rpc_xprt *xprt, __be32 xid)
  753. {
  754. struct rpc_rqst *entry;
  755. list_for_each_entry(entry, &xprt->recv, rq_list)
  756. if (entry->rq_xid == xid) {
  757. trace_xprt_lookup_rqst(xprt, xid, 0);
  758. entry->rq_rtt = ktime_sub(ktime_get(), entry->rq_xtime);
  759. return entry;
  760. }
  761. dprintk("RPC: xprt_lookup_rqst did not find xid %08x\n",
  762. ntohl(xid));
  763. trace_xprt_lookup_rqst(xprt, xid, -ENOENT);
  764. xprt->stat.bad_xids++;
  765. return NULL;
  766. }
  767. EXPORT_SYMBOL_GPL(xprt_lookup_rqst);
  768. /**
  769. * xprt_pin_rqst - Pin a request on the transport receive list
  770. * @req: Request to pin
  771. *
  772. * Caller must ensure this is atomic with the call to xprt_lookup_rqst()
  773. * so should be holding the xprt transport lock.
  774. */
  775. void xprt_pin_rqst(struct rpc_rqst *req)
  776. {
  777. set_bit(RPC_TASK_MSG_RECV, &req->rq_task->tk_runstate);
  778. }
  779. EXPORT_SYMBOL_GPL(xprt_pin_rqst);
  780. /**
  781. * xprt_unpin_rqst - Unpin a request on the transport receive list
  782. * @req: Request to pin
  783. *
  784. * Caller should be holding the xprt transport lock.
  785. */
  786. void xprt_unpin_rqst(struct rpc_rqst *req)
  787. {
  788. struct rpc_task *task = req->rq_task;
  789. clear_bit(RPC_TASK_MSG_RECV, &task->tk_runstate);
  790. if (test_bit(RPC_TASK_MSG_RECV_WAIT, &task->tk_runstate))
  791. wake_up_bit(&task->tk_runstate, RPC_TASK_MSG_RECV);
  792. }
  793. EXPORT_SYMBOL_GPL(xprt_unpin_rqst);
  794. static void xprt_wait_on_pinned_rqst(struct rpc_rqst *req)
  795. __must_hold(&req->rq_xprt->recv_lock)
  796. {
  797. struct rpc_task *task = req->rq_task;
  798. if (task && test_bit(RPC_TASK_MSG_RECV, &task->tk_runstate)) {
  799. spin_unlock(&req->rq_xprt->recv_lock);
  800. set_bit(RPC_TASK_MSG_RECV_WAIT, &task->tk_runstate);
  801. wait_on_bit(&task->tk_runstate, RPC_TASK_MSG_RECV,
  802. TASK_UNINTERRUPTIBLE);
  803. clear_bit(RPC_TASK_MSG_RECV_WAIT, &task->tk_runstate);
  804. spin_lock(&req->rq_xprt->recv_lock);
  805. }
  806. }
  807. /**
  808. * xprt_update_rtt - Update RPC RTT statistics
  809. * @task: RPC request that recently completed
  810. *
  811. * Caller holds xprt->recv_lock.
  812. */
  813. void xprt_update_rtt(struct rpc_task *task)
  814. {
  815. struct rpc_rqst *req = task->tk_rqstp;
  816. struct rpc_rtt *rtt = task->tk_client->cl_rtt;
  817. unsigned int timer = task->tk_msg.rpc_proc->p_timer;
  818. long m = usecs_to_jiffies(ktime_to_us(req->rq_rtt));
  819. if (timer) {
  820. if (req->rq_ntrans == 1)
  821. rpc_update_rtt(rtt, timer, m);
  822. rpc_set_timeo(rtt, timer, req->rq_ntrans - 1);
  823. }
  824. }
  825. EXPORT_SYMBOL_GPL(xprt_update_rtt);
  826. /**
  827. * xprt_complete_rqst - called when reply processing is complete
  828. * @task: RPC request that recently completed
  829. * @copied: actual number of bytes received from the transport
  830. *
  831. * Caller holds xprt->recv_lock.
  832. */
  833. void xprt_complete_rqst(struct rpc_task *task, int copied)
  834. {
  835. struct rpc_rqst *req = task->tk_rqstp;
  836. struct rpc_xprt *xprt = req->rq_xprt;
  837. dprintk("RPC: %5u xid %08x complete (%d bytes received)\n",
  838. task->tk_pid, ntohl(req->rq_xid), copied);
  839. trace_xprt_complete_rqst(xprt, req->rq_xid, copied);
  840. xprt->stat.recvs++;
  841. list_del_init(&req->rq_list);
  842. req->rq_private_buf.len = copied;
  843. /* Ensure all writes are done before we update */
  844. /* req->rq_reply_bytes_recvd */
  845. smp_wmb();
  846. req->rq_reply_bytes_recvd = copied;
  847. rpc_wake_up_queued_task(&xprt->pending, task);
  848. }
  849. EXPORT_SYMBOL_GPL(xprt_complete_rqst);
  850. static void xprt_timer(struct rpc_task *task)
  851. {
  852. struct rpc_rqst *req = task->tk_rqstp;
  853. struct rpc_xprt *xprt = req->rq_xprt;
  854. if (task->tk_status != -ETIMEDOUT)
  855. return;
  856. trace_xprt_timer(xprt, req->rq_xid, task->tk_status);
  857. if (!req->rq_reply_bytes_recvd) {
  858. if (xprt->ops->timer)
  859. xprt->ops->timer(xprt, task);
  860. } else
  861. task->tk_status = 0;
  862. }
  863. /**
  864. * xprt_prepare_transmit - reserve the transport before sending a request
  865. * @task: RPC task about to send a request
  866. *
  867. */
  868. bool xprt_prepare_transmit(struct rpc_task *task)
  869. {
  870. struct rpc_rqst *req = task->tk_rqstp;
  871. struct rpc_xprt *xprt = req->rq_xprt;
  872. bool ret = false;
  873. dprintk("RPC: %5u xprt_prepare_transmit\n", task->tk_pid);
  874. spin_lock_bh(&xprt->transport_lock);
  875. if (!req->rq_bytes_sent) {
  876. if (req->rq_reply_bytes_recvd) {
  877. task->tk_status = req->rq_reply_bytes_recvd;
  878. goto out_unlock;
  879. }
  880. if ((task->tk_flags & RPC_TASK_NO_RETRANS_TIMEOUT)
  881. && xprt_connected(xprt)
  882. && req->rq_connect_cookie == xprt->connect_cookie) {
  883. xprt->ops->set_retrans_timeout(task);
  884. rpc_sleep_on(&xprt->pending, task, xprt_timer);
  885. goto out_unlock;
  886. }
  887. }
  888. if (!xprt->ops->reserve_xprt(xprt, task)) {
  889. task->tk_status = -EAGAIN;
  890. goto out_unlock;
  891. }
  892. ret = true;
  893. out_unlock:
  894. spin_unlock_bh(&xprt->transport_lock);
  895. return ret;
  896. }
  897. void xprt_end_transmit(struct rpc_task *task)
  898. {
  899. xprt_release_write(task->tk_rqstp->rq_xprt, task);
  900. }
  901. /**
  902. * xprt_transmit - send an RPC request on a transport
  903. * @task: controlling RPC task
  904. *
  905. * We have to copy the iovec because sendmsg fiddles with its contents.
  906. */
  907. void xprt_transmit(struct rpc_task *task)
  908. {
  909. struct rpc_rqst *req = task->tk_rqstp;
  910. struct rpc_xprt *xprt = req->rq_xprt;
  911. unsigned int connect_cookie;
  912. int status;
  913. dprintk("RPC: %5u xprt_transmit(%u)\n", task->tk_pid, req->rq_slen);
  914. if (!req->rq_reply_bytes_recvd) {
  915. if (list_empty(&req->rq_list) && rpc_reply_expected(task)) {
  916. /*
  917. * Add to the list only if we're expecting a reply
  918. */
  919. /* Update the softirq receive buffer */
  920. memcpy(&req->rq_private_buf, &req->rq_rcv_buf,
  921. sizeof(req->rq_private_buf));
  922. /* Add request to the receive list */
  923. spin_lock(&xprt->recv_lock);
  924. list_add_tail(&req->rq_list, &xprt->recv);
  925. spin_unlock(&xprt->recv_lock);
  926. xprt_reset_majortimeo(req);
  927. /* Turn off autodisconnect */
  928. del_singleshot_timer_sync(&xprt->timer);
  929. }
  930. } else if (!req->rq_bytes_sent)
  931. return;
  932. connect_cookie = xprt->connect_cookie;
  933. status = xprt->ops->send_request(task);
  934. trace_xprt_transmit(xprt, req->rq_xid, status);
  935. if (status != 0) {
  936. task->tk_status = status;
  937. return;
  938. }
  939. xprt_inject_disconnect(xprt);
  940. dprintk("RPC: %5u xmit complete\n", task->tk_pid);
  941. task->tk_flags |= RPC_TASK_SENT;
  942. spin_lock_bh(&xprt->transport_lock);
  943. xprt->ops->set_retrans_timeout(task);
  944. xprt->stat.sends++;
  945. xprt->stat.req_u += xprt->stat.sends - xprt->stat.recvs;
  946. xprt->stat.bklog_u += xprt->backlog.qlen;
  947. xprt->stat.sending_u += xprt->sending.qlen;
  948. xprt->stat.pending_u += xprt->pending.qlen;
  949. spin_unlock_bh(&xprt->transport_lock);
  950. req->rq_connect_cookie = connect_cookie;
  951. if (rpc_reply_expected(task) && !READ_ONCE(req->rq_reply_bytes_recvd)) {
  952. /*
  953. * Sleep on the pending queue if we're expecting a reply.
  954. * The spinlock ensures atomicity between the test of
  955. * req->rq_reply_bytes_recvd, and the call to rpc_sleep_on().
  956. */
  957. spin_lock(&xprt->recv_lock);
  958. if (!req->rq_reply_bytes_recvd) {
  959. rpc_sleep_on(&xprt->pending, task, xprt_timer);
  960. /*
  961. * Send an extra queue wakeup call if the
  962. * connection was dropped in case the call to
  963. * rpc_sleep_on() raced.
  964. */
  965. if (!xprt_connected(xprt))
  966. xprt_wake_pending_tasks(xprt, -ENOTCONN);
  967. }
  968. spin_unlock(&xprt->recv_lock);
  969. }
  970. }
  971. static void xprt_add_backlog(struct rpc_xprt *xprt, struct rpc_task *task)
  972. {
  973. set_bit(XPRT_CONGESTED, &xprt->state);
  974. rpc_sleep_on(&xprt->backlog, task, NULL);
  975. }
  976. static void xprt_wake_up_backlog(struct rpc_xprt *xprt)
  977. {
  978. if (rpc_wake_up_next(&xprt->backlog) == NULL)
  979. clear_bit(XPRT_CONGESTED, &xprt->state);
  980. }
  981. static bool xprt_throttle_congested(struct rpc_xprt *xprt, struct rpc_task *task)
  982. {
  983. bool ret = false;
  984. if (!test_bit(XPRT_CONGESTED, &xprt->state))
  985. goto out;
  986. spin_lock(&xprt->reserve_lock);
  987. if (test_bit(XPRT_CONGESTED, &xprt->state)) {
  988. rpc_sleep_on(&xprt->backlog, task, NULL);
  989. ret = true;
  990. }
  991. spin_unlock(&xprt->reserve_lock);
  992. out:
  993. return ret;
  994. }
  995. static struct rpc_rqst *xprt_dynamic_alloc_slot(struct rpc_xprt *xprt)
  996. {
  997. struct rpc_rqst *req = ERR_PTR(-EAGAIN);
  998. if (xprt->num_reqs >= xprt->max_reqs)
  999. goto out;
  1000. ++xprt->num_reqs;
  1001. spin_unlock(&xprt->reserve_lock);
  1002. req = kzalloc(sizeof(struct rpc_rqst), GFP_NOFS);
  1003. spin_lock(&xprt->reserve_lock);
  1004. if (req != NULL)
  1005. goto out;
  1006. --xprt->num_reqs;
  1007. req = ERR_PTR(-ENOMEM);
  1008. out:
  1009. return req;
  1010. }
  1011. static bool xprt_dynamic_free_slot(struct rpc_xprt *xprt, struct rpc_rqst *req)
  1012. {
  1013. if (xprt->num_reqs > xprt->min_reqs) {
  1014. --xprt->num_reqs;
  1015. kfree(req);
  1016. return true;
  1017. }
  1018. return false;
  1019. }
  1020. void xprt_alloc_slot(struct rpc_xprt *xprt, struct rpc_task *task)
  1021. {
  1022. struct rpc_rqst *req;
  1023. spin_lock(&xprt->reserve_lock);
  1024. if (!list_empty(&xprt->free)) {
  1025. req = list_entry(xprt->free.next, struct rpc_rqst, rq_list);
  1026. list_del(&req->rq_list);
  1027. goto out_init_req;
  1028. }
  1029. req = xprt_dynamic_alloc_slot(xprt);
  1030. if (!IS_ERR(req))
  1031. goto out_init_req;
  1032. switch (PTR_ERR(req)) {
  1033. case -ENOMEM:
  1034. dprintk("RPC: dynamic allocation of request slot "
  1035. "failed! Retrying\n");
  1036. task->tk_status = -ENOMEM;
  1037. break;
  1038. case -EAGAIN:
  1039. xprt_add_backlog(xprt, task);
  1040. dprintk("RPC: waiting for request slot\n");
  1041. /* fall through */
  1042. default:
  1043. task->tk_status = -EAGAIN;
  1044. }
  1045. spin_unlock(&xprt->reserve_lock);
  1046. return;
  1047. out_init_req:
  1048. xprt->stat.max_slots = max_t(unsigned int, xprt->stat.max_slots,
  1049. xprt->num_reqs);
  1050. spin_unlock(&xprt->reserve_lock);
  1051. task->tk_status = 0;
  1052. task->tk_rqstp = req;
  1053. }
  1054. EXPORT_SYMBOL_GPL(xprt_alloc_slot);
  /*
   * Allocate a request slot while holding the transport write lock.
   * No slot is allocated if xprt_lock_write() fails.
   */
  void xprt_lock_and_alloc_slot(struct rpc_xprt *xprt, struct rpc_task *task)
  {
  	/* Note: grabbing the xprt_lock_write() ensures that we throttle
  	 * new slot allocation if the transport is congested (i.e. when
  	 * reconnecting a stream transport or when out of socket write
  	 * buffer space).
  	 */
  	if (!xprt_lock_write(xprt, task))
  		return;

  	xprt_alloc_slot(xprt, task);
  	xprt_release_write(xprt, task);
  }
  EXPORT_SYMBOL_GPL(xprt_lock_and_alloc_slot);
  1068. void xprt_free_slot(struct rpc_xprt *xprt, struct rpc_rqst *req)
  1069. {
  1070. spin_lock(&xprt->reserve_lock);
  1071. if (!xprt_dynamic_free_slot(xprt, req)) {
  1072. memset(req, 0, sizeof(*req)); /* mark unused */
  1073. list_add(&req->rq_list, &xprt->free);
  1074. }
  1075. xprt_wake_up_backlog(xprt);
  1076. spin_unlock(&xprt->reserve_lock);
  1077. }
  1078. EXPORT_SYMBOL_GPL(xprt_free_slot);
  1079. static void xprt_free_all_slots(struct rpc_xprt *xprt)
  1080. {
  1081. struct rpc_rqst *req;
  1082. while (!list_empty(&xprt->free)) {
  1083. req = list_first_entry(&xprt->free, struct rpc_rqst, rq_list);
  1084. list_del(&req->rq_list);
  1085. kfree(req);
  1086. }
  1087. }
  1088. struct rpc_xprt *xprt_alloc(struct net *net, size_t size,
  1089. unsigned int num_prealloc,
  1090. unsigned int max_alloc)
  1091. {
  1092. struct rpc_xprt *xprt;
  1093. struct rpc_rqst *req;
  1094. int i;
  1095. xprt = kzalloc(size, GFP_KERNEL);
  1096. if (xprt == NULL)
  1097. goto out;
  1098. xprt_init(xprt, net);
  1099. for (i = 0; i < num_prealloc; i++) {
  1100. req = kzalloc(sizeof(struct rpc_rqst), GFP_KERNEL);
  1101. if (!req)
  1102. goto out_free;
  1103. list_add(&req->rq_list, &xprt->free);
  1104. }
  1105. if (max_alloc > num_prealloc)
  1106. xprt->max_reqs = max_alloc;
  1107. else
  1108. xprt->max_reqs = num_prealloc;
  1109. xprt->min_reqs = num_prealloc;
  1110. xprt->num_reqs = num_prealloc;
  1111. return xprt;
  1112. out_free:
  1113. xprt_free(xprt);
  1114. out:
  1115. return NULL;
  1116. }
  1117. EXPORT_SYMBOL_GPL(xprt_alloc);
  1118. void xprt_free(struct rpc_xprt *xprt)
  1119. {
  1120. put_net(xprt->xprt_net);
  1121. xprt_free_all_slots(xprt);
  1122. kfree_rcu(xprt, rcu);
  1123. }
  1124. EXPORT_SYMBOL_GPL(xprt_free);
  1125. /**
  1126. * xprt_reserve - allocate an RPC request slot
  1127. * @task: RPC task requesting a slot allocation
  1128. *
  1129. * If the transport is marked as being congested, or if no more
  1130. * slots are available, place the task on the transport's
  1131. * backlog queue.
  1132. */
  1133. void xprt_reserve(struct rpc_task *task)
  1134. {
  1135. struct rpc_xprt *xprt = task->tk_xprt;
  1136. task->tk_status = 0;
  1137. if (task->tk_rqstp != NULL)
  1138. return;
  1139. task->tk_timeout = 0;
  1140. task->tk_status = -EAGAIN;
  1141. if (!xprt_throttle_congested(xprt, task))
  1142. xprt->ops->alloc_slot(xprt, task);
  1143. }
  1144. /**
  1145. * xprt_retry_reserve - allocate an RPC request slot
  1146. * @task: RPC task requesting a slot allocation
  1147. *
  1148. * If no more slots are available, place the task on the transport's
  1149. * backlog queue.
  1150. * Note that the only difference with xprt_reserve is that we now
  1151. * ignore the value of the XPRT_CONGESTED flag.
  1152. */
  1153. void xprt_retry_reserve(struct rpc_task *task)
  1154. {
  1155. struct rpc_xprt *xprt = task->tk_xprt;
  1156. task->tk_status = 0;
  1157. if (task->tk_rqstp != NULL)
  1158. return;
  1159. task->tk_timeout = 0;
  1160. task->tk_status = -EAGAIN;
  1161. xprt->ops->alloc_slot(xprt, task);
  1162. }
  1163. static inline __be32 xprt_alloc_xid(struct rpc_xprt *xprt)
  1164. {
  1165. __be32 xid;
  1166. spin_lock(&xprt->reserve_lock);
  1167. xid = (__force __be32)xprt->xid++;
  1168. spin_unlock(&xprt->reserve_lock);
  1169. return xid;
  1170. }
  1171. static inline void xprt_init_xid(struct rpc_xprt *xprt)
  1172. {
  1173. xprt->xid = prandom_u32();
  1174. }
  1175. void xprt_request_init(struct rpc_task *task)
  1176. {
  1177. struct rpc_xprt *xprt = task->tk_xprt;
  1178. struct rpc_rqst *req = task->tk_rqstp;
  1179. INIT_LIST_HEAD(&req->rq_list);
  1180. req->rq_timeout = task->tk_client->cl_timeout->to_initval;
  1181. req->rq_task = task;
  1182. req->rq_xprt = xprt;
  1183. req->rq_buffer = NULL;
  1184. req->rq_xid = xprt_alloc_xid(xprt);
  1185. req->rq_connect_cookie = xprt->connect_cookie - 1;
  1186. req->rq_bytes_sent = 0;
  1187. req->rq_snd_buf.len = 0;
  1188. req->rq_snd_buf.buflen = 0;
  1189. req->rq_rcv_buf.len = 0;
  1190. req->rq_rcv_buf.buflen = 0;
  1191. req->rq_release_snd_buf = NULL;
  1192. xprt_reset_majortimeo(req);
  1193. dprintk("RPC: %5u reserved req %p xid %08x\n", task->tk_pid,
  1194. req, ntohl(req->rq_xid));
  1195. }
  1196. /**
  1197. * xprt_release - release an RPC request slot
  1198. * @task: task which is finished with the slot
  1199. *
  1200. */
  1201. void xprt_release(struct rpc_task *task)
  1202. {
  1203. struct rpc_xprt *xprt;
  1204. struct rpc_rqst *req = task->tk_rqstp;
  1205. if (req == NULL) {
  1206. if (task->tk_client) {
  1207. xprt = task->tk_xprt;
  1208. if (xprt->snd_task == task)
  1209. xprt_release_write(xprt, task);
  1210. }
  1211. return;
  1212. }
  1213. xprt = req->rq_xprt;
  1214. if (task->tk_ops->rpc_count_stats != NULL)
  1215. task->tk_ops->rpc_count_stats(task, task->tk_calldata);
  1216. else if (task->tk_client)
  1217. rpc_count_iostats(task, task->tk_client->cl_metrics);
  1218. spin_lock(&xprt->recv_lock);
  1219. if (!list_empty(&req->rq_list)) {
  1220. list_del_init(&req->rq_list);
  1221. xprt_wait_on_pinned_rqst(req);
  1222. }
  1223. spin_unlock(&xprt->recv_lock);
  1224. spin_lock_bh(&xprt->transport_lock);
  1225. xprt->ops->release_xprt(xprt, task);
  1226. if (xprt->ops->release_request)
  1227. xprt->ops->release_request(task);
  1228. xprt->last_used = jiffies;
  1229. xprt_schedule_autodisconnect(xprt);
  1230. spin_unlock_bh(&xprt->transport_lock);
  1231. if (req->rq_buffer)
  1232. xprt->ops->buf_free(task);
  1233. xprt_inject_disconnect(xprt);
  1234. if (req->rq_cred != NULL)
  1235. put_rpccred(req->rq_cred);
  1236. task->tk_rqstp = NULL;
  1237. if (req->rq_release_snd_buf)
  1238. req->rq_release_snd_buf(req);
  1239. dprintk("RPC: %5u release request %p\n", task->tk_pid, req);
  1240. if (likely(!bc_prealloc(req)))
  1241. xprt->ops->free_slot(xprt, req);
  1242. else
  1243. xprt_free_bc_request(req);
  1244. }
  1245. static void xprt_init(struct rpc_xprt *xprt, struct net *net)
  1246. {
  1247. kref_init(&xprt->kref);
  1248. spin_lock_init(&xprt->transport_lock);
  1249. spin_lock_init(&xprt->reserve_lock);
  1250. spin_lock_init(&xprt->recv_lock);
  1251. INIT_LIST_HEAD(&xprt->free);
  1252. INIT_LIST_HEAD(&xprt->recv);
  1253. #if defined(CONFIG_SUNRPC_BACKCHANNEL)
  1254. spin_lock_init(&xprt->bc_pa_lock);
  1255. INIT_LIST_HEAD(&xprt->bc_pa_list);
  1256. #endif /* CONFIG_SUNRPC_BACKCHANNEL */
  1257. INIT_LIST_HEAD(&xprt->xprt_switch);
  1258. xprt->last_used = jiffies;
  1259. xprt->cwnd = RPC_INITCWND;
  1260. xprt->bind_index = 0;
  1261. rpc_init_wait_queue(&xprt->binding, "xprt_binding");
  1262. rpc_init_wait_queue(&xprt->pending, "xprt_pending");
  1263. rpc_init_priority_wait_queue(&xprt->sending, "xprt_sending");
  1264. rpc_init_priority_wait_queue(&xprt->backlog, "xprt_backlog");
  1265. xprt_init_xid(xprt);
  1266. xprt->xprt_net = get_net(net);
  1267. }
  1268. /**
  1269. * xprt_create_transport - create an RPC transport
  1270. * @args: rpc transport creation arguments
  1271. *
  1272. */
  1273. struct rpc_xprt *xprt_create_transport(struct xprt_create *args)
  1274. {
  1275. struct rpc_xprt *xprt;
  1276. struct xprt_class *t;
  1277. spin_lock(&xprt_list_lock);
  1278. list_for_each_entry(t, &xprt_list, list) {
  1279. if (t->ident == args->ident) {
  1280. spin_unlock(&xprt_list_lock);
  1281. goto found;
  1282. }
  1283. }
  1284. spin_unlock(&xprt_list_lock);
  1285. dprintk("RPC: transport (%d) not supported\n", args->ident);
  1286. return ERR_PTR(-EIO);
  1287. found:
  1288. xprt = t->setup(args);
  1289. if (IS_ERR(xprt)) {
  1290. dprintk("RPC: xprt_create_transport: failed, %ld\n",
  1291. -PTR_ERR(xprt));
  1292. goto out;
  1293. }
  1294. if (args->flags & XPRT_CREATE_NO_IDLE_TIMEOUT)
  1295. xprt->idle_timeout = 0;
  1296. INIT_WORK(&xprt->task_cleanup, xprt_autoclose);
  1297. if (xprt_has_timer(xprt))
  1298. timer_setup(&xprt->timer, xprt_init_autodisconnect, 0);
  1299. else
  1300. timer_setup(&xprt->timer, NULL, 0);
  1301. if (strlen(args->servername) > RPC_MAXNETNAMELEN) {
  1302. xprt_destroy(xprt);
  1303. return ERR_PTR(-EINVAL);
  1304. }
  1305. xprt->servername = kstrdup(args->servername, GFP_KERNEL);
  1306. if (xprt->servername == NULL) {
  1307. xprt_destroy(xprt);
  1308. return ERR_PTR(-ENOMEM);
  1309. }
  1310. rpc_xprt_debugfs_register(xprt);
  1311. dprintk("RPC: created transport %p with %u slots\n", xprt,
  1312. xprt->max_reqs);
  1313. out:
  1314. return xprt;
  1315. }
  1316. static void xprt_destroy_cb(struct work_struct *work)
  1317. {
  1318. struct rpc_xprt *xprt =
  1319. container_of(work, struct rpc_xprt, task_cleanup);
  1320. rpc_xprt_debugfs_unregister(xprt);
  1321. rpc_destroy_wait_queue(&xprt->binding);
  1322. rpc_destroy_wait_queue(&xprt->pending);
  1323. rpc_destroy_wait_queue(&xprt->sending);
  1324. rpc_destroy_wait_queue(&xprt->backlog);
  1325. kfree(xprt->servername);
  1326. /*
  1327. * Tear down transport state and free the rpc_xprt
  1328. */
  1329. xprt->ops->destroy(xprt);
  1330. }
  1331. /**
  1332. * xprt_destroy - destroy an RPC transport, killing off all requests.
  1333. * @xprt: transport to destroy
  1334. *
  1335. */
  1336. static void xprt_destroy(struct rpc_xprt *xprt)
  1337. {
  1338. dprintk("RPC: destroying transport %p\n", xprt);
  1339. /*
  1340. * Exclude transport connect/disconnect handlers and autoclose
  1341. */
  1342. wait_on_bit_lock(&xprt->state, XPRT_LOCKED, TASK_UNINTERRUPTIBLE);
  1343. del_timer_sync(&xprt->timer);
  1344. /*
  1345. * Destroy sockets etc from the system workqueue so they can
  1346. * safely flush receive work running on rpciod.
  1347. */
  1348. INIT_WORK(&xprt->task_cleanup, xprt_destroy_cb);
  1349. schedule_work(&xprt->task_cleanup);
  1350. }
  1351. static void xprt_destroy_kref(struct kref *kref)
  1352. {
  1353. xprt_destroy(container_of(kref, struct rpc_xprt, kref));
  1354. }
  1355. /**
  1356. * xprt_get - return a reference to an RPC transport.
  1357. * @xprt: pointer to the transport
  1358. *
  1359. */
  1360. struct rpc_xprt *xprt_get(struct rpc_xprt *xprt)
  1361. {
  1362. if (xprt != NULL && kref_get_unless_zero(&xprt->kref))
  1363. return xprt;
  1364. return NULL;
  1365. }
  1366. EXPORT_SYMBOL_GPL(xprt_get);
  1367. /**
  1368. * xprt_put - release a reference to an RPC transport.
  1369. * @xprt: pointer to the transport
  1370. *
  1371. */
  1372. void xprt_put(struct rpc_xprt *xprt)
  1373. {
  1374. if (xprt != NULL)
  1375. kref_put(&xprt->kref, xprt_destroy_kref);
  1376. }
  1377. EXPORT_SYMBOL_GPL(xprt_put);